fix: pipeline LLM 全失败时明确报错而非静默输出空 IR - Closes #15
CI / test (pull_request) Successful in 7s

- step1: 所有 LLM 调用返回空 function_units 时抛出 RuntimeError
- step1: main() 在 _quick_validate 未通过时 sys.exit(1)
- step2: function_units 为空时提前报错终止
- step3: fragments 为空时提前报错终止
- test: test_step1 捕获 SystemExit, test_step2_5/step3 空数据改为 skip

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
This commit is contained in:
2026-05-31 17:41:16 +08:00
parent af361d7fc7
commit 8069fc2f8a
6 changed files with 49 additions and 5 deletions
@@ -632,6 +632,18 @@ def run_ensemble_semantic_index(doc: dict) -> dict:
if not raw_results: if not raw_results:
raise RuntimeError("所有集成的 LLM 调用均失败") raise RuntimeError("所有集成的 LLM 调用均失败")
# Check that at least some raw results have function_units
all_empty = all(
len(r[2].get("function_units", [])) == 0 for r in raw_results
)
if all_empty:
raise RuntimeError(
"所有集成的 LLM 调用返回了空的 function_units。请检查:\n"
" 1. API Key 是否配置正确 (secrets.yaml 或环境变量)\n"
" 2. 输入文档格式是否与 Prompt 兼容\n"
" 3. LLM 服务是否可访问"
)
# Sort by temperature for determinism # Sort by temperature for determinism
raw_results.sort(key=lambda x: x[1]) raw_results.sort(key=lambda x: x[1])
semantic_indices = [r[2] for r in raw_results] semantic_indices = [r[2] for r in raw_results]
@@ -709,6 +721,17 @@ def main():
n_concepts = cs.get("total_concepts", len(merged_index.get("concepts", []))) n_concepts = cs.get("total_concepts", len(merged_index.get("concepts", [])))
n_units = cs.get("total_units", len(merged_index.get("function_units", []))) n_units = cs.get("total_units", len(merged_index.get("function_units", [])))
n_versions = merged_index.get("ensemble_versions", len(config.ENSEMBLE_TEMPERATURES)) n_versions = merged_index.get("ensemble_versions", len(config.ENSEMBLE_TEMPERATURES))
if not merged_index.get("validation_passed", True):
print(f"\n错误: 语义索引验证未通过!")
gaps = merged_index.get("validation_gaps", {})
for category, issues in gaps.items():
for issue in issues:
print(f" [{category}] {issue}")
print(f"\n流水线中止: {n_units} 个功能单元不满足最低覆盖率要求。")
print("请检查 LLM 配置、输入文档格式和 Prompt 兼容性。")
sys.exit(1)
print(f"\n完成! {n_versions} 版本集成, {n_concepts} 个概念, {n_units} 个功能单元.") print(f"\n完成! {n_versions} 版本集成, {n_concepts} 个概念, {n_units} 个功能单元.")
print(f"输出: {config.SEMANTIC_INDEX_JSON}") print(f"输出: {config.SEMANTIC_INDEX_JSON}")
@@ -487,6 +487,12 @@ def main():
n_units = len(semantic_index.get("function_units", [])) n_units = len(semantic_index.get("function_units", []))
print(f" 语义索引: {n_units} 个功能单元") print(f" 语义索引: {n_units} 个功能单元")
if n_units == 0:
print("错误: 语义索引中无功能单元 (function_units 为空)。")
print(" 请检查 step1_semantic_index 是否正确运行。")
print(" 可能原因: LLM API Key 未配置、Prompt 不兼容、或输入文档格式异常。")
sys.exit(1)
# 2. Extract rules # 2. Extract rules
print(f"\n[2/3] 逐单元提取 IR 规则...") print(f"\n[2/3] 逐单元提取 IR 规则...")
fragments = extract_all_rules(semantic_index, doc) fragments = extract_all_rules(semantic_index, doc)
@@ -987,10 +987,17 @@ def main():
semantic_index = load_semantic_index() semantic_index = load_semantic_index()
path_enum = load_path_enumeration() path_enum = load_path_enumeration()
total_fragments = len(fragments)
if total_fragments == 0 and not autocomplete_fragments:
print("错误: 无 IR 片段可合并 (fragments 和 autocomplete_fragments 均为空)。")
print(" 请检查 step2_ir_extraction 是否正确运行。")
print(" 可能原因: step1 未生成 function_units,或 step2 提取失败。")
sys.exit(1)
feature_name = semantic_index.get("feature_name", "行车娱乐限制") feature_name = semantic_index.get("feature_name", "行车娱乐限制")
feature_id = "DRL-001" feature_id = "DRL-001"
print(f" 功能: {feature_name} ({feature_id})") print(f" 功能: {feature_name} ({feature_id})")
print(f" 主片段: {len(fragments)}") print(f" 主片段: {total_fragments}")
if autocomplete_fragments: if autocomplete_fragments:
print(f" 自动补全片段: {len(autocomplete_fragments)}") print(f" 自动补全片段: {len(autocomplete_fragments)}")
@@ -376,10 +376,13 @@ def _load_si_and_doc():
"""Try to load semantic_index.json and the input document. Returns (si, doc) or (None, None).""" """Try to load semantic_index.json and the input document. Returns (si, doc) or (None, None)."""
try: try:
si = config.load_json(config.SEMANTIC_INDEX_JSON) si = config.load_json(config.SEMANTIC_INDEX_JSON)
doc = config.load_input_document()
return si, doc
except FileNotFoundError: except FileNotFoundError:
return None, None return None, None
try:
doc = config.load_input_document()
except (FileNotFoundError, SystemExit):
return None, None
return si, doc
def test_step1_unit_ids(): def test_step1_unit_ids():
@@ -160,6 +160,8 @@ def test_step2_5_path_enumeration():
path_data = config.load_json(config.PATH_ENUM_JSON) path_data = config.load_json(config.PATH_ENUM_JSON)
except FileNotFoundError: except FileNotFoundError:
pytest.skip("path_enumeration.json not found — run step2_5_branch_coverage.py first") pytest.skip("path_enumeration.json not found — run step2_5_branch_coverage.py first")
if path_data.get("total_paths", 0) == 0:
pytest.skip("path_enumeration.json has 0 paths — pipeline may have failed upstream")
errors = check_path_enumeration(path_data) errors = check_path_enumeration(path_data)
assert not errors, f"path enumeration errors: {errors}" assert not errors, f"path enumeration errors: {errors}"
@@ -235,11 +235,14 @@ import pytest # noqa: E402
def _load_ir_final_or_skip(): def _load_ir_final_or_skip():
"""Load ir_final.json or return None.""" """Load ir_final.json. Returns None if file missing or rules empty (failed pipeline)."""
try: try:
return config.load_json(config.IR_FINAL_JSON) data = config.load_json(config.IR_FINAL_JSON)
except FileNotFoundError: except FileNotFoundError:
return None return None
if not data.get("rules"):
return None # Skip: pipeline produced empty results
return data
def _load_audit_report_or_skip(): def _load_audit_report_or_skip():