Добавить dogfood-манифест stage-loop

2026-05-09 13:34:56 +03:00 · 2026-05-09 13:34:56 +03:00 · 913745380f
parent de1aa3d17c
commit 913745380f
5 changed files with 193 additions and 1 deletions
--- a/docs/orchestration/agentic_semantic_development_loop_stage_pack.json
+++ b/docs/orchestration/agentic_semantic_development_loop_stage_pack.json
@ -0,0 +1,100 @@
 {
  "schema_version": "domain_scenario_pack_v1",
  "pack_id": "agentic_semantic_development_loop_stage_pack",
  "domain": "agentic_semantic_development_loop_control",
  "title": "Agentic semantic development loop control pack",
  "description": "Compact stage pack for dogfooding the agentic development loop against business-overview, VAT, stale-scope, and legacy-canary questions.",
  "analysis_context": {
    "as_of_date": "2026-05-09",
    "source": "agentic_semantic_development_loop_stage_pack"
  },
  "bindings": {
    "main_organization": "ООО Альтернатива Плюс",
    "control_year": "2020",
    "svk_counterparty": "Группа СВК"
  },
  "scenarios": [
    {
      "scenario_id": "agentic_loop_business_overview_control",
      "title": "Business overview and stale-scope control",
      "description": "Checks direct business-answer shape, period carryover, all-time reset, VAT boundary, and organization scope hygiene.",
      "steps": [
        {
          "step_id": "step_01_business_overview",
          "title": "Business overview for explicit period",
          "question": "Дай взрослый бизнес-обзор {{bindings.main_organization}} за {{bindings.control_year}} год по данным 1С: обороты, входящие и исходящие деньги, нетто, НДС, долги, склад, клиенты, поставщики и что пока нельзя утверждать.",
          "expected_intents": ["business_overview"],
          "required_answer_shape": "direct_answer_first",
          "forbidden_answer_patterns": [
            "(?i)capability_id",
            "(?i)selected_chain_id",
            "(?i)runtime_",
            "(?i)business_overview_route_template_v1"
          ]
        },
        {
          "step_id": "step_02_money_followup",
          "title": "Money follow-up",
          "question": "Раскрой деньги подробнее: сколько получили, сколько заплатили, какой чистый денежный поток, кто главный клиент и главный поставщик в {{bindings.control_year}}.",
          "depends_on": ["step_01_business_overview"],
          "required_answer_shape": "direct_answer_first"
        },
        {
          "step_id": "step_03_best_year_all_time",
          "title": "All-time best operating-flow year",
          "question": "А если смотреть за все доступное время, какой самый доходный год по подтвержденным оборотам и почему? Не называй это бухгалтерской прибылью, если чистой прибыли нет.",
          "depends_on": ["step_02_money_followup"],
          "required_answer_shape": "direct_answer_first"
        },
        {
          "step_id": "step_04_vat_explicit_period",
          "title": "VAT explicit period",
          "question": "Что с НДС за {{bindings.control_year}} год по {{bindings.main_organization}}: какая позиция видна, на чем она основана и чего не хватает для налогового вывода?",
          "depends_on": ["step_03_best_year_all_time"],
          "required_answer_shape": "direct_answer_first"
        },
        {
          "step_id": "step_05_all_time_no_vat_carryover",
          "title": "All-time reset without stale VAT carryover",
          "question": "Теперь за все доступное время дай обзор компании в целом, но не тащи НДС за {{bindings.control_year}} как подтвержденную общую налоговую позицию.",
          "depends_on": ["step_04_vat_explicit_period"],
          "required_answer_shape": "direct_answer_first"
        }
      ]
    },
    {
      "scenario_id": "agentic_loop_counterparty_pivot_control",
      "title": "Counterparty pivot and legacy canaries",
      "description": "Checks explicit counterparty arbitration after organization context and keeps technical/debug details out of the final answer.",
      "steps": [
        {
          "step_id": "step_01_svk_money",
          "title": "Explicit counterparty money flow",
          "question": "Теперь отдельно по контрагенту {{bindings.svk_counterparty}}: сколько денег прошло, что входящее, что исходящее и есть ли документы или движения, на которых это основано?",
          "expected_intents": ["value_flow"],
          "required_answer_shape": "direct_answer_first",
          "forbidden_answer_patterns": [
            "(?i)capability_id",
            "(?i)selected_chain_id",
            "(?i)runtime_",
            "(?i)mcp_discovery"
          ]
        },
        {
          "step_id": "step_02_svk_documents",
          "title": "Counterparty documents follow-up",
          "question": "Покажи документы по этой цепочке и не смешивай {{bindings.svk_counterparty}} с организацией {{bindings.main_organization}}.",
          "depends_on": ["step_01_svk_money"],
          "required_answer_shape": "direct_answer_first"
        },
        {
          "step_id": "step_03_final_summary",
          "title": "Final executive summary",
          "question": "Собери короткий итог: что мы подтвердили по компании, что отдельно по {{bindings.svk_counterparty}}, какие выводы можно делать и какие нельзя.",
          "depends_on": ["step_01_svk_money", "step_02_svk_documents"],
          "required_answer_shape": "direct_answer_first"
        }
      ]
    }
  ]
 }
--- a/docs/orchestration/domain_scenario_loop_repo_adapter.md
+++ b/docs/orchestration/domain_scenario_loop_repo_adapter.md
@ -145,7 +145,7 @@ It stores the GUI review under `artifacts/domain_runs/stage_agent_loops/<stage_i
 Use `python scripts/stage_agent_loop.py status --manifest docs/orchestration/<stage_loop>.json` as the cheap read-only checkpoint before continuing a stage. It prints the current next action, closing gate, latest GUI run, latest repair coder status, and latest repair validation status without modifying artifacts.
-Use `python scripts/stage_agent_loop.py continue --manifest docs/orchestration/<stage_loop>.json` as the safe one-command continuation layer. It can prepare a repair iteration and materialize `run-repair --dry-run` automatically; it will not run the real coder pass unless `--execute-repair` is passed, and it waits for a `--run-id assistant-stage1-<id>` when the next required step is post-repair rerun/ingest validation.
+Use `python scripts/stage_agent_loop.py continue --manifest docs/orchestration/<stage_loop>.json` as the safe one-command continuation layer. From a cold start it materializes `domain_pack_loop.command.txt` without launching the long live loop; after a GUI review it can prepare a repair iteration and materialize `run-repair --dry-run` automatically; it will not run the real coder pass unless `--execute-repair` is passed, and it waits for a `--run-id assistant-stage1-<id>` when the next required step is post-repair rerun/ingest validation.
 It also writes `stage_repair_handoff.md/json` next to the stage summary. That handoff is the preferred input for the next coder pass: it lists primary repair targets and sample user-facing failures without forcing the coder to reread the entire GUI conversation first.
--- a/docs/orchestration/stage_agent_loop_agentic_semantic_development_loop.json
+++ b/docs/orchestration/stage_agent_loop_agentic_semantic_development_loop.json
@ -0,0 +1,27 @@
 {
  "schema_version": "stage_agent_loop_manifest_v1",
  "stage_id": "agentic_semantic_development_loop",
  "module_name": "Agentic Semantic Development Loop",
  "title": "Agentic semantic development loop dogfood gate",
  "architecture_phase": "turnaround_11_agentic_semantic_development_loop",
  "agent_focus": "Automate stage implementation, semantic replay review, repair handoff, coder pass, rerun validation, and final human confirmation.",
  "current_stage_status": "active_dogfood",
  "global_plan_refs": [
    "docs/orchestration/domain_scenario_loop_repo_adapter.md",
    "docs/ARCH/11 - architecture_turnaround/README.md",
    "AGENTS.md codex_domain_loop and agent_semantic_runs"
  ],
  "pack_manifest": "docs/orchestration/agentic_semantic_development_loop_stage_pack.json",
  "loop_id": "agentic_semantic_development_loop",
  "target_score": 88,
  "max_iterations": 6,
  "acceptance_invariants": [
    "status command exposes next_action, repair state, validation state, and closing gate",
    "continue command never runs the real coder pass without --execute-repair",
    "patched repair cannot close the stage without successful rerun/ingest validation",
    "business answers remain direct, context-aware, and free of internal route/debug ids",
    "manual GUI confirmation remains required after accepted semantic replay"
  ],
  "save_autorun_on_accept": true,
  "manual_confirmation_required_after_accept": true
 }
--- a/scripts/stage_agent_loop.py
+++ b/scripts/stage_agent_loop.py
@ -1265,6 +1265,32 @@ def handle_continue(args: argparse.Namespace) -> int:
                    ),
                }
            )
    elif next_action == "run_stage_loop_or_ingest_gui_run":
        if getattr(args, "run_id", None):
            ingest_summary = ingest_gui_run_review(args)
            payload.update(
                {
                    "performed_action": "ingest_gui_run_from_cold_start",
                    "ingest_summary": ingest_summary,
                    "next_action": ingest_summary.get("next_action"),
                }
            )
        else:
            write_json(stage_dir / "stage_manifest.json", stage_manifest)
            write_text(stage_dir / "stage_manifest_source.txt", repo_relative(stage_manifest_path) + "\n")
            command = build_domain_pack_loop_command(args, stage_manifest, stage_dir)
            write_text(stage_dir / "domain_pack_loop.command.txt", " ".join(command) + "\n")
            payload.update(
                {
                    "performed_action": "materialize_stage_run_dry_run",
                    "domain_pack_loop_command": command,
                    "next_action": next_action,
                    "suggested_command": (
                        "python scripts/stage_agent_loop.py run "
                        "--manifest <stage_manifest.json>"
                    ),
                }
            )
    else:
        payload.update(
            {
--- a/scripts/test_stage_agent_loop.py
+++ b/scripts/test_stage_agent_loop.py
@ -778,6 +778,45 @@ class StageAgentLoopTests(unittest.TestCase):
        self.assertEqual(result["performed_action"], "wait_for_rerun_ingest")
        self.assertEqual(result["next_action"], "rerun_same_stage_or_gui_and_ingest_result")
    def test_handle_continue_materializes_stage_run_from_cold_start(self) -> None:
        with tempfile.TemporaryDirectory() as tmp:
            root = Path(tmp)
            manifest_path = root / "stage.json"
            output_root = root / "stage_runs"
            stage_dir = output_root / "agent_loop"
            write_json(
                manifest_path,
                {
                    "stage_id": "agent_loop",
                    "module_name": "Agent Loop",
                    "title": "Agent Loop",
                    "pack_manifest": "docs/orchestration/demo_pack.json",
                },
            )
            exit_code = stage_loop.handle_continue(
                stage_args(
                    manifest=str(manifest_path),
                    output_root=str(output_root),
                    handoff=None,
                    iteration_id=None,
                    plan=None,
                    coder_schema=str(root / "coder.schema.json"),
                    execute_repair=False,
                    run_id=None,
                    session_file=None,
                    sessions_dir=str(root / "sessions"),
                    reports_dir=str(root / "reports"),
                    review_output_dir=None,
                )
            )
            result = json.loads((stage_dir / "stage_continue_result.json").read_text(encoding="utf-8"))
            command_text = (stage_dir / "domain_pack_loop.command.txt").read_text(encoding="utf-8")
        self.assertEqual(exit_code, 0)
        self.assertEqual(result["performed_action"], "materialize_stage_run_dry_run")
        self.assertIn("run-pack-loop", command_text)
    def test_resolve_stage_repair_iteration_auto_prepares_from_handoff(self) -> None:
        with tempfile.TemporaryDirectory() as tmp:
            root = Path(tmp)