From 6ddd61f9756acfbb5f3a6941526bac7cb8e156cf Mon Sep 17 00:00:00 2001 From: dctouch Date: Sat, 23 May 2026 22:13:25 +0300 Subject: [PATCH] =?UTF-8?q?=D0=94=D0=BE=D0=B1=D0=B0=D0=B2=D0=B8=D1=82?= =?UTF-8?q?=D1=8C=20AGENT-=D0=BF=D1=80=D0=BE=D0=B3=D0=BE=D0=BD=20selected-?= =?UTF-8?q?object=20=D0=B8=20multi-org=20=D0=BA=D0=BE=D0=BD=D1=82=D0=B5?= =?UTF-8?q?=D0=BA=D1=81=D1=82=D0=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- ...autonomy_selected_object_mix_20260523.json | 378 ++++++++++++++++++ .../data/autorun_generators/history.json | 66 +++ ..._20260523191234_gen-ag05231912-4420c2.json | 259 ++++++++++++ ..._20260523191234_gen-ag05231912-4420c2.json | 70 ++++ 4 files changed, 773 insertions(+) create mode 100644 docs/orchestration/agent_autonomy_selected_object_mix_20260523.json create mode 100644 llm_normalizer/data/autorun_generators/saved_sessions/assistant_saved_session_20260523191234_gen-ag05231912-4420c2.json create mode 100644 llm_normalizer/data/eval_cases/assistant_autogen_saved_user_sessions_20260523191234_gen-ag05231912-4420c2.json diff --git a/docs/orchestration/agent_autonomy_selected_object_mix_20260523.json b/docs/orchestration/agent_autonomy_selected_object_mix_20260523.json new file mode 100644 index 0000000..390af0d --- /dev/null +++ b/docs/orchestration/agent_autonomy_selected_object_mix_20260523.json @@ -0,0 +1,378 @@ +{ + "schema_version": "domain_truth_harness_spec_v1", + "scenario_id": "address_truth_harness_phase7_meta_domain_mix", + "domain": "address_phase7_meta_domain_mix", + "title": "Phase 7 mixed replay for documents, selected-object continuity, meta context, and cross-domain pivots", + "description": "Mixed AGENT replay for turnaround 11. The pack interleaves counterparty documents, inventory root and selected-object continuity, meta-space interruptions, memory recap, receivables to inventory same-date pivot, and an account 60 tail check.", + "bindings": {}, + "steps": [ + { + "step_id": "step_01_smalltalk", + "title": "Casual chat stays human and non-technical", + "question": "привет, как дела?", + "required_answer_patterns_any": [ + "(?i)привет|дела|помочь|норм" + ], + "forbidden_answer_patterns": [ + "(?i)tool_gate_reason", + "(?i)address_mode", + "(?i)hard_meta_mode", + "(?i)living_reason" + ], + "criticality": "info", + "semantic_tags": [ + "meta_smalltalk" + ], + "notes": "[mixed_pack_slot=slot_01_smalltalk source=address_truth_harness_phase6_provider_axis_mix:step_01_smalltalk]" + }, + { + "step_id": "step_01_counterparty_documents", + "title": "Counterparty documents use the normalized legal name", + "question": "покажи все документы по чепурнову", + "allowed_reply_types": [ + "factual" + ], + "expected_intents": [ + "list_documents_by_counterparty" + ], + "required_direct_answer_patterns_any": [ + "(?i)контрагент:", + "(?i)чепурнов" + ], + "criticality": "critical", + "semantic_tags": [ + "counterparty_documents" + ], + "notes": "[mixed_pack_slot=slot_03_counterparty_documents source=address_truth_harness_phase4_coverage_evidence_mix:step_01_counterparty_documents]" + }, + { + "step_id": "step_02_counterparty_shipments_or_fallback", + "title": "Supplier shipment question stays human even when exact supply rows are absent", + "question": "что нам отгружал чепурнов, какой товар или услугу?", + "allowed_reply_types": [ + "factual", + "partial_coverage" + ], + "expected_intents": [ + "list_documents_by_counterparty" + ], + "required_direct_answer_patterns_any": [ + "(?i)чепурнов", + "(?i)постав", + "(?i)оплат|возврат|товар|услуг" + ], + "forbidden_direct_answer_patterns": [ + "(?i)^сейчас не дам прямой адресный ответ", + "(?i)^в текущем адресном контуре этот запрос лучше не закрывать в лоб" + ], + "criticality": "critical", + "semantic_tags": [ + "counterparty_shipment_fallback" + ], + "notes": "[mixed_pack_slot=slot_04_counterparty_shipment_fallback source=address_truth_harness_phase4_coverage_evidence_mix:step_02_counterparty_shipments_or_fallback]" + }, + { + "step_id": "step_01_inventory_march_2021", + "title": "Inventory root snapshot at March 2021 asks organization in multi-company scope", + "criticality": "critical", + "question": "какие остатки на складе на март 2021", + "allowed_reply_types": [ + "partial_coverage", + "factual" + ], + "expected_intents": [ + "inventory_on_hand_as_of_date" + ], + "required_filters": { + "as_of_date": "2021-03-31" + }, + "required_direct_answer_patterns_any": [ + "(?i)организац", + "(?i)компан", + "31\\.03\\.2021", + "(?i)на складе", + "(?i)столешница 600\\*3050\\*26 альмандин" + ], + "semantic_tags": [ + "inventory_root" + ], + "notes": "[mixed_pack_slot=slot_05_inventory_root source=address_truth_harness_phase7_acceptance_gate_mix:step_01_inventory_march_2021]" + }, + { + "step_id": "step_01b_inventory_march_2021_org_selection", + "title": "Organization selection resumes suspended inventory root snapshot", + "criticality": "critical", + "question": "АЛЬТЕРНАТИВА", + "allowed_reply_types": [ + "factual", + "partial_coverage" + ], + "expected_intents": [ + "inventory_on_hand_as_of_date" + ], + "required_filters": { + "as_of_date": "2021-03-31" + }, + "required_direct_answer_patterns_any": [ + "31\\.03\\.2021", + "(?i)на складе", + "(?i)столешница 600\\*3050\\*26 альмандин" + ], + "forbidden_answer_patterns": [ + "(?i)нужно уточнить организацию", + "(?i)по какой организации", + "runtime_", + "planner_", + "query_movements", + "primitive" + ], + "semantic_tags": [ + "inventory_root", + "clarification_continuation", + "multi_company_scope" + ], + "notes": "[agent_extension=multi_org_clarification_continuation source=agent_autonomy_selected_object_mix]" + }, + { + "step_id": "step_02_selected_item_supplier", + "title": "Selected-object supplier provenance", + "criticality": "critical", + "question": "По выбранному объекту \"Столешница 600*3050*26 альмандин\": кто нам это поставил?", + "allowed_reply_types": [ + "factual" + ], + "expected_intents": [ + "inventory_purchase_provenance_for_item" + ], + "required_direct_answer_patterns_any": [ + "(?i)столешница 600\\*3050\\*26 альмандин", + "(?i)поставщик|поставил|куплен", + "(?i)союз|торговый дом" + ], + "forbidden_direct_answer_patterns": [ + "(?i)^на 31\\.03\\.2021 на складе", + "(?i)^сейчас не дам прямой адресный ответ" + ], + "semantic_tags": [ + "selected_object", + "selected_object_supplier" + ], + "notes": "[mixed_pack_slot=slot_06_selected_object_supplier source=address_truth_harness_phase7_acceptance_gate_mix:step_02_selected_item_supplier]" + }, + { + "step_id": "step_05_capability_meta_interrupt", + "title": "Capability meta question does not break the address context", + "question": "что ты умеешь?", + "required_answer_patterns_any": [ + "(?i)могу|умею", + "(?i)остатк|документ|контрагент|ндс" + ], + "forbidden_answer_patterns": [ + "(?i)tool_gate_reason", + "(?i)address_mode" + ], + "criticality": "warning", + "semantic_tags": [ + "meta_capability" + ], + "notes": "[mixed_pack_slot=slot_07_meta_capability source=address_truth_harness_phase5_meta_memory_mix:step_05_capability_meta_interrupt]" + }, + { + "step_id": "step_03_selected_item_documents", + "title": "Selected-object documents stay in the same contour", + "criticality": "critical", + "question": "По выбранному объекту \"Столешница 600*3050*26 альмандин\": покажи документы по этой позиции", + "allowed_reply_types": [ + "factual" + ], + "expected_intents": [ + "inventory_purchase_documents_for_item" + ], + "required_direct_answer_patterns_any": [ + "(?i)столешница 600\\*3050\\*26 альмандин", + "(?i)документ", + "(?i)союз|торговый дом" + ], + "semantic_tags": [ + "selected_object", + "selected_object_documents" + ], + "notes": "[mixed_pack_slot=slot_08_selected_object_documents source=address_truth_harness_phase7_acceptance_gate_mix:step_03_selected_item_documents]" + }, + { + "step_id": "step_06_memory_recap_after_interrupts", + "title": "Memory recap still remembers the selected object after meta interruptions", + "question": "а ты помнишь, что мы по этой позиции уже выяснили?", + "required_answer_patterns_any": [ + "(?i)помню", + "(?i)столешница 600\\*3050\\*26 альмандин", + "(?i)позици" + ], + "forbidden_answer_patterns": [ + "(?i)^сейчас не дам прямой адресный ответ", + "(?i)^в текущем адресном контуре этот запрос лучше не закрывать в лоб" + ], + "criticality": "warning", + "semantic_tags": [ + "meta_memory" + ], + "required_answer_patterns_all": [ + "(?i)помню", + "(?i)столешница 600\\*3050\\*26 альмандин" + ], + "notes": "[mixed_pack_slot=slot_09_meta_memory source=address_truth_harness_phase5_meta_memory_mix:step_06_memory_recap_after_interrupts]" + }, + { + "step_id": "step_04_inventory_same_date_restore", + "title": "Same-date restore returns to the March root snapshot", + "criticality": "critical", + "question": "покажи еще раз остатки на эту же дату", + "allowed_reply_types": [ + "factual" + ], + "expected_intents": [ + "inventory_on_hand_as_of_date" + ], + "required_filters": { + "as_of_date": "2021-03-31", + "period_from": "2021-03-01", + "period_to": "2021-03-31" + }, + "required_direct_answer_patterns_any": [ + "31\\.03\\.2021", + "(?i)на складе" + ], + "forbidden_direct_answer_patterns": [ + "(?i)^сейчас не дам прямой адресный ответ", + "(?i)transition_not_supported_by_capability" + ], + "semantic_tags": [ + "inventory_root", + "same_date_restore" + ], + "notes": "[mixed_pack_slot=slot_10_same_date_restore source=address_truth_harness_phase7_acceptance_gate_mix:step_04_inventory_same_date_restore]" + }, + { + "step_id": "step_02_receivables_march_2020", + "title": "Receivables at March 2020", + "question": "кто нам должен на март 2020", + "allowed_reply_types": [ + "factual" + ], + "expected_intents": [ + "receivables_confirmed_as_of_date" + ], + "expected_capability": "confirmed_receivables_as_of_date", + "expected_result_mode": "confirmed_balance", + "required_filters": { + "as_of_date": "2020-03-31", + "period_from": "2020-03-01", + "period_to": "2020-03-31" + }, + "required_direct_answer_patterns_any": [ + "31\\.03\\.2020", + "(?i)дебиторск" + ], + "notes": "Базовый корневой финансовый вопрос должен отработать точно и задать март 2020 как carryover-якорь. [mixed_pack_slot=slot_11_receivables_root source=address_truth_harness_test2:step_02_receivables_march_2020]", + "criticality": "critical", + "semantic_tags": [ + "settlements_receivables" + ] + }, + { + "step_id": "step_03_inventory_same_date", + "title": "Inventory on the same date", + "question": "остатки по складу на эту же дату", + "allowed_reply_types": [ + "factual" + ], + "expected_intents": [ + "inventory_on_hand_as_of_date" + ], + "expected_capability": "confirmed_inventory_on_hand_as_of_date", + "expected_result_mode": "confirmed_balance", + "required_filters": { + "as_of_date": "{{step_02_receivables_march_2020.filters.as_of_date}}", + "period_from": "{{step_02_receivables_march_2020.filters.period_from}}", + "period_to": "{{step_02_receivables_march_2020.filters.period_to}}" + }, + "required_direct_answer_patterns_any": [ + "31\\.03\\.2020", + "(?i)на складе" + ], + "notes": "Смена контура receivables -> inventory должна сохранить ту же дату, без дополнительного ручного уточнения. [mixed_pack_slot=slot_12_same_date_pivot source=address_truth_harness_test2:step_03_inventory_same_date]", + "criticality": "critical", + "semantic_tags": [ + "inventory_root", + "same_date_pivot" + ] + }, + { + "step_id": "step_06_historical_capability_followup", + "title": "Historical capability follow-up stays human", + "criticality": "warning", + "question": "а исторические остатки тоже можешь?", + "required_answer_patterns_any": [ + "(?i)историческ|история", + "(?i)могу|умею" + ], + "forbidden_answer_patterns": [ + "(?i)^сейчас не дам прямой адресный ответ", + "(?i)^в текущем адресном контуре этот запрос лучше не закрывать в лоб", + "(?i)tool_gate_reason", + "(?i)hard_meta_mode" + ], + "semantic_tags": [ + "meta_historical_capability", + "inventory_root" + ], + "notes": "[mixed_pack_slot=slot_13_meta_historical source=address_truth_harness_phase7_acceptance_gate_mix:step_06_historical_capability_followup]" + }, + { + "step_id": "step_04_open_items_account_60", + "title": "Account 60 tails for August 2022", + "question": "хвосты покажи по счету 60 на август 2022", + "allowed_reply_types": [ + "factual", + "factual_with_explanation" + ], + "expected_intents": [ + "open_items_by_counterparty_or_contract" + ], + "required_filters": { + "account": "60", + "period_from": "2022-08-01", + "period_to": "2022-08-31", + "as_of_date": "2022-08-31" + }, + "required_direct_answer_patterns_any": [ + "(?i)счету 60", + "(?i)хвост" + ], + "criticality": "critical", + "semantic_tags": [ + "settlements_account_60" + ], + "notes": "[mixed_pack_slot=slot_14_account_60 source=address_truth_harness_targeted_counterparty_tails:step_04_open_items_account_60]" + }, + { + "step_id": "step_02_data_scope_meta", + "title": "Data-scope meta question stays deterministic and non-technical", + "question": "по какой компании мы сейчас работаем?", + "required_answer_patterns_any": [ + "(?i)компан|организац|контур", + "(?i)работ" + ], + "forbidden_answer_patterns": [ + "(?i)tool_gate_reason", + "(?i)hard_meta_mode", + "(?i)living_reason" + ], + "criticality": "warning", + "semantic_tags": [ + "meta_scope" + ], + "notes": "[mixed_pack_slot=slot_15_meta_scope source=address_truth_harness_phase6_provider_axis_mix:step_02_data_scope_meta]" + } + ] +} diff --git a/llm_normalizer/data/autorun_generators/history.json b/llm_normalizer/data/autorun_generators/history.json index 7553e3d..d09a27f 100644 --- a/llm_normalizer/data/autorun_generators/history.json +++ b/llm_normalizer/data/autorun_generators/history.json @@ -1,4 +1,70 @@ [ + { + "generation_id": "gen-ag05231912-4420c2", + "created_at": "2026-05-23T19:12:34+00:00", + "mode": "saved_user_sessions", + "title": "AGENT | selected-object + multi-org context mix", + "count": 15, + "domain": "address_phase7_meta_domain_mix", + "questions": [ + "привет, как дела?", + "покажи все документы по чепурнову", + "что нам отгружал чепурнов, какой товар или услугу?", + "какие остатки на складе на март 2021", + "АЛЬТЕРНАТИВА", + "По выбранному объекту \"Столешница 600*3050*26 альмандин\": кто нам это поставил?", + "что ты умеешь?", + "По выбранному объекту \"Столешница 600*3050*26 альмандин\": покажи документы по этой позиции", + "а ты помнишь, что мы по этой позиции уже выяснили?", + "покажи еще раз остатки на эту же дату", + "кто нам должен на март 2020", + "остатки по складу на эту же дату", + "а исторические остатки тоже можешь?", + "хвосты покажи по счету 60 на август 2022", + "по какой компании мы сейчас работаем?" + ], + "generated_by": "codex_agent", + "saved_case_set_file": "assistant_autogen_saved_user_sessions_20260523191234_gen-ag05231912-4420c2.json", + "context": { + "llm_provider": null, + "model": null, + "assistant_prompt_version": null, + "decomposition_prompt_version": null, + "prompt_fingerprint": null, + "autogen_personality_id": null, + "autogen_personality_prompt": null, + "source_session_id": null, + "saved_session_file": "assistant_saved_session_20260523191234_gen-ag05231912-4420c2.json", + "saved_case_set_kind": "agent_semantic_scenario", + "agent_run": true, + "agent_focus": "selected-object continuity, multi-org clarification, meta interruption recovery", + "architecture_phase": "autonomy_selected_object_context", + "source_spec_file": "X:\\1C\\NDC_1C\\docs\\orchestration\\agent_autonomy_selected_object_mix_20260523.json", + "scenario_id": "address_truth_harness_phase7_meta_domain_mix", + "semantic_tags": [ + "clarification_continuation", + "counterparty_documents", + "counterparty_shipment_fallback", + "inventory_root", + "meta_capability", + "meta_historical_capability", + "meta_memory", + "meta_scope", + "meta_smalltalk", + "multi_company_scope", + "same_date_pivot", + "same_date_restore", + "selected_object", + "selected_object_documents", + "selected_object_supplier", + "settlements_account_60", + "settlements_receivables" + ], + "validation_status": "accepted_live_replay", + "validated_run_dir": "artifacts\\domain_runs\\agent_autonomy_selected_object_mix_live_accepted_20260523", + "saved_after_validated_replay": true + } + }, { "generation_id": "gen-ag05231858-323f86", "created_at": "2026-05-23T18:58:48+00:00", diff --git a/llm_normalizer/data/autorun_generators/saved_sessions/assistant_saved_session_20260523191234_gen-ag05231912-4420c2.json b/llm_normalizer/data/autorun_generators/saved_sessions/assistant_saved_session_20260523191234_gen-ag05231912-4420c2.json new file mode 100644 index 0000000..3dc1849 --- /dev/null +++ b/llm_normalizer/data/autorun_generators/saved_sessions/assistant_saved_session_20260523191234_gen-ag05231912-4420c2.json @@ -0,0 +1,259 @@ +{ + "saved_at": "2026-05-23T19:12:34+00:00", + "generation_id": "gen-ag05231912-4420c2", + "mode": "saved_user_sessions", + "title": "AGENT | selected-object + multi-org context mix", + "agent_run": true, + "questions": [ + "привет, как дела?", + "покажи все документы по чепурнову", + "что нам отгружал чепурнов, какой товар или услугу?", + "какие остатки на складе на март 2021", + "АЛЬТЕРНАТИВА", + "По выбранному объекту \"Столешница 600*3050*26 альмандин\": кто нам это поставил?", + "что ты умеешь?", + "По выбранному объекту \"Столешница 600*3050*26 альмандин\": покажи документы по этой позиции", + "а ты помнишь, что мы по этой позиции уже выяснили?", + "покажи еще раз остатки на эту же дату", + "кто нам должен на март 2020", + "остатки по складу на эту же дату", + "а исторические остатки тоже можешь?", + "хвосты покажи по счету 60 на август 2022", + "по какой компании мы сейчас работаем?" + ], + "metadata": { + "assistant_prompt_version": null, + "decomposition_prompt_version": null, + "prompt_fingerprint": null, + "agent_focus": "selected-object continuity, multi-org clarification, meta interruption recovery", + "architecture_phase": "autonomy_selected_object_context", + "source_spec_file": "X:\\1C\\NDC_1C\\docs\\orchestration\\agent_autonomy_selected_object_mix_20260523.json", + "scenario_id": "address_truth_harness_phase7_meta_domain_mix", + "semantic_tags": [ + "clarification_continuation", + "counterparty_documents", + "counterparty_shipment_fallback", + "inventory_root", + "meta_capability", + "meta_historical_capability", + "meta_memory", + "meta_scope", + "meta_smalltalk", + "multi_company_scope", + "same_date_pivot", + "same_date_restore", + "selected_object", + "selected_object_documents", + "selected_object_supplier", + "settlements_account_60", + "settlements_receivables" + ], + "validation_status": "accepted_live_replay", + "validated_run_dir": "artifacts\\domain_runs\\agent_autonomy_selected_object_mix_live_accepted_20260523", + "saved_after_validated_replay": true, + "save_gate": { + "schema_version": "agent_semantic_save_gate_v1", + "validation_status": "accepted_live_replay", + "validated_run_dir": "artifacts\\domain_runs\\agent_autonomy_selected_object_mix_live_accepted_20260523", + "final_status": "accepted", + "review_overall_status": "pass", + "business_overall_status": "pass", + "steps_total": 15, + "steps_passed": 15, + "steps_failed": 0, + "steps_with_business_failures": 0, + "steps_with_business_warnings": 0, + "acceptance_gate_passed": true, + "saved_after_validated_replay": true + } + }, + "source_session_id": null, + "session": { + "session_id": null, + "mode": "agent_semantic_run", + "items": [ + { + "message_id": "agent-user-001", + "role": "user", + "text": "привет, как дела?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-002", + "role": "user", + "text": "покажи все документы по чепурнову", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-003", + "role": "user", + "text": "что нам отгружал чепурнов, какой товар или услугу?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-004", + "role": "user", + "text": "какие остатки на складе на март 2021", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-005", + "role": "user", + "text": "АЛЬТЕРНАТИВА", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-006", + "role": "user", + "text": "По выбранному объекту \"Столешница 600*3050*26 альмандин\": кто нам это поставил?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-007", + "role": "user", + "text": "что ты умеешь?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-008", + "role": "user", + "text": "По выбранному объекту \"Столешница 600*3050*26 альмандин\": покажи документы по этой позиции", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-009", + "role": "user", + "text": "а ты помнишь, что мы по этой позиции уже выяснили?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-010", + "role": "user", + "text": "покажи еще раз остатки на эту же дату", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-011", + "role": "user", + "text": "кто нам должен на март 2020", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-012", + "role": "user", + "text": "остатки по складу на эту же дату", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-013", + "role": "user", + "text": "а исторические остатки тоже можешь?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-014", + "role": "user", + "text": "хвосты покажи по счету 60 на август 2022", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + }, + { + "message_id": "agent-user-015", + "role": "user", + "text": "по какой компании мы сейчас работаем?", + "created_at": "2026-05-23T19:12:34+00:00", + "reply_type": null, + "trace_id": null, + "debug": null + } + ], + "agent_run": true, + "metadata": { + "assistant_prompt_version": null, + "decomposition_prompt_version": null, + "prompt_fingerprint": null, + "agent_focus": "selected-object continuity, multi-org clarification, meta interruption recovery", + "architecture_phase": "autonomy_selected_object_context", + "source_spec_file": "X:\\1C\\NDC_1C\\docs\\orchestration\\agent_autonomy_selected_object_mix_20260523.json", + "scenario_id": "address_truth_harness_phase7_meta_domain_mix", + "semantic_tags": [ + "clarification_continuation", + "counterparty_documents", + "counterparty_shipment_fallback", + "inventory_root", + "meta_capability", + "meta_historical_capability", + "meta_memory", + "meta_scope", + "meta_smalltalk", + "multi_company_scope", + "same_date_pivot", + "same_date_restore", + "selected_object", + "selected_object_documents", + "selected_object_supplier", + "settlements_account_60", + "settlements_receivables" + ], + "validation_status": "accepted_live_replay", + "validated_run_dir": "artifacts\\domain_runs\\agent_autonomy_selected_object_mix_live_accepted_20260523", + "saved_after_validated_replay": true, + "save_gate": { + "schema_version": "agent_semantic_save_gate_v1", + "validation_status": "accepted_live_replay", + "validated_run_dir": "artifacts\\domain_runs\\agent_autonomy_selected_object_mix_live_accepted_20260523", + "final_status": "accepted", + "review_overall_status": "pass", + "business_overall_status": "pass", + "steps_total": 15, + "steps_passed": 15, + "steps_failed": 0, + "steps_with_business_failures": 0, + "steps_with_business_warnings": 0, + "acceptance_gate_passed": true, + "saved_after_validated_replay": true + } + } + } +} diff --git a/llm_normalizer/data/eval_cases/assistant_autogen_saved_user_sessions_20260523191234_gen-ag05231912-4420c2.json b/llm_normalizer/data/eval_cases/assistant_autogen_saved_user_sessions_20260523191234_gen-ag05231912-4420c2.json new file mode 100644 index 0000000..6ac8eff --- /dev/null +++ b/llm_normalizer/data/eval_cases/assistant_autogen_saved_user_sessions_20260523191234_gen-ag05231912-4420c2.json @@ -0,0 +1,70 @@ +{ + "suite_id": "assistant_saved_session_gen-ag05231912-4420c2", + "suite_version": "0.1.0", + "schema_version": "assistant_saved_session_suite_v0_1", + "generated_at": "2026-05-23T19:12:34+00:00", + "generation_id": "gen-ag05231912-4420c2", + "mode": "saved_user_sessions", + "title": "AGENT | selected-object + multi-org context mix", + "domain": "address_phase7_meta_domain_mix", + "scenario_count": 1, + "case_ids": [ + "SAVED-001" + ], + "cases": [ + { + "case_id": "SAVED-001", + "scenario_tag": "agent_saved_user_sessions", + "title": "AGENT | selected-object + multi-org context mix", + "question_type": "followup", + "broadness_level": "medium", + "turns": [ + { + "user_message": "привет, как дела?" + }, + { + "user_message": "покажи все документы по чепурнову" + }, + { + "user_message": "что нам отгружал чепурнов, какой товар или услугу?" + }, + { + "user_message": "какие остатки на складе на март 2021" + }, + { + "user_message": "АЛЬТЕРНАТИВА" + }, + { + "user_message": "По выбранному объекту \"Столешница 600*3050*26 альмандин\": кто нам это поставил?" + }, + { + "user_message": "что ты умеешь?" + }, + { + "user_message": "По выбранному объекту \"Столешница 600*3050*26 альмандин\": покажи документы по этой позиции" + }, + { + "user_message": "а ты помнишь, что мы по этой позиции уже выяснили?" + }, + { + "user_message": "покажи еще раз остатки на эту же дату" + }, + { + "user_message": "кто нам должен на март 2020" + }, + { + "user_message": "остатки по складу на эту же дату" + }, + { + "user_message": "а исторические остатки тоже можешь?" + }, + { + "user_message": "хвосты покажи по счету 60 на август 2022" + }, + { + "user_message": "по какой компании мы сейчас работаем?" + } + ] + } + ] +}