|
{ |
|
"test_name": "level_up_planning_block_purity_pr6960_370bffb", |
|
"run_id": "level_up_planning_block_purity_pr6960_370bffb-001-20260521T001830", |
|
"iteration": 1, |
|
"bundle_version": "1.2.0", |
|
"timestamp": "2026-05-21T00:18:30.280555+00:00", |
|
"bundle_timestamp": "2026-05-21T00:18:30.280555+00:00", |
|
"evidence_mode": "lightweight_prompt_tracking", |
|
"evidence_mode_notes": "System instruction captured as filenames + char_count (not full text). Raw LLM request/response payloads captured in request_responses.jsonl. Server logs in artifacts/. Bundle file inventory in artifacts/collection_log.txt.", |
|
"git_provenance": { |
|
"git_head": "370bffb4859be98b8bd64661c3b107022bee965a", |
|
"git_branch": "fix/pr6906-successor-cc-guards", |
|
"merge_base": "f457ae58ab501c948aab8e9ff110c54899836f20", |
|
"commits_ahead_of_main": 70, |
|
"diff_stat_vs_main": ".beads/issues.jsonl | 17 +\n .claude/skills/zfc-leveling-roadmap/SKILL.md | 15 +\n docs/design/pr-designs/pr-6958.html | 237 ++++++\n docs/design/pr-designs/pr-6958.md | 90 +++\n docs/design/pr-designs/pr-6960.html | 295 +++++++\n docs/design/pr-designs/pr-6960.md | 101 +++\n mvp_site/llm_providers/gemini_provider.py | 9 +-\n mvp_site/prompts/level_up_instruction.md | 25 +-\n mvp_site/prompts/planning_protocol.md | 27 +-\n mvp_site/prompts/rewards_system_instruction.md | 51 +-\n mvp_site/rewards_engine.py | 851 +++++++++++++++++----\n mvp_site/schemas/prompt_tool_contracts.json | 4 +-\n mvp_site/tests/data/modal_routing_fixtures.json | 3 +-\n mvp_site/tests/test_canonicalize_invariants.py | 15 +-\n mvp_site/tests/test_freeze_time_choices.py | 44 +-\n mvp_site/tests/test_prompts.py | 36 +\n mvp_site/tests/test_rewards_engine.py | 602 ++++++++++++++-\n mvp_site/tests/test_world_logic.py | 274 ++++++-\n mvp_site/world_logic.py | 519 +++++--------\n roadmap/README.md | 2 +\n .../nextsteps-2026-05-19-pr6958-review-fixes.md | 94 +++\n scripts/validate_imports.py | 323 +++++---\n testing_mcp/lib/server_utils.py | 7 +-\n testing_mcp/test_level_up_planning_block_purity.py | 102 ++-\n .../test_level_up_rewards_planning_atomicity.py | 20 +-\n ..._level_up_rewards_planning_atomicity_browser.py | 51 +-\n 26 files changed, 3019 insertions(+), 795 deletions(-)", |
|
"working_tree_dirty": false, |
|
"working_tree_staged_changes": 0, |
|
"working_tree_unstaged_changes": 0, |
|
"working_tree_changed_files": [], |
|
"working_tree_diff_sha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855" |
|
}, |
|
"server": { |
|
"base_url": "http://127.0.0.1:8076", |
|
"hostname": "127.0.0.1", |
|
"mode": "local", |
|
"port": "8076", |
|
"pid": 34592, |
|
"process_cmdline": "/opt/homebrew/Cellar/[email protected]/3.12.11/Frameworks/Python.framework/Versions/3.12/Resources/Python.app/Contents/MacOS/Python -m gunicorn mvp_site.main:app --bind 0.0.0.0:8076 --workers 1 --worker-class gthread --threads 4 --timeout 600 --max-requests 50 --access-logfile - --error-logfile - --log-level info", |
|
"env_vars": { |
|
"WORLDAI_DEV_MODE": "true", |
|
"TESTING": null, |
|
"MOCK_SERVICES_MODE": "false", |
|
"GOOGLE_APPLICATION_CREDENTIALS": "[SET - file:serviceAccountKey.json]", |
|
"WORLDAI_GOOGLE_APPLICATION_CREDENTIALS": "[SET - file:serviceAccountKey.json]", |
|
"FIRESTORE_EMULATOR_HOST": null, |
|
"PORT": "8076", |
|
"FIREBASE_PROJECT_ID": "worldarchitecture-ai", |
|
"GEMINI_API_KEY": "[SET - 39 chars]", |
|
"LLM_REQUEST_RESPONSE_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/llm_request_responses_1779322605433.jsonl", |
|
"HTTP_REQUEST_RESPONSE_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/http_request_responses_1779322605433.jsonl", |
|
"GEMINI_HTTP_REQUEST_RESPONSE_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/gemini_http_request_responses_1779322605433.jsonl", |
|
"MCP_TEST_PROVIDER_HTTP_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/provider_http_request_responses_1779322605433.jsonl" |
|
}, |
|
"lsof_output": "COMMAND PID USER FD TYPE DEVICE SIZE/OFF NODE NAME\nPython 34592 jleechan 5u IPv4 0xc83de4b93143e3b6 0t0 TCP *:8076 (LISTEN)\nPython 34605 jleechan 5u IPv4 0xc83de4b93143e3b6 0t0 TCP *:8076 (LISTEN)", |
|
"ps_output": "PID USER ELAPSED ARGS\n34592 jleechan 01:29 /opt/homebrew/Cellar/[email protected]/3.12.11/Frameworks/Python.framework/Versions/3.12/Resources/Python.app/Contents/MacOS/Python -m gunicorn mvp_site.main:app --bind 0.0.0.0:8076 --workers 1 --worker-class gthread --threads 4 --timeout 600 --max-requests 50 --access-logfile - --error-logfile - --log-level info" |
|
}, |
|
"provenance": { |
|
"git_fetch_origin_main": { |
|
"returncode": 0, |
|
"stdout": null, |
|
"stderr": "From https://github.com/jleechanorg/worldarchitect.ai\n * branch main -> FETCH_HEAD\nAuto packing the repository in background for optimum performance.\nSee \"git help gc\" for manual housekeeping.\nwarning: The last gc run reported the following. Please correct the root cause\nand remove /Users/jleechan/projects/worldarchitect.ai/.git/worktrees/worldarchitect-pr6960/gc.log\nAutomatic cleanup will not be performed until the file is removed.\n\nwarning: There are too many unreachable loose objects; run 'git prune' to remove them." |
|
}, |
|
"git_head": "370bffb4859be98b8bd64661c3b107022bee965a", |
|
"git_branch": "fix/pr6906-successor-cc-guards", |
|
"merge_base": "f457ae58ab501c948aab8e9ff110c54899836f20", |
|
"commits_ahead_of_main": 70, |
|
"diff_stat_vs_main": ".beads/issues.jsonl | 17 +\n .claude/skills/zfc-leveling-roadmap/SKILL.md | 15 +\n docs/design/pr-designs/pr-6958.html | 237 ++++++\n docs/design/pr-designs/pr-6958.md | 90 +++\n docs/design/pr-designs/pr-6960.html | 295 +++++++\n docs/design/pr-designs/pr-6960.md | 101 +++\n mvp_site/llm_providers/gemini_provider.py | 9 +-\n mvp_site/prompts/level_up_instruction.md | 25 +-\n mvp_site/prompts/planning_protocol.md | 27 +-\n mvp_site/prompts/rewards_system_instruction.md | 51 +-\n mvp_site/rewards_engine.py | 851 +++++++++++++++++----\n mvp_site/schemas/prompt_tool_contracts.json | 4 +-\n mvp_site/tests/data/modal_routing_fixtures.json | 3 +-\n mvp_site/tests/test_canonicalize_invariants.py | 15 +-\n mvp_site/tests/test_freeze_time_choices.py | 44 +-\n mvp_site/tests/test_prompts.py | 36 +\n mvp_site/tests/test_rewards_engine.py | 602 ++++++++++++++-\n mvp_site/tests/test_world_logic.py | 274 ++++++-\n mvp_site/world_logic.py | 519 +++++--------\n roadmap/README.md | 2 +\n .../nextsteps-2026-05-19-pr6958-review-fixes.md | 94 +++\n scripts/validate_imports.py | 323 +++++---\n testing_mcp/lib/server_utils.py | 7 +-\n testing_mcp/test_level_up_planning_block_purity.py | 102 ++-\n .../test_level_up_rewards_planning_atomicity.py | 20 +-\n ..._level_up_rewards_planning_atomicity_browser.py | 51 +-\n 26 files changed, 3019 insertions(+), 795 deletions(-)", |
|
"working_tree_staged_changes": 0, |
|
"working_tree_unstaged_changes": 0, |
|
"working_tree_untracked_files": 0, |
|
"working_tree_changed_files": [], |
|
"working_tree_diff_sha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855", |
|
"working_tree_dirty": false, |
|
"server": { |
|
"base_url": "http://127.0.0.1:8076", |
|
"hostname": "127.0.0.1", |
|
"mode": "local", |
|
"port": "8076", |
|
"pid": 34592, |
|
"process_cmdline": "/opt/homebrew/Cellar/[email protected]/3.12.11/Frameworks/Python.framework/Versions/3.12/Resources/Python.app/Contents/MacOS/Python -m gunicorn mvp_site.main:app --bind 0.0.0.0:8076 --workers 1 --worker-class gthread --threads 4 --timeout 600 --max-requests 50 --access-logfile - --error-logfile - --log-level info", |
|
"env_vars": { |
|
"WORLDAI_DEV_MODE": "true", |
|
"TESTING": null, |
|
"MOCK_SERVICES_MODE": "false", |
|
"GOOGLE_APPLICATION_CREDENTIALS": "[SET - file:serviceAccountKey.json]", |
|
"WORLDAI_GOOGLE_APPLICATION_CREDENTIALS": "[SET - file:serviceAccountKey.json]", |
|
"FIRESTORE_EMULATOR_HOST": null, |
|
"PORT": "8076", |
|
"FIREBASE_PROJECT_ID": "worldarchitecture-ai", |
|
"GEMINI_API_KEY": "[SET - 39 chars]", |
|
"LLM_REQUEST_RESPONSE_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/llm_request_responses_1779322605433.jsonl", |
|
"HTTP_REQUEST_RESPONSE_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/http_request_responses_1779322605433.jsonl", |
|
"GEMINI_HTTP_REQUEST_RESPONSE_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/gemini_http_request_responses_1779322605433.jsonl", |
|
"MCP_TEST_PROVIDER_HTTP_CAPTURE_PATH": "/tmp/worldarchitect.ai/fix_pr6906-successor-cc-guards/level_up_planning_block_purity_pr6960_370bffb/iteration_001/provider_http_request_responses_1779322605433.jsonl" |
|
}, |
|
"lsof_output": "COMMAND PID USER FD TYPE DEVICE SIZE/OFF NODE NAME\nPython 34592 jleechan 5u IPv4 0xc83de4b93143e3b6 0t0 TCP *:8076 (LISTEN)\nPython 34605 jleechan 5u IPv4 0xc83de4b93143e3b6 0t0 TCP *:8076 (LISTEN)", |
|
"ps_output": "PID USER ELAPSED ARGS\n34592 jleechan 01:29 /opt/homebrew/Cellar/[email protected]/3.12.11/Frameworks/Python.framework/Versions/3.12/Resources/Python.app/Contents/MacOS/Python -m gunicorn mvp_site.main:app --bind 0.0.0.0:8076 --workers 1 --worker-class gthread --threads 4 --timeout 600 --max-requests 50 --access-logfile - --error-logfile - --log-level info" |
|
}, |
|
"timestamp": "2026-05-21T00:18:30.000187+00:00", |
|
"test_file": "/private/tmp/worldarchitect-pr6960/testing_mcp/test_level_up_planning_block_purity.py" |
|
}, |
|
"summary": { |
|
"total_scenarios": 2, |
|
"passed": 2, |
|
"failed": 0, |
|
"campaign_capture_total": 1, |
|
"campaign_capture_passed": 1, |
|
"campaign_capture_failed": 0, |
|
"raw_passed": 1, |
|
"raw_total": 1, |
|
"raw_pass_rate": "100.0%" |
|
} |
|
} |