docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260610T212455Z-704019a1.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260610T212500Z-031c9cc1.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260610T212504Z-f40edf53.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260610T212511Z-53b18c56.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260610T212536Z-6ea9dbf1.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260610T212540Z-52a07940.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260610T212544Z-7da2ea74.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260610T212556Z-457bbb81.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260610T212603Z-7d339931.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260610T212620Z-4ceae150.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260610T212625Z-92f5101a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260610T212629Z-67032e2d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260610T212632Z-9d264b12.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260610T212636Z-8c8dbca9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260610T212638Z-9f82ee80.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260610T212641Z-163b548e.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260610T212647Z-33fa8134.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260610T212650Z-8cdbb0ac.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260610T212656Z-18802363.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260610T212702Z-bf24cc29.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260610T212704Z-a793c4a0.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260610T212709Z-2bcdfa89.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260610T212711Z-289e4faa.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260610T212714Z-6f611561.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260610T212801Z-1b5998a5.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/29/results/20260610T212809Z-a4bc2a2b.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/29/results/20260610T212820Z-eb040107.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/29/results/20260610T212827Z-59ce9058.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/29/results/20260610T212830Z-917b7397.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/29/results/20260610T212849Z-4af9f7dc.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260610T212906Z-57272639.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260610T212921Z-841bdf78.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260610T212933Z-6a1241b9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260610T212952Z-7a73eb96.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260610T212959Z-76e5d3f2.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260610T213003Z-ec714947.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260610T213007Z-f45e88b9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260610T213012Z-f06fafd3.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260610T213023Z-b9364249.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260610T213032Z-4a3432bf.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/2/results/20260610T213040Z-06226d53.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/2/results/20260610T213050Z-84d17cea.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/2/results/20260610T213052Z-9ba8426a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/2/results/20260610T213054Z-c59d79ff.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/2/results/20260610T213101Z-3df52dbd.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260610T213104Z-0414a743.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260610T213113Z-fdbd2f71.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260610T213117Z-0b64be9d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260610T213124Z-a5269b41.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260610T213127Z-deb04bde.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260610T213131Z-4493744f.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260610T213136Z-9a402558.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260610T213138Z-e32565b6.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260610T213150Z-4dda3571.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260610T213158Z-183837f9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/7/results/20260610T213201Z-8a2ad6de.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/7/results/20260610T213206Z-ebdf94be.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/7/results/20260610T213209Z-230f592e.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/7/results/20260610T213218Z-e422b322.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/7/results/20260610T213226Z-9b8458d2.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260610T213232Z-e3528fcb.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260610T213237Z-c8cc08a1.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260610T213253Z-7e6a44b0.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260610T213304Z-919cc287.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260610T213312Z-afc5a9ef.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260610T213322Z-3dc6fcfc.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260610T213326Z-a1a4fefa.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260610T213334Z-925a2177.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260610T213345Z-b35e469d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260610T213352Z-5ee3eb25.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260610T213357Z-cb4e28af.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260610T213401Z-64e639c6.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260610T213404Z-f6b6562a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260610T213407Z-4ea6dabe.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260610T213419Z-b13c4d73.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260610T213435Z-91efc669.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260610T213447Z-53177607.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260610T213452Z-606270e4.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260610T213459Z-f32c7406.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260610T213509Z-9653d64c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260610T213513Z-96cfd9f2.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260610T213515Z-6818fe0a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260610T213518Z-b9f17a98.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260610T213521Z-24966a66.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260610T213528Z-4dd82aa3.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260610T213543Z-505b64ab.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260610T213548Z-5ef4549a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260610T213605Z-23ea1076.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260610T213627Z-21649751.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260610T213635Z-61358ce7.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260610T213655Z-bfc60440.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260610T213657Z-14ed0a3a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260610T213703Z-473b39e0.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260610T213712Z-e65b017e.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260610T213722Z-3edc5870.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260610T213727Z-b1619628.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260610T213732Z-cd5e7dd7.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260610T213734Z-89148a4f.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260610T213743Z-58cdb137.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260610T213756Z-07408020.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260610T213759Z-bc630adb.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260610T213801Z-69532ece.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260610T213805Z-75107231.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260610T213815Z-5387ff81.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260610T213824Z-9a817504.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260610T213840Z-52cb25ce.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260610T213842Z-24443479.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260610T213845Z-4fbadb05.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260610T213850Z-705d6ae7.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260610T213919Z-1c4cee43.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260610T213947Z-4bb2bd45.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260610T213951Z-851fca73.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260610T214024Z-7361f078.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260610T214035Z-a48e2999.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260610T214038Z-91c426ea.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/app-server-v2-only/results/20260610T214053Z-443e5143.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/app-server-v2-only/results/20260610T214059Z-4c29c3d4.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/app-server-v2-only/results/20260610T214103Z-cfd68b75.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/app-server-v2-only/results/20260610T214110Z-11f187a5.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/app-server-v2-only/results/20260610T214123Z-46f3559d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260610T214133Z-b8ac58c4.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260610T214137Z-403ca03a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260610T214143Z-61db1bb9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260610T214151Z-b3073c2e.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260610T214204Z-b440e539.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260610T214212Z-87c6fa21.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260610T214215Z-35f14f83.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260610T214220Z-cd8e24ed.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260610T214224Z-d7dfc5e5.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260610T214228Z-dada4074.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260610T214239Z-54e5c412.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260610T214254Z-c2db0531.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260610T214300Z-4ed1f8c9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260610T214308Z-3688fdd7.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260610T214319Z-08d7c5bc.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260610T214327Z-fd291ac2.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260610T214332Z-1f0666fb.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260610T214335Z-03deb986.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260610T214347Z-e25a68f6.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260610T214455Z-078ba2b1.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260610T214502Z-a7ccda89.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260610T214506Z-1d03ac60.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260610T214509Z-74e1971d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260610T214516Z-7a64c03a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260610T214519Z-5879db2b.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/6/results/20260610T214523Z-87d4ed9a.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/6/results/20260610T214528Z-ac5e55f7.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/6/results/20260610T214533Z-dce4caa0.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/6/results/20260610T214548Z-f02ac57c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/6/results/20260610T214558Z-faac6f1c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260610T214615Z-ccfb99e2.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260610T214628Z-70132055.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260610T214630Z-432cc46f.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260610T214634Z-f7346093.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260610T214643Z-1480df64.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260610T214648Z-0dfd261c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260610T214654Z-55123f06.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260610T214657Z-cc341ad4.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260610T214714Z-7c019f75.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260610T214739Z-fa23eced.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/29/results/20260610T214742Z-39098185.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/29/results/20260610T214745Z-af9f3fb9.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/29/results/20260610T214748Z-0caf906c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/29/results/20260610T214752Z-7e1642df.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/29/results/20260610T214802Z-550b76fc.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260610T214856Z-98b0655b.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260610T214900Z-30a3a9d0.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260610T214904Z-22ef709d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260610T214909Z-e0c541f0.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260610T214919Z-8eeb49b6.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260610T214924Z-e625d40c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260610T214928Z-1ba59238.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260610T214931Z-2698778c.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260610T214939Z-d68724bf.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260610T214943Z-09d78ae3.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260610T214953Z-af9c94ca.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260610T214957Z-b647cf3b.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260610T215002Z-6567e21b.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260610T215012Z-afca517f.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260610T215017Z-ee25e3bd.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260610T215049Z-9e98ca54.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260610T215056Z-4544f879.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260610T215117Z-4743cd17.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260610T215135Z-0ea20403.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260610T215203Z-e4b2d4b4.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260610T215209Z-a01a4c1b.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260610T215214Z-b257d31d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260610T215221Z-918f678d.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260610T215225Z-42d03438.json
docs/eval_runs/full/20260607_current_full_after_trace_harness_fix/tool-ifc/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260610T215237Z-6cbe6b8a.json
