docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T192706Z-fa3d55b7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T192713Z-e945ce88.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T192720Z-56a1def6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T192727Z-08e8e21b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T192735Z-7969742a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T192743Z-d801507b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T192752Z-44803cf2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T192759Z-f2644ae5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/OpenPipe__ART/2/results/20260606T192814Z-053577cb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T192826Z-7c057241.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T192940Z-cbdf1723.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T192946Z-0c24ab43.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T192953Z-412028ef.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T193001Z-f1fdd17d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T193008Z-020e4c9e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T193014Z-5970fcd8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T193021Z-9688d757.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T193029Z-6d58679c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T101515Z-7ed4d3a9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T193036Z-4fb673af.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T101524Z-5741b175.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T101530Z-d6531dcf.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T101537Z-44a37946.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T101544Z-a02bcf06.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T101551Z-dfb15086.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T193058Z-c414193e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T101609Z-f1b4f1fd.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T101625Z-cbdc2964.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T101640Z-627fc75e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T101651Z-4e909d86.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T101659Z-f6d5e289.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T193105Z-3363751b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T101722Z-faf51e98.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T101729Z-2f7ed473.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T101743Z-3d58ba0a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T101750Z-9c8f143b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T101756Z-2b9a6d0a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T193621Z-c55e29ee.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T101805Z-10a8d07c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T101830Z-e662bafb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T101903Z-6421e821.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T101910Z-c83cee1f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T101917Z-dbee8cb3.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T193629Z-f2f30aea.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T101939Z-d1fdce05.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T101947Z-742cfd9a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T101954Z-81022664.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T102000Z-d621608d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T102009Z-46e82c0a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T193636Z-415ada94.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T102016Z-ed1ece6f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T102023Z-6a536eaa.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T102037Z-cdbe3e2a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T102051Z-7854e51c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T102058Z-13c3d323.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T193643Z-d74f0ee4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T102106Z-1b60a29d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T102115Z-577ff86e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T102128Z-34002575.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T102142Z-a18b96bf.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T102148Z-76096f70.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T193651Z-94cd12a1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T102205Z-52668c1a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T102222Z-9125c928.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T102241Z-136708f1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T102256Z-8de4f0cc.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T102310Z-53fe977f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T193701Z-8be78985.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T102320Z-b06f086b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T102336Z-91401b72.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T102351Z-21070d95.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T102405Z-48418618.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T102413Z-acbdbae1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T193709Z-e12e9efb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T102426Z-e8e724c7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T102434Z-8a39886e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T102443Z-1fde2f40.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T102451Z-744bf274.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T102458Z-f609af0f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T193717Z-e972fab4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T102507Z-34b4ed83.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T102515Z-6201318d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T102522Z-31372d7b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T102529Z-d5800af2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T102536Z-3b5fef6c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T193727Z-e4f32d47.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T102630Z-e76974eb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T102637Z-29454469.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T102644Z-e5d876b8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T102653Z-e14e2977.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T102707Z-952beb7b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T193733Z-4af2ff57.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T102719Z-bf1cecb0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T102746Z-7c4cd752.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T102759Z-e8db9893.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T102830Z-102cff8c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T102850Z-f36fd3ed.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T193741Z-0997a779.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/29/results/20260606T102905Z-c1438fee.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/29/results/20260606T102914Z-206c34be.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/29/results/20260606T102920Z-f15340cb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/29/results/20260606T102927Z-2e34e55b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/29/results/20260606T102934Z-fd28ff53.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/29/results/20260606T193748Z-39726fc9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T102940Z-53ebe875.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T102953Z-2679cc9d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T103000Z-c3501029.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T103007Z-deb57328.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T103013Z-ee3a925c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T193756Z-422a9156.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T103022Z-4dbdda67.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T103029Z-da9ac93a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T103043Z-b1aa5085.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T103050Z-5889c9a6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T103056Z-211c545a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T193804Z-1a2b75a9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T103103Z-695946c3.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T103113Z-8edab5f6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T103120Z-1744579c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T103129Z-5afc7c7a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T103141Z-b9e18370.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T193813Z-1f9337b0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T103215Z-6db3616b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T103224Z-57fe00a5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T103240Z-3c677004.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T103336Z-02a08597.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T103343Z-02001071.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T195448Z-3463d78a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T103351Z-93a05f5a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T103358Z-44eedc6c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T103412Z-48a8a949.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T103418Z-5f363db9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T103424Z-ac3f0d5e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane-opaque/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T195455Z-c27998d7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T091410Z-266d669c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T091417Z-c38664cb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T091438Z-71a58b37.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T091501Z-98cd2649.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T091510Z-131afc75.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T192144Z-e22b640e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T091520Z-a493382f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T091528Z-c0faf563.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T091538Z-9fc30ce1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T091553Z-95121682.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T091618Z-db35460d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T192153Z-697e19dd.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T091627Z-2a10bb83.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T091712Z-7e856129.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T091719Z-9172b62d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T091726Z-52aeb333.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T091736Z-c8a1b204.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T192200Z-f27c0e4e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T091743Z-f4b89917.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T091752Z-80211b15.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T091759Z-dae5444d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T091807Z-1772b2b8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T091815Z-fff73a0c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T192206Z-2345fdd4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T091822Z-b5d0f5ff.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T091829Z-344bf12d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T091835Z-88152199.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T091841Z-c446658e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T091847Z-c508edfb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T192214Z-e54d3fa7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T091902Z-5bf817e5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T091915Z-2ed6a16c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T091925Z-08988dbe.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T091933Z-1af2541c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T091941Z-99502fd5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T192222Z-7c6e1582.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T092031Z-05f9bf15.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T092045Z-ac50a7fd.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T092101Z-71c62c30.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T092122Z-27008f40.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T092137Z-85ac0f7a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T192230Z-3aef9dbc.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T092157Z-d4cff6ac.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T092219Z-5e9b100e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T092235Z-f84c4a62.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T092255Z-3e0a1b4c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T092310Z-0de4d29d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T192247Z-b5190dcb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/2/results/20260606T092326Z-264dd645.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/2/results/20260606T092334Z-3703bb60.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/2/results/20260606T092351Z-88cdbb94.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/2/results/20260606T092407Z-b7439be0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/2/results/20260606T092415Z-e3916514.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/2/results/20260606T192257Z-aa7244e1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T092433Z-a55676f5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T092440Z-32a86318.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T092455Z-40415d19.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T092511Z-b62ab9f0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T092519Z-18821941.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T192312Z-854a2731.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T092536Z-edb96a63.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T092545Z-adb20925.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T092552Z-89d7a933.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T092603Z-74f516fa.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T092610Z-1a5440e1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T192319Z-9b4434c2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T092620Z-2c78c916.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T092632Z-54fd6fc5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T092640Z-58b9c4e8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T092649Z-80b913fc.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T092701Z-bb4b0735.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T192330Z-dafd091a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T092716Z-008962e9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T092733Z-63565aab.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T092749Z-08c6f4b8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T092806Z-74283139.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T092839Z-c2016b6f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T192338Z-73c5833f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T092847Z-b7a0f80e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T092901Z-211030d8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T092914Z-f66a886a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T092931Z-348168bd.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T092948Z-c1f18916.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T192346Z-dfd58f86.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T092955Z-6d0c364d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T093022Z-299c3cdc.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T093032Z-5796a57c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T093043Z-906739b4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T093053Z-85371098.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T192352Z-6a81f964.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T093108Z-415f892b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T093135Z-e10811f6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T093147Z-dccc1684.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T093200Z-c32c7f11.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T093214Z-48d4a1d5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T192359Z-aa676a30.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T093233Z-77648e49.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T093240Z-1935394e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T093248Z-9bb273f1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T093255Z-25de3534.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T093301Z-458289a1.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T192406Z-8ac679ec.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T093318Z-ef5b658d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T093325Z-95dfd9ff.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T093340Z-fd1eda5b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T093347Z-adc70e0d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T093359Z-3110ecf2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T192413Z-e8f7e2a9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T093430Z-50df6994.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T093452Z-3ca3baff.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T093505Z-0cdb81c4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T093519Z-0c916eb5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T093532Z-5278f029.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T192420Z-89ebb002.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T093543Z-9b774460.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T093552Z-de77a99b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T093603Z-6a260f2d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T093609Z-51e95535.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T093616Z-6eacf0d4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T192431Z-cab90571.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T093632Z-aa9df0d9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T093647Z-e4dc530f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T093704Z-108cf64a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T093717Z-715110e2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T093725Z-215adcc4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T192440Z-75e5593a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T093741Z-753b21a7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T093747Z-afa1d246.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T093803Z-1e00bf1a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T093818Z-8d3a2efa.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T093825Z-c92080ce.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T192446Z-dd5cc537.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T093834Z-b1ad03c0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T093856Z-f1fe2fe8.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T093910Z-4bab3b0a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T093928Z-775dd732.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T093943Z-29ea8c4a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T192454Z-ba9c9fea.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T094002Z-9301980d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T094010Z-2d53f64e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T094022Z-82be70db.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T094035Z-ffd252b2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T094052Z-4d841b40.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T192502Z-14b32f02.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T094059Z-b6bb104f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T094106Z-e0ea8076.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T094122Z-ced1e4c6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T094138Z-d3139de6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T094145Z-92986c57.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T192511Z-82d3dd65.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T094153Z-0693c7bc.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T094201Z-f1376c18.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T094213Z-278a5566.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T094227Z-27f33b85.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T094234Z-ab065224.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T192518Z-a6bc7d45.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T094255Z-67769388.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T094315Z-2e8d2af6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T094336Z-18dc80e4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T094352Z-406ee3de.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T094408Z-156c978f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T192529Z-f4a1f1f0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T094418Z-5c62ba8d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T094433Z-aa8c60d7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T094456Z-17b3cb5b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T094514Z-3749cd11.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T094522Z-389fe6ea.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T192536Z-6416abdd.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T094535Z-15c6d88a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T094542Z-27351b5e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T094550Z-4dd5f9cb.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T094602Z-b297fb23.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T094610Z-40bd3e8a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T192545Z-deb85250.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T094619Z-1c11c3dd.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T094627Z-3856b5a6.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T094636Z-1d77c743.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T094643Z-00bab359.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T094651Z-69ea69c9.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T192552Z-534c131e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T094705Z-d8af7c38.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T094713Z-7b786ae5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T094720Z-571049a5.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T094729Z-bb57699d.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T094735Z-5a9fb9c3.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T192559Z-35d0d12c.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T094748Z-855fd03e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T094808Z-18f4acef.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T094822Z-c677ed06.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T094830Z-c41a8c7e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T094901Z-4def8b18.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T192606Z-1415f15f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/29/results/20260606T094919Z-97c6839f.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/29/results/20260606T094930Z-1be6f073.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/29/results/20260606T094939Z-9eccf079.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/29/results/20260606T094950Z-6dc122ea.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/29/results/20260606T095000Z-c0e59385.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/29/results/20260606T192613Z-05b80e72.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T095007Z-fafab577.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T095019Z-47ea19c0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T095031Z-ac7d0c67.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T095041Z-b2ec9ce0.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T095052Z-0f197c3a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T192620Z-9ee226b3.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T095100Z-b15a3fc2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T095107Z-b4aa2513.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T095114Z-65b4b0b4.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T095121Z-d31f8333.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T095127Z-6b60a6a3.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T192628Z-f1cfd7be.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T095136Z-a54a1110.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T095145Z-292666d7.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T095155Z-e4a48aab.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T095202Z-bbb64861.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T095215Z-d7276e16.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T192636Z-f225ea04.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T095251Z-cce40b4e.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T095300Z-cb05c7a2.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T095308Z-19915f8b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T095315Z-2df7a39a.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T095322Z-a0ec53ff.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T192650Z-dc345404.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T095330Z-b7a63b93.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T095337Z-0d159a3b.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T095349Z-bb926f28.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T095401Z-e67a9d58.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T095407Z-719d8a75.json
docs/eval_runs/full/20260606T_clean190_llama/actplane/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T192658Z-f8468c35.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T191129Z-53af3c4f.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T191147Z-df136cc5.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T191203Z-421f1fa5.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T191218Z-4ae36637.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T191224Z-f071d106.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T191231Z-19b4e108.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T191236Z-8a1c3158.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T191242Z-9df9b918.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/OpenPipe__ART/2/results/20260606T191256Z-649eeec9.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T191315Z-5d346f3e.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T191321Z-5b130104.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T191326Z-2cefba8a.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T191332Z-c63fb309.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T191338Z-ac50656e.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T191342Z-392a2145.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T191345Z-c47c5e8e.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T191400Z-40ea2ed6.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T191404Z-8841e3f6.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T191408Z-fa402bc0.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T191416Z-c88accae.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T191424Z-dd55d349.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T191428Z-04962c3b.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T191432Z-5cd84637.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T191437Z-14cfd345.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T191442Z-6a25babf.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T191446Z-3d5e40d9.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T191454Z-e3e26fcd.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T191459Z-13774286.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T191505Z-8e45020a.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T191513Z-181805bf.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T191517Z-9719f866.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T191522Z-09baef7c.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/ruvnet__ruflo/29/results/20260606T191527Z-1294b78b.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T191531Z-8ccab9ed.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T191907Z-a27d920e.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T191914Z-a4b61548.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T191924Z-d61af8ef.json
docs/eval_runs/full/20260606T_clean190_llama/prompt-filter/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T191929Z-07973471.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260606T191933Z-6be691d0.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260606T191940Z-49a72331.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260606T191942Z-157f2ee7.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260606T191944Z-480bb686.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260606T191948Z-aac9e178.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/NousResearch__hermes-agent/29/results/20260606T191951Z-4672408b.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260606T191955Z-fd6225a5.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260606T191959Z-8cb6abec.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/OpenPipe__ART/2/results/20260606T192002Z-cb621c6a.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260606T192006Z-22ce1edb.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/OpenPipe__ART/uv_managed_dependencies/results/20260606T192010Z-ade61174.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/alibaba__OpenSandbox/7/results/20260606T192012Z-b223e8e3.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/alibaba__OpenSandbox/kubernetes_apis_make_manifests_generate/results/20260606T192015Z-3b606399.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/alibaba__OpenSandbox/sdk_generated_output_not_only_fix/results/20260606T192019Z-e01291e5.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/browser-use__browser-harness/agent-workspace-only/results/20260606T192021Z-c1bf97ad.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/browser-use__browser-harness/direct-browser-harness-cli/results/20260606T192024Z-698c922d.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/code-yeongyu__oh-my-openagent/53/results/20260606T192027Z-b451a1ab.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/code-yeongyu__oh-my-openagent/bun-only-runtime/results/20260606T192030Z-49664d56.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/code-yeongyu__oh-my-openagent/platform-binaries-generated/results/20260606T192033Z-5aa82ca8.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/czlonkowski__n8n-mcp/41/results/20260606T192037Z-2ce3f04e.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/czlonkowski__n8n-mcp/no_committed_sensitive_test_env/results/20260606T192039Z-58d288d8.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/google__adk-python/generated-agentconfig-schema/results/20260606T192041Z-f2c3d0c1.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/google__adk-python/session-db-migration-root/results/20260606T192044Z-508e7813.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/openai__codex/app-server-v2-only/results/20260606T192048Z-b778ee41.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/openai__codex/generated-typescript-protocol/results/20260606T192051Z-bf737495.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/openai__openai-agents-python/generated-translated-docs-readonly/results/20260606T192054Z-471f0772.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/openai__openai-agents-python/repo-python-through-uv/results/20260606T192056Z-d547e295.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/openclaw__openclaw/generated-locale-protection/results/20260606T192100Z-3835123e.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/openclaw__openclaw/release-changelog-protection/results/20260606T192103Z-f3824deb.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/rohitg00__agentmemory/6/results/20260606T192107Z-09f6658c.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/rohitg00__agentmemory/agent-hooks-not-manual/results/20260606T192110Z-cfc1d5f1.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/rohitg00__agentmemory/container-entrypoints-only/results/20260606T192117Z-7f4f8487.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/ruvnet__ruflo/29/results/20260606T192120Z-fe06e93f.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/ruvnet__ruflo/no-root-workfiles/results/20260606T192123Z-57fb6f43.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/ruvnet__ruflo/read-before-edit/results/20260606T192126Z-4754526e.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/yusufkaraaslan__Skill_Seekers/68/results/20260606T192130Z-f6e94983.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/yusufkaraaslan__Skill_Seekers/local-fast-test-scope/results/20260606T192135Z-1ce83f5e.json
docs/eval_runs/full/20260606T_clean190_llama/tool-regex/docs/corpus-test/yusufkaraaslan__Skill_Seekers/pyproject-version-source/results/20260606T192138Z-acca848a.json
