docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260605T031525Z-71862c3f.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260605T031629Z-09ed6c51.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T032003Z-0dc16f50.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T032307Z-b7b92a4c.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T032522Z-0f2db426.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T033006Z-211a0e0a.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T033459Z-222ba586.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T033653Z-c1d57a4c.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T033712Z-f7bc5f99.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T033853Z-01d61c85.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T033906Z-33bcfa97.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T034153Z-1b42ee42.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T034240Z-6d699229.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T034327Z-394cd7e0.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T034414Z-0193d2d4.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T034700Z-5205acf5.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T034748Z-6f115116.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T034835Z-e97aca64.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T034923Z-4f79922e.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T035209Z-df69b6c9.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T035456Z-54c1a17c.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T035544Z-82d83868.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260605T035632Z-09db6054.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260605T035920Z-43906992.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T040007Z-7c5d0d8f.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T040055Z-d6897ac1.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T040142Z-6f83d018.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T040429Z-eec90648.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T040517Z-829e43ea.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T040605Z-186f3b12.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T040851Z-8a1ffd5a.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T040939Z-015f7921.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T041026Z-e9a81830.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T041211Z-9f85a639.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/29/results/20260605T041242Z-0ffd6f82.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/29/results/20260605T041245Z-a700b795.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T041255Z-dca6a931.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T041533Z-464c90d8.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T041822Z-85fcdfbd.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T041913Z-dd6042fb.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T041944Z-7b07cc85.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T042301Z-2963286b.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T042358Z-6cc67045.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T042645Z-4c55f19d.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T042734Z-3dc74e2a.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T042933Z-6b2e9cb6.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/OpenPipe__ART/2/results/20260605T042949Z-13840628.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/OpenPipe__ART/2/results/20260605T042958Z-2f19442c.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260605T043246Z-7f1457d5.json
docs/eval_runs/baseline/20260605T031337Z/prompt-only/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260605T043334Z-9a774cd9.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260605T072354Z-dfffb274.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/6/results/20260605T072510Z-1a92f964.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T072629Z-6a804068.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T072725Z-d71c2f6c.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T072813Z-c5e2521c.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T072816Z-7c94acf9.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s01_use_uv_run/results/20260605T072958Z-e8d4f3e7.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T073008Z-11632367.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T073015Z-b326a526.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T073048Z-d4975c44.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T073058Z-bf605ea1.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/Alishahryar1__free-claude-code/s02_no_type_ignores/results/20260605T073140Z-8f541a16.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T073207Z-c9e86206.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T073312Z-885ad15b.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T073350Z-e5b7e2c5.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T073503Z-72b5a3cf.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/third-party-barrel-imports/results/20260605T073508Z-2eed22a0.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T073531Z-9d9aebc6.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T073555Z-6e578bfc.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T073926Z-dc274c90.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T074650Z-fce345f3.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/ChromeDevTools__chrome-devtools-mcp/tool-schema-flat-zod/results/20260605T074738Z-84eb42a5.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260605T074825Z-f7bbee89.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/19/results/20260605T075113Z-250a1398.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T075201Z-8a2c109f.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T075250Z-2117438e.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T075536Z-3ec61b96.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T075624Z-dcd0406d.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s01_private_vulnerability_reporting/results/20260605T075712Z-d6059656.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T075959Z-0978765e.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T080047Z-4ec2f05d.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T080135Z-b6b639e4.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T080421Z-765299ae.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NVIDIA__NemoClaw/s02_no_new_javascript_sources/results/20260605T080509Z-781b0e55.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/29/results/20260605T080757Z-36d58e06.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/29/results/20260605T080845Z-be462812.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T080935Z-9abf8786.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T081226Z-fe557f5d.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T081314Z-1642f64f.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T081605Z-86a7541f.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s01_use_test_wrapper/results/20260605T081656Z-f5b3602c.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T081746Z-32f62871.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T082141Z-2c6064f0.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T082428Z-a5a30465.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T082518Z-3fe325d5.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/NousResearch__hermes-agent/s02_keep_credentials_out_of_repo/results/20260605T082608Z-674ba000.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/OpenPipe__ART/2/results/20260605T082856Z-a27246e8.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/OpenPipe__ART/2/results/20260605T082944Z-45d002be.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260605T083231Z-9f625d87.json
docs/eval_runs/baseline/20260605T031337Z/tool-regex/docs/corpus-test/OpenPipe__ART/prek_before_commit/results/20260605T083318Z-73d464a1.json
