{python} {benchmark}/_parent/frontier_eval/evaluate_unified.py --benchmark-dir {benchmark} --candidate {candidate}
