#######################################
# Print one summary line per task for every run directory that contains a
# results.json file.
#
# Each line has the form:
#   <task_id padded to 35> <PASS|FAIL> fail_mode=<failure_mode> run=<dir>/
#
# The Python program is fed through a quoted here-document so the shell never
# touches its quotes or braces, and the file path / run label are passed as
# argv instead of being spliced into the Python source.
#
# Arguments: $1 - runs directory (optional; defaults to the terminal-bench
#                 runs directory this snippet was written for)
# Outputs:   summary lines on stdout; a one-line warning on stderr for each
#            results.json that cannot be read or parsed
# Returns:   non-zero if the directory cannot be entered or any results.json
#            could not be processed, 0 otherwise
# Note:      changes the current working directory to the runs directory.
#######################################
aggregate_run_results() {
  local runs_dir=${1:-/Users/vatcheisahagian/UserData/VSCode/terminal-bench/runs}
  local d rj
  local rc=0

  cd -- "$runs_dir" || return

  for d in */; do
    # "$d" already ends with a slash, so append the file name directly.
    rj="${d}results.json"
    # Also skips the literal "*/" left behind when the glob matches nothing.
    [[ -f "$rj" ]] || continue

    python3 - "$rj" "$d" <<'PY' || rc=1
import json
import sys

path, run = sys.argv[1], sys.argv[2]

try:
    with open(path, encoding="utf-8") as f:
        report = json.load(f)
except (OSError, ValueError) as exc:
    # sys.exit(str) writes the message to stderr and exits with status 1.
    sys.exit("warning: skipping {}: {}".format(path, exc))

results = report.get("results") if isinstance(report, dict) else None
for t in results or []:
    if not isinstance(t, dict):
        continue
    status = "PASS" if t.get("is_resolved") else "FAIL"
    # !s stringifies first so a missing task_id (None) can still be padded.
    print("{!s:35} {:4} fail_mode={} run={}".format(
        t.get("task_id"), status, t.get("failure_mode"), run))
PY
  done

  return "$rc"
}

aggregate_run_results
# Aggregate all run results
# Unhandled node type: string
#######################################
# Print one summary line per task for every run directory that contains a
# results.json file.
#
# Each line has the form:
#   <task_id padded to 35> <PASS|FAIL> fail_mode=<failure_mode> run=<dir>/
#
# The Python program is fed through a quoted here-document so the shell never
# touches its quotes or braces, and the file path / run label are passed as
# argv instead of being spliced into the Python source.
#
# Arguments: $1 - runs directory (optional; defaults to the terminal-bench
#                 runs directory this snippet was written for)
# Outputs:   summary lines on stdout; a one-line warning on stderr for each
#            results.json that cannot be read or parsed
# Returns:   non-zero if the directory cannot be entered or any results.json
#            could not be processed, 0 otherwise
# Note:      changes the current working directory to the runs directory.
#######################################
aggregate_run_results() {
  local runs_dir=${1:-/Users/vatcheisahagian/UserData/VSCode/terminal-bench/runs}
  local d rj
  local rc=0

  cd -- "$runs_dir" || return

  for d in */; do
    # "$d" already ends with a slash, so append the file name directly.
    rj="${d}results.json"
    # Also skips the literal "*/" left behind when the glob matches nothing.
    [[ -f "$rj" ]] || continue

    python3 - "$rj" "$d" <<'PY' || rc=1
import json
import sys

path, run = sys.argv[1], sys.argv[2]

try:
    with open(path, encoding="utf-8") as f:
        report = json.load(f)
except (OSError, ValueError) as exc:
    # sys.exit(str) writes the message to stderr and exits with status 1.
    sys.exit("warning: skipping {}: {}".format(path, exc))

results = report.get("results") if isinstance(report, dict) else None
for t in results or []:
    if not isinstance(t, dict):
        continue
    status = "PASS" if t.get("is_resolved") else "FAIL"
    # !s stringifies first so a missing task_id (None) can still be padded.
    print("{!s:35} {:4} fail_mode={} run={}".format(
        t.get("task_id"), status, t.get("failure_mode"), run))
PY
  done

  return "$rc"
}

aggregate_run_results
# Aggregate all run results
# Unhandled node type: string