-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrq4.sh
More file actions
22 lines (20 loc) · 1.24 KB
/
rq4.sh
File metadata and controls
22 lines (20 loc) · 1.24 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
# Evaluates the codellama13b baseline, stdft and morepair variants on
# Defects4J (via test_d4j.py) and on SWE-bench (via the
# swebench.harness.run_evaluation module, run from swebench_result/), then
# prints the last 5 lines of every log written to logs/.
#
# Usage: run from the directory that contains test_d4j.py and
# swebench_result/. A failing evaluation does not stop the remaining ones.

# Absolute path, so redirections still land in the top-level logs/ directory
# after the working directory changes to swebench_result/.
log_dir="$PWD/logs"

# Make sure directory $1 exists and remove the (non-hidden) files in it.
# Unlike `rm dir/* || mkdir dir`, this is quiet when the directory already
# exists but is empty.
reset_dir() {
  mkdir -p -- "$1" || exit 1
  rm -f -- "$1"/*
}

reset_dir tmp
reset_dir "$log_dir"

for variant in baseline stdft morepair; do
  echo "evaluating codellama13b-${variant} on defects4j"
  python3 test_d4j.py -m "$variant" -n 10 \
    > "${log_dir}/d4j-codellama13b-${variant}.log"
done

# Subshell: the directory change is scoped to the SWE-bench runs, and a failed
# cd cannot leave the summary loop below running from the wrong directory.
(
  cd swebench_result || {
    printf 'cannot cd to swebench_result; skipping swebench evaluation\n' >&2
    exit 1
  }
  for variant in baseline stdft morepair; do
    echo "evaluating codellama13b-${variant} on swebench"
    python3 -m swebench.harness.run_evaluation --dataset SWE-Bench \
      --predictions_path "patches/${variant}.jsonl" --max_worker 16 \
      --run_id "$variant" --timeout 900 \
      > "${log_dir}/swe-codellama13b-${variant}.log"
  done
)

# Summary: "<log name> : " followed by the last 5 lines of that log.
for log_file in "$log_dir"/*.log; do
  # With no logs the glob stays literal; skip instead of tailing a bogus path.
  [ -e "$log_file" ] || continue
  printf '%s : ' "$(basename "$log_file")"
  tail -n 5 "$log_file"
done