Skip to content

Commit b4d2758

Browse files
committed
fix: update run example
1 parent cc814a3 commit b4d2758

File tree

1 file changed

+7
-5
lines changed

1 file changed

+7
-5
lines changed

run.sh

Lines changed: 7 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,8 @@ BACKEND=openai
55
TEMP=0
66
N_SAMPLES=1
77
NUM_GPU=1
8-
SUBSET=instruct
8+
SPLIT=complete
9+
SUBSET=hard
910
if [[ $MODEL == *"/"* ]]; then
1011
ORG=$(echo $MODEL | cut -d'/' -f1)--
1112
BASE_MODEL=$(echo $MODEL | cut -d'/' -f2)
@@ -18,20 +19,21 @@ FILE_HEADER=$ORG$BASE_MODEL--$DATASET-$SUBSET--$BACKEND-$TEMP-$N_SAMPLES
1819

1920
echo $FILE_HEADER
2021
bigcodebench.generate \
21-
--id_range 0 1 \
2222
--tp $NUM_GPU \
2323
--model $MODEL \
2424
--bs $BS \
2525
--temperature $TEMP \
2626
--n_samples $N_SAMPLES \
2727
--resume \
28+
--split $SPLIT \
2829
--subset $SUBSET \
29-
--backend $BACKEND
30+
--backend $BACKEND \
31+
--trust_remote_code
3032

3133
bigcodebench.sanitize --samples $FILE_HEADER.jsonl --calibrate
3234

3335
# Check if the ground truth works on your machine
34-
bigcodebench.evaluate --subset $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl
36+
bigcodebench.evaluate --split $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl
3537

3638
# If the execution is slow:
37-
bigcodebench.evaluate --subset $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl --parallel 32
39+
bigcodebench.evaluate --split $SUBSET --samples $FILE_HEADER-sanitized-calibrated.jsonl --parallel 32

0 commit comments

Comments
 (0)