Skip to content

Commit b2a14b6

Browse files
committed
add tokenizer_name argument for custom tokenizer
1 parent 32324d2 commit b2a14b6

File tree

1 file changed

+6
-3
lines changed

1 file changed

+6
-3
lines changed

bigcodebench/generate.py

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ def codegen(
3535

3636
if model.is_direct_completion() and subset == "instruct":
3737
raise Exception("Base model does not support direct completion for instruct tasks")
38-
38+
3939
# create save_path if it doesn't exist, e.g., a/b.jsonl
4040
dirname = os.path.dirname(save_path)
4141
if not os.path.exists(dirname) and dirname != "":
@@ -118,6 +118,8 @@ def main():
118118
parser.add_argument("--base_url", default=None, type=str)
119119
parser.add_argument("--tp", default=1, type=int)
120120
parser.add_argument("--trust_remote_code", action="store_true")
121+
parser.add_argument("--tokenizer_name", default=None, type=str)
122+
121123
args = parser.parse_args()
122124

123125

@@ -145,7 +147,8 @@ def main():
145147
temperature=args.temperature,
146148
base_url=args.base_url,
147149
tp=args.tp,
148-
trust_remote_code=args.trust_remote_code
150+
trust_remote_code=args.trust_remote_code,
151+
tokenizer_name=args.tokenizer_name
149152
)
150153

151154
if not args.save_path:
@@ -161,7 +164,7 @@ def main():
161164
strip_newlines=args.strip_newlines,
162165
n_samples=args.n_samples,
163166
resume=args.resume,
164-
id_range=args.id_range,
167+
id_range=args.id_range
165168
)
166169

167170

0 commit comments

Comments
 (0)