diff --git a/bindings/python/benches/bench_gpt2.py b/bindings/python/benches/bench_gpt2.py index 7809d643d..e6a64abe3 100755 --- a/bindings/python/benches/bench_gpt2.py +++ b/bindings/python/benches/bench_gpt2.py @@ -38,7 +38,7 @@ def benchmark_batch(documents: list[str]) -> None: readable_size, unit = format_byte_size(num_bytes / (end - start) * 1e9) print(f"tiktoken \t{readable_size} / s") - hf_enc = Tokenizer.from_pretrained("gpt2") + hf_enc = Tokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct") hf_enc.encode("warmup") start = time.perf_counter_ns()