Skip to content

Commit 262e9a7

Browse files
Use pretrained model for huggingface tokenizer and add equivalence test
1 parent b3bac7e commit 262e9a7

File tree

12 files changed

+251
-600204
lines changed

12 files changed

+251
-600204
lines changed

crates/bpe/benchmarks/Cargo.toml

Lines changed: 12 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,17 +1,26 @@
 1 |  1 |  [package]
 2 |    | -name = "bpe-benches"
   |  2 | +name = "bpe-benchmarks"
 3 |  3 |  edition = "2021"
 4 |  4 |
   |  5 | +[lib]
   |  6 | +path = "lib.rs"
   |  7 | +
 5 |  8 |  [[bench]]
 6 |  9 |  name = "performance"
 7 | 10 |  path = "performance.rs"
 8 | 11 |  harness = false
 9 | 12 |  test = false
10 | 13 |
11 |    | -[dev-dependencies]
   | 14 | +[[test]]
   | 15 | +name = "equivalence"
   | 16 | +path = "equivalence.rs"
   | 17 | +harness = true
   | 18 | +test = true
   | 19 | +
   | 20 | +[dependencies]
12 | 21 |  bpe = { path = "../../bpe", features = ["rand", "tiktoken-rs"] }
13 | 22 |  bpe-openai = { path = "../../bpe-openai" }
14 | 23 |  criterion = "0.5"
15 | 24 |  rand = "0.8"
16 | 25 |  tiktoken-rs = "0.5"
17 |    | -tokenizers = "0.20"
   | 26 | +tokenizers = { version = "0.20", features = ["http"] }

0 commit comments

Comments (0)