Skip to content

Commit 5026d82

Browse files
committed
Update the tests.
1 parent 378e4e4 commit 5026d82

File tree

2 files changed

+9 -2 lines changed

2 files changed

+9 -2 lines changed

tokenizers/src/models/bpe/serialization.rs

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -178,10 +178,14 @@ mod test {
178178
.build()
179179
.unwrap();
180180

181+
let legacy = r#"{"type":"BPE","dropout":null,"unk_token":"<unk>","continuing_subword_prefix":null,"end_of_word_suffix":null,"fuse_unk":false,"byte_fallback":false,"ignore_merges":true,"vocab":{"<unk>":0,"a":1,"b":2,"ab":3},"merges":["a b"]}"#;
182+
let legacy = serde_json::from_str(&legacy).unwrap();
183+
assert_eq!(bpe, legacy);
184+
181185
let data = serde_json::to_string(&bpe).unwrap();
182186
assert_eq!(
183187
data,
184-
r#"{"type":"BPE","dropout":null,"unk_token":"<unk>","continuing_subword_prefix":null,"end_of_word_suffix":null,"fuse_unk":false,"byte_fallback":false,"ignore_merges":true,"vocab":{"<unk>":0,"a":1,"b":2,"ab":3},"merges":["a b"]}"#
188+
r#"{"type":"BPE","dropout":null,"unk_token":"<unk>","continuing_subword_prefix":null,"end_of_word_suffix":null,"fuse_unk":false,"byte_fallback":false,"ignore_merges":true,"vocab":{"<unk>":0,"a":1,"b":2,"ab":3},"merges":[["a","b"]]}"#
185189
);
186190
let reconstructed = serde_json::from_str(&data).unwrap();
187191

tokenizers/src/models/mod.rs

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -312,11 +312,14 @@ mod tests {
312312
.unwrap();
313313

314314
let model = ModelWrapper::BPE(bpe);
315+
let legacy = r#"{"type":"BPE","dropout":null,"unk_token":"<unk>","continuing_subword_prefix":null,"end_of_word_suffix":null,"fuse_unk":false,"byte_fallback":false,"ignore_merges":true,"vocab":{"<unk>":0,"a":1,"b":2,"ab":3},"merges":["a b"]}"#;
316+
let legacy = serde_json::from_str(&legacy).unwrap();
317+
assert_eq!(model, legacy);
315318

316319
let data = serde_json::to_string(&model).unwrap();
317320
assert_eq!(
318321
data,
319-
r#"{"type":"BPE","dropout":null,"unk_token":"<unk>","continuing_subword_prefix":null,"end_of_word_suffix":null,"fuse_unk":false,"byte_fallback":false,"ignore_merges":true,"vocab":{"<unk>":0,"a":1,"b":2,"ab":3},"merges":["a b"]}"#
322+
r#"{"type":"BPE","dropout":null,"unk_token":"<unk>","continuing_subword_prefix":null,"end_of_word_suffix":null,"fuse_unk":false,"byte_fallback":false,"ignore_merges":true,"vocab":{"<unk>":0,"a":1,"b":2,"ab":3},"merges":[["a","b"]]}"#
320323
);
321324
let reconstructed = serde_json::from_str(&data).unwrap();
322325
assert_eq!(model, reconstructed);

0 commit comments

Comments
 (0)