Skip to content

Commit f93307f

Browse files
committed
nit
1 parent 801e387 commit f93307f

File tree

1 file changed

+5
-2
lines changed

1 file changed

+5
-2
lines changed

tokenizers/src/tokenizer/added_vocabulary.rs

+5 -2
Original file line number | Diff line number | Diff line change
@@ -465,7 +465,7 @@ impl AddedVocabulary {
465465
.slice(Range::Normalized(byte_offsets.0..byte_offsets.1))
466466
.expect("AddedVocabulary bad split");
467467
if let Some(id) = id {
468-
(slice, Some(vec![Token::new(id, String::new(), (0,))]))
468+
(slice, Some(vec![Token::new(id, String::new(), (0, 0))]))
469469
} else {
470470
(slice, None)
471471
}
@@ -537,7 +537,10 @@ impl AddedVocabulary {
537537
pretokenized
538538
.split(|_, mut sequence| {
539539
normalizer.map(|n| n.normalize(&mut sequence));
540-
Ok(self.split_with_indices(sequence, &self.split_normalized_trie_vec))
540+
Ok(self.split_with_indices(
541+
sequence,
542+
&self.split_normalized_trie_vec[hash_current_thread() % MAX_NUM_THREADS],
543+
))
541544
})
542545
.expect("AddedVocabulary bad split");
543546

0 commit comments

Comments
 (0)