d10ecd7 f4973d4 d10ecd7
1
2
3
4
5
6
7
# Quick probe of the tokenizer exposed by the project's vocab.baichuan module.
from vocab.baichuan import tokenizer

# Encode the literal text "<pad>" and keep whatever the tokenizer returns.
# NOTE(review): presumably this checks whether "<pad>" maps to a single
# special-token id -- confirm against the tokenizer's vocabulary.
id1 = tokenizer.encode("<pad>")

# Decode the single id 125696 back to text.
# NOTE(review): the meaning of id 125696 is not visible here (it may sit at or
# past the end of the vocabulary) -- verify before relying on token1.
token1 = tokenizer.decode(125696)