openai/tiktoken

Public

mirrored from https://github.com/openai/tiktoken · Available

Code · Commits · Issues · Pull requests · Actions · Insights · Security
0.8.0

Branches

Tags

  • No tags available.
0 Branches · 0 Tags
Go to file
Add file
Code

Clone

HTTPS

Download ZIP

tests/test_pickle.py

23 lines · mode: code

1import tiktoken
2
3
def test_pickle():
    """Verify that encodings produce the same tokens after a pickle round trip.

    Two cases are exercised: the ``r50k_base`` encoding fetched by name, and
    an ``Encoding`` constructed by hand that carries one extra special token.
    """
    import pickle

    def round_trip(encoding):
        # Serialize and immediately deserialize the encoding object.
        return pickle.loads(pickle.dumps(encoding))

    sample = "hello world"

    # Case 1: an encoding looked up by name.
    enc_old = tiktoken.get_encoding("r50k_base")
    enc_new = round_trip(enc_old)
    assert enc_old.encode(sample) == enc_new.encode(sample)

    # Case 2: a hand-built encoding reusing the pattern and merge ranks of
    # the encoding above, plus a custom special token.
    enc_old = tiktoken.Encoding(
        name="custom_enc",
        pat_str=enc_old._pat_str,
        mergeable_ranks=enc_old._mergeable_ranks,
        special_tokens={"<|pickle|>": 100_000},
    )
    enc_new = round_trip(enc_old)
    assert enc_old.encode(sample) == enc_new.encode(sample)

    # The special token must map to its assigned id both before and after
    # the round trip.
    special_old = enc_old.encode("<|pickle|>", allowed_special="all")
    special_new = enc_new.encode("<|pickle|>", allowed_special="all")
    assert special_old == special_new == [100_000]
24