Skip to content

Commit 52fceb8

Browse files
authored
Replace <|endoftext|> with constant (#186)
1 parent cc1848c commit 52fceb8

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

tiktoken_ext/openai_public.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@ def gpt2():
 "explicit_n_vocab": 50257,
 "pat_str": r"""'s|'t|'re|'ve|'m|'ll|'d| ?\p{L}+| ?\p{N}+| ?[^\s\p{L}\p{N}]+|\s+(?!\S)|\s+""",
 "mergeable_ranks": mergeable_ranks,
-"special_tokens": {"<|endoftext|>": 50256},
+"special_tokens": {ENDOFTEXT: 50256},
 }
 
 
0 commit comments

Comments
 (0)