1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
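[default]
# Extend the default configuration
# NOTE(review): the table name and key were missing here and have been restored
# from context; confirm `extend-ignore-re` against the typos configuration reference.
extend-ignore-re = [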
# Allow tiktoken-specific terms
"tiktoken",
"gpt",
"openai",
"bpe",
# Allow Rust keywords
"mut",
"impl",
"struct",
"enum",
"fn",
"const",
"static",
"async",
"await",
# Allow runs of 8 or more hexadecimal digits
"[0-9a-fA-F]{8,}",
]
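[default.extend-words]
# Add project-specific words that should not be flagged as typos
# (a word mapped to itself is accepted as correctly spelled)
tiktoken = "tiktoken"
openai = "openai"
gpt = "gpt"
bpe = "bpe"
mergeable = "mergeable"
detokenization = "detokenization"
tokenization = "tokenization"
endoftext = "endoftext"
endofprompt = "endofprompt"
# BPE tokens that are legitimate but might be flagged as typos
nd = "nd"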
[files]
extend-exclude = [
"target/",
"*.lock",
"*.toml",
"*.json",
"*.md",
]