Walid-Ahmed committed on
Commit
d059dbe
·
verified ·
1 Parent(s): 4837fdc

Upload tokenizer

Browse files
special_tokens_map.json CHANGED
@@ -8,9 +8,21 @@
8
  ">>ANSWER<<",
9
  ">>QUESTION<<",
10
  ">>DOMAIN<<",
11
- ">>PREFIX<<",
12
- ">>SUFFIX<<",
13
- ">>MIDDLE<<"
 
 
 
 
 
 
 
 
 
 
 
 
14
  ],
15
  "eos_token": {
16
  "content": "<|endoftext|>",
 
8
  ">>ANSWER<<",
9
  ">>QUESTION<<",
10
  ">>DOMAIN<<",
11
+ ">>EMAIL_ADDRESS<<",
12
+ ">>IP_ADDRESS<<",
13
+ "<|startoftext|>",
14
+ ">>IP_ADDRESS_0<<",
15
+ ">>IP_ADDRESS_1<<",
16
+ ">>IP_ADDRESS_2<<",
17
+ ">>IP_ADDRESS_3<<",
18
+ ">>IP_ADDRESS_4<<",
19
+ ">>IP_ADDRESS_5<<",
20
+ ">>IP_ADDRESS_6<<",
21
+ ">>IP_ADDRESS_7<<",
22
+ ">>IP_ADDRESS_8<<",
23
+ ">>IP_ADDRESS_9<<",
24
+ ">>PASSWORD<<",
25
+ ">>KEY<<"
26
  ],
27
  "eos_token": {
28
  "content": "<|endoftext|>",
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
The diff for this file is too large to render. See raw diff