Canstralian committed on
Commit
40d9120
·
verified ·
1 Parent(s): b1a4eb5

Create tokenizers/vocab.json

Browse files
Files changed (1) hide show
  1. tokenizers/vocab.json +22 -0
tokenizers/vocab.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "[PAD]": 0,
3
+ "[UNK]": 1,
4
+ "[CLS]": 2,
5
+ "[SEP]": 3,
6
+ "the": 4,
7
+ "to": 5,
8
+ "and": 6,
9
+ "in": 7,
10
+ "of": 8,
11
+ "a": 9,
12
+ "is": 10,
13
+ "it": 11,
14
+ "you": 12,
15
+ "for": 13,
16
+ "that": 14,
17
+ "with": 15,
18
+ "this": 16,
19
+ "on": 17,
20
+ "was": 18,
21
+ "at": 19
22
+ }