Thalesian committed on
Commit
72495d4
·
verified ·
1 Parent(s): 56cac06

End of training

Browse files
README.md CHANGED
@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  This model was trained from scratch on the None dataset.
16
  It achieves the following results on the evaluation set:
17
- - Loss: 0.1642
18
 
19
  ## Model description
20
 
@@ -37,7 +37,7 @@ The following hyperparameters were used during training:
37
  - train_batch_size: 128
38
  - eval_batch_size: 128
39
  - seed: 42
40
- - optimizer: Use adamw_torch_fused with betas=(0.826646043090655,0.991636944120939) and epsilon=3.4341677539323e-07 and optimizer_args=No additional optimizer arguments
41
  - lr_scheduler_type: linear
42
  - lr_scheduler_warmup_steps: 5000
43
  - num_epochs: 200
@@ -46,27 +46,43 @@ The following hyperparameters were used during training:
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:-----:|:---------------:|
49
- | 0.0263 | 1.0 | 3131 | 0.1478 |
50
- | 0.0254 | 2.0 | 6262 | 0.1588 |
51
- | 0.0248 | 3.0 | 9393 | 0.1532 |
52
- | 0.0243 | 4.0 | 12524 | 0.1565 |
53
- | 0.0237 | 5.0 | 15655 | 0.1578 |
54
- | 0.0235 | 6.0 | 18786 | 0.1584 |
55
- | 0.0245 | 7.0 | 21917 | 0.1604 |
56
- | 0.0242 | 8.0 | 25048 | 0.1560 |
57
- | 0.0236 | 9.0 | 28179 | 0.1594 |
58
- | 0.0234 | 10.0 | 31310 | 0.1635 |
59
- | 0.0229 | 11.0 | 34441 | 0.1582 |
60
- | 0.0226 | 12.0 | 37572 | 0.1618 |
61
- | 0.0223 | 13.0 | 40703 | 0.1606 |
62
- | 0.022 | 14.0 | 43834 | 0.1948 |
63
- | 0.0217 | 15.0 | 46965 | 0.1626 |
64
- | 0.0216 | 16.0 | 50096 | 0.1642 |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
 
66
 
67
  ### Framework versions
68
 
69
  - Transformers 4.51.3
70
- - Pytorch 2.8.0.dev20250425
71
- - Datasets 2.14.0
72
- - Tokenizers 0.21.1
 
14
 
15
  This model was trained from scratch on the None dataset.
16
  It achieves the following results on the evaluation set:
17
+ - Loss: 0.3609
18
 
19
  ## Model description
20
 
 
37
  - train_batch_size: 128
38
  - eval_batch_size: 128
39
  - seed: 42
40
+ - optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
41
  - lr_scheduler_type: linear
42
  - lr_scheduler_warmup_steps: 5000
43
  - num_epochs: 200
 
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:-----:|:---------------:|
49
+ | 0.1074 | 1.0 | 568 | 0.3485 |
50
+ | 0.108 | 2.0 | 1136 | 0.3540 |
51
+ | 0.106 | 3.0 | 1704 | 0.3306 |
52
+ | 0.1045 | 4.0 | 2272 | 0.3545 |
53
+ | 0.1052 | 5.0 | 2840 | 0.3218 |
54
+ | 0.1033 | 6.0 | 3408 | 0.3230 |
55
+ | 0.1023 | 7.0 | 3976 | 0.3480 |
56
+ | 0.0995 | 8.0 | 4544 | 0.4591 |
57
+ | 0.1 | 9.0 | 5112 | 0.3469 |
58
+ | 0.0978 | 10.0 | 5680 | 0.3328 |
59
+ | 0.0974 | 11.0 | 6248 | 0.3641 |
60
+ | 0.0965 | 12.0 | 6816 | 0.3167 |
61
+ | 0.0951 | 13.0 | 7384 | 0.3220 |
62
+ | 0.0953 | 14.0 | 7952 | 0.3034 |
63
+ | 0.0935 | 15.0 | 8520 | 0.3595 |
64
+ | 0.0934 | 16.0 | 9088 | 0.3090 |
65
+ | 0.0942 | 17.0 | 9656 | 0.2997 |
66
+ | 0.0939 | 18.0 | 10224 | 0.3231 |
67
+ | 0.0918 | 19.0 | 10792 | 0.3788 |
68
+ | 0.0933 | 20.0 | 11360 | 0.3888 |
69
+ | 0.0916 | 21.0 | 11928 | 0.5056 |
70
+ | 0.0907 | 22.0 | 12496 | 0.3029 |
71
+ | 0.0905 | 23.0 | 13064 | 0.3338 |
72
+ | 0.0898 | 24.0 | 13632 | 0.3883 |
73
+ | 0.0892 | 25.0 | 14200 | 0.4280 |
74
+ | 0.0884 | 26.0 | 14768 | 0.3281 |
75
+ | 0.0894 | 27.0 | 15336 | 0.3609 |
76
+ | 0.0879 | 28.0 | 15904 | 0.3560 |
77
+ | 0.0881 | 29.0 | 16472 | 0.3502 |
78
+ | 0.0873 | 30.0 | 17040 | 0.3961 |
79
+ | 0.0866 | 31.0 | 17608 | 0.3481 |
80
+ | 0.0864 | 32.0 | 18176 | 0.3609 |
81
 
82
 
83
  ### Framework versions
84
 
85
  - Transformers 4.51.3
86
+ - Pytorch 2.8.0.dev20250424
87
+ - Datasets 2.20.0
88
+ - Tokenizers 0.21.0
added_tokens.json CHANGED
@@ -1,47 +1,247 @@
1
  {
2
- "Elamite": 32109,
3
- "English:": 32120,
4
- "Hittite": 32136,
5
- "Translate": 32107,
6
- "ai": 32123,
7
- "am3": 32139,
8
- "bar8": 32140,
9
- "bi2": 32111,
10
- "complex": 32132,
11
- "cz": 32122,
12
- "de3": 32128,
13
- "e11": 32117,
14
- "e2": 32118,
15
- "esz": 32105,
16
- "et9": 32131,
17
- "ga5": 32125,
18
- "gestin'": 32137,
19
- "gi4": 32115,
20
- "gu2": 32103,
21
- "ita": 32134,
22
- "ket9": 32143,
23
- "lut": 32135,
24
- "mmed": 32114,
25
- "nis": 32133,
26
- "nn": 32116,
27
- "pil2": 32113,
28
- "qad": 32127,
29
- "ri2": 32144,
30
- "ru14": 32102,
31
- "sahar": 32129,
32
- "si11": 32101,
33
- "si×sa": 32124,
34
- "skal": 32106,
35
- "suen": 32108,
36
- "sz": 32110,
37
- "szum": 32130,
38
- "szuszin": 32142,
39
- "transliteration": 32138,
40
- "tu2": 32119,
41
- "u19": 32100,
42
- "uhaldi": 32121,
43
- "ummeda": 32126,
44
- "urus": 32112,
45
- "ut2": 32141,
46
- "ze2": 32104
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  }
 
1
  {
2
+ "±": 32211,
3
+ "→": 32101,
4
+ "โŒœ": 32246,
5
+ "โŒ": 32194,
6
+ "โ—": 32109,
7
+ "โŸฆ": 32281,
8
+ "โŸง": 32269,
9
+ "๐€€": 32172,
10
+ "๐€": 32237,
11
+ "๐€‚": 32300,
12
+ "๐€ƒ": 32244,
13
+ "๐€„": 32210,
14
+ "๐€…": 32169,
15
+ "๐€†": 32228,
16
+ "๐€‡": 32327,
17
+ "๐€ˆ": 32238,
18
+ "๐€‰": 32106,
19
+ "๐€Š": 32301,
20
+ "๐€‹": 32119,
21
+ "๐€": 32243,
22
+ "๐€Ž": 32187,
23
+ "๐€": 32284,
24
+ "๐€": 32295,
25
+ "๐€‘": 32339,
26
+ "๐€’": 32275,
27
+ "๐€“": 32333,
28
+ "๐€”": 32251,
29
+ "๐€•": 32276,
30
+ "๐€–": 32274,
31
+ "๐€—": 32166,
32
+ "๐€˜": 32120,
33
+ "๐€™": 32311,
34
+ "๐€š": 32104,
35
+ "๐€›": 32183,
36
+ "๐€œ": 32242,
37
+ "๐€": 32298,
38
+ "๐€ž": 32217,
39
+ "๐€Ÿ": 32272,
40
+ "๐€ ": 32174,
41
+ "๐€ก": 32115,
42
+ "๐€ข": 32320,
43
+ "๐€ฃ": 32204,
44
+ "๐€ค": 32315,
45
+ "๐€ฅ": 32277,
46
+ "๐€ฆ": 32157,
47
+ "๐€จ": 32283,
48
+ "๐€ฉ": 32165,
49
+ "๐€ช": 32205,
50
+ "๐€ซ": 32289,
51
+ "๐€ฌ": 32140,
52
+ "๐€ญ": 32232,
53
+ "๐€ฎ": 32112,
54
+ "๐€ฏ": 32341,
55
+ "๐€ฐ": 32207,
56
+ "๐€ฑ": 32152,
57
+ "๐€ฒ": 32213,
58
+ "๐€ณ": 32221,
59
+ "๐€ด": 32321,
60
+ "๐€ต": 32310,
61
+ "๐€ถ": 32198,
62
+ "๐€ท": 32241,
63
+ "๐€ธ": 32188,
64
+ "๐€น": 32208,
65
+ "๐€บ": 32324,
66
+ "๐€ผ": 32133,
67
+ "๐€ฝ": 32121,
68
+ "๐€ฟ": 32325,
69
+ "๐€": 32189,
70
+ "๐": 32279,
71
+ "๐‚": 32278,
72
+ "๐ƒ": 32323,
73
+ "๐„": 32250,
74
+ "๐…": 32286,
75
+ "๐†": 32177,
76
+ "๐‡": 32314,
77
+ "๐ˆ": 32159,
78
+ "๐‰": 32191,
79
+ "๐Š": 32132,
80
+ "๐‹": 32234,
81
+ "๐Œ": 32273,
82
+ "๐": 32291,
83
+ "๐": 32134,
84
+ "๐‘": 32293,
85
+ "๐’": 32224,
86
+ "๐“": 32190,
87
+ "๐”": 32261,
88
+ "๐•": 32105,
89
+ "๐–": 32285,
90
+ "๐—": 32260,
91
+ "๐˜": 32334,
92
+ "๐™": 32146,
93
+ "๐š": 32160,
94
+ "๐›": 32230,
95
+ "๐œ": 32184,
96
+ "๐": 32259,
97
+ "๐‚€": 32223,
98
+ "๐‚": 32305,
99
+ "๐‚‚": 32173,
100
+ "๐‚ƒ": 32258,
101
+ "๐‚„": 32127,
102
+ "๐‚…": 32192,
103
+ "๐‚†": 32265,
104
+ "๐‚‡": 32313,
105
+ "๐‚ˆ": 32144,
106
+ "๐‚‰": 32138,
107
+ "๐‚Š": 32330,
108
+ "๐‚‹": 32110,
109
+ "๐‚Œ": 32337,
110
+ "๐‚": 32107,
111
+ "๐‚Ž": 32236,
112
+ "๐‚": 32229,
113
+ "๐‚": 32199,
114
+ "๐‚‘": 32163,
115
+ "๐‚’": 32257,
116
+ "๐‚”": 32130,
117
+ "๐‚•": 32282,
118
+ "๐‚–": 32297,
119
+ "๐‚—": 32212,
120
+ "๐‚š": 32254,
121
+ "๐‚›": 32126,
122
+ "๐‚œ": 32249,
123
+ "๐‚": 32154,
124
+ "๐‚ž": 32145,
125
+ "๐‚Ÿ": 32149,
126
+ "๐‚ก": 32326,
127
+ "๐‚ข": 32186,
128
+ "๐‚ฃ": 32335,
129
+ "๐‚ฅ": 32142,
130
+ "๐‚ฆ": 32123,
131
+ "๐‚ง": 32171,
132
+ "๐‚จ": 32233,
133
+ "๐‚ฉ": 32268,
134
+ "๐‚ช": 32308,
135
+ "๐‚ซ": 32340,
136
+ "๐‚ฌ": 32181,
137
+ "๐‚ญ": 32216,
138
+ "๐‚ฎ": 32131,
139
+ "๐‚ฏ": 32218,
140
+ "๐‚ฐ": 32153,
141
+ "๐‚ฑ": 32332,
142
+ "๐‚ฒ": 32255,
143
+ "๐‚ณ": 32245,
144
+ "๐‚ด": 32267,
145
+ "๐‚ต": 32227,
146
+ "๐‚ถ": 32209,
147
+ "๐‚ท": 32182,
148
+ "๐‚ธ": 32316,
149
+ "๐‚น": 32240,
150
+ "๐‚บ": 32122,
151
+ "๐‚ป": 32225,
152
+ "๐‚ผ": 32124,
153
+ "๐‚ฝ": 32248,
154
+ "๐‚พ": 32262,
155
+ "๐‚ฟ": 32158,
156
+ "๐ƒ€": 32195,
157
+ "๐ƒ": 32125,
158
+ "๐ƒ‚": 32215,
159
+ "๐ƒ„": 32156,
160
+ "๐ƒ†": 32247,
161
+ "๐ƒ‡": 32136,
162
+ "๐ƒˆ": 32292,
163
+ "๐ƒ‰": 32290,
164
+ "๐ƒŠ": 32150,
165
+ "๐ƒŒ": 32118,
166
+ "๐ƒ": 32288,
167
+ "๐ƒŽ": 32256,
168
+ "๐ƒ": 32304,
169
+ "๐ƒ": 32344,
170
+ "๐ƒ‘": 32180,
171
+ "๐ƒ“": 32220,
172
+ "๐ƒ”": 32193,
173
+ "๐ƒ•": 32147,
174
+ "๐ƒ—": 32306,
175
+ "๐ƒ™": 32252,
176
+ "๐ƒš": 32176,
177
+ "๐ƒ›": 32179,
178
+ "๐ƒœ": 32168,
179
+ "๐ƒ": 32135,
180
+ "๐ƒž": 32100,
181
+ "๐ƒŸ": 32117,
182
+ "๐ƒ ": 32312,
183
+ "๐ƒก": 32151,
184
+ "๐ƒข": 32331,
185
+ "๐ƒฃ": 32164,
186
+ "๐ƒค": 32139,
187
+ "๐ƒฅ": 32309,
188
+ "๐ƒฆ": 32307,
189
+ "๐ƒง": 32264,
190
+ "๐ƒจ": 32328,
191
+ "๐ƒฉ": 32162,
192
+ "๐ƒช": 32196,
193
+ "๐ƒซ": 32338,
194
+ "๐ƒฌ": 32201,
195
+ "๐ƒญ": 32271,
196
+ "๐ƒฎ": 32342,
197
+ "๐ƒฏ": 32343,
198
+ "๐ƒฐ": 32280,
199
+ "๐ƒฑ": 32287,
200
+ "๐ƒฒ": 32302,
201
+ "๐ƒณ": 32102,
202
+ "๐ƒด": 32161,
203
+ "๐ƒต": 32329,
204
+ "๐ƒถ": 32231,
205
+ "๐ƒท": 32239,
206
+ "๐ƒธ": 32270,
207
+ "๐ƒน": 32206,
208
+ "๐„ˆ": 32317,
209
+ "๐„‰": 32116,
210
+ "๐„Š": 32294,
211
+ "๐„‹": 32170,
212
+ "๐„Œ": 32137,
213
+ "๐„": 32178,
214
+ "๐„Ž": 32226,
215
+ "๐„": 32203,
216
+ "๐„": 32108,
217
+ "๐„‘": 32336,
218
+ "๐„’": 32167,
219
+ "๐„“": 32103,
220
+ "๐„”": 32185,
221
+ "๐„•": 32129,
222
+ "๐„–": 32299,
223
+ "๐„—": 32235,
224
+ "๐„˜": 32111,
225
+ "๐„™": 32141,
226
+ "๐„š": 32296,
227
+ "๐„›": 32219,
228
+ "๐„œ": 32202,
229
+ "๐„": 32128,
230
+ "๐„ž": 32197,
231
+ "๐„Ÿ": 32319,
232
+ "๐„ก": 32200,
233
+ "๐„ข": 32303,
234
+ "๐„ฃ": 32318,
235
+ "๐„ค": 32214,
236
+ "๐„ฅ": 32322,
237
+ "๐„ง": 32155,
238
+ "๐„ช": 32143,
239
+ "๐„ซ": 32113,
240
+ "๐„ท": 32148,
241
+ "๐„ธ": 32263,
242
+ "๐„น": 32114,
243
+ "๐„บ": 32222,
244
+ "๐„ฝ": 32175,
245
+ "๐„พ": 32253,
246
+ "๐„ฟ": 32266
247
  }
config.json CHANGED
@@ -3,9 +3,9 @@
3
  "T5ForConditionalGeneration"
4
  ],
5
  "classifier_dropout": 0.0,
6
- "d_ff": 3072,
7
  "d_kv": 64,
8
- "d_model": 768,
9
  "decoder_start_token_id": 0,
10
  "dense_act_fn": "relu",
11
  "dropout_rate": 0.1,
@@ -17,9 +17,9 @@
17
  "layer_norm_epsilon": 1e-06,
18
  "model_type": "t5",
19
  "n_positions": 512,
20
- "num_decoder_layers": 12,
21
- "num_heads": 12,
22
- "num_layers": 12,
23
  "output_past": true,
24
  "pad_token_id": 0,
25
  "relative_attention_max_distance": 128,
@@ -56,5 +56,5 @@
56
  "torch_dtype": "float32",
57
  "transformers_version": "4.51.3",
58
  "use_cache": true,
59
- "vocab_size": 32145
60
  }
 
3
  "T5ForConditionalGeneration"
4
  ],
5
  "classifier_dropout": 0.0,
6
+ "d_ff": 2048,
7
  "d_kv": 64,
8
+ "d_model": 512,
9
  "decoder_start_token_id": 0,
10
  "dense_act_fn": "relu",
11
  "dropout_rate": 0.1,
 
17
  "layer_norm_epsilon": 1e-06,
18
  "model_type": "t5",
19
  "n_positions": 512,
20
+ "num_decoder_layers": 6,
21
+ "num_heads": 8,
22
+ "num_layers": 6,
23
  "output_past": true,
24
  "pad_token_id": 0,
25
  "relative_attention_max_distance": 128,
 
56
  "torch_dtype": "float32",
57
  "transformers_version": "4.51.3",
58
  "use_cache": true,
59
+ "vocab_size": 32345
60
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a662e6dd70560a686bab885b1e4e7fda2f1dd2f075201cd0aede21b02aefc579
3
- size 891696936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81b67ad53b8990a9fa4f5be0358ee894da8cbe75240a7a2ceffeaaff0d412450
3
+ size 242486312
runs/May01_13-02-37_Lees-MacBook-Pro.local/events.out.tfevents.1746126158.Lees-MacBook-Pro.local ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3009c494e16fc687693279d36ef0f380dea1543d96778554e5f15354244de465
3
+ size 22714
special_tokens_map.json CHANGED
@@ -101,7 +101,25 @@
101
  "<extra_id_98>",
102
  "<extra_id_99>"
103
  ],
104
- "eos_token": "</s>",
105
- "pad_token": "<pad>",
106
- "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
  }
 
101
  "<extra_id_98>",
102
  "<extra_id_99>"
103
  ],
104
+ "eos_token": {
105
+ "content": "</s>",
106
+ "lstrip": false,
107
+ "normalized": false,
108
+ "rstrip": false,
109
+ "single_word": false
110
+ },
111
+ "pad_token": {
112
+ "content": "<pad>",
113
+ "lstrip": false,
114
+ "normalized": false,
115
+ "rstrip": false,
116
+ "single_word": false
117
+ },
118
+ "unk_token": {
119
+ "content": "<unk>",
120
+ "lstrip": false,
121
+ "normalized": false,
122
+ "rstrip": false,
123
+ "single_word": false
124
+ }
125
  }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f850f1efc314e2a2fd3849c561d76d4742bf4cf53a646280b9f0f3bc5ea29d74
3
- size 2430283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e578db7613aa70d6461123b8983113a4b2449abeb718e43f7ebef37afb49973f
3
+ size 2466261
tokenizer_config.json CHANGED
@@ -826,7 +826,7 @@
826
  "special": true
827
  },
828
  "32100": {
829
- "content": "u19",
830
  "lstrip": false,
831
  "normalized": true,
832
  "rstrip": false,
@@ -834,7 +834,7 @@
834
  "special": false
835
  },
836
  "32101": {
837
- "content": "si11",
838
  "lstrip": false,
839
  "normalized": true,
840
  "rstrip": false,
@@ -842,7 +842,7 @@
842
  "special": false
843
  },
844
  "32102": {
845
- "content": "ru14",
846
  "lstrip": false,
847
  "normalized": true,
848
  "rstrip": false,
@@ -850,7 +850,7 @@
850
  "special": false
851
  },
852
  "32103": {
853
- "content": "gu2",
854
  "lstrip": false,
855
  "normalized": true,
856
  "rstrip": false,
@@ -858,7 +858,7 @@
858
  "special": false
859
  },
860
  "32104": {
861
- "content": "ze2",
862
  "lstrip": false,
863
  "normalized": true,
864
  "rstrip": false,
@@ -866,7 +866,7 @@
866
  "special": false
867
  },
868
  "32105": {
869
- "content": "esz",
870
  "lstrip": false,
871
  "normalized": true,
872
  "rstrip": false,
@@ -874,7 +874,7 @@
874
  "special": false
875
  },
876
  "32106": {
877
- "content": "skal",
878
  "lstrip": false,
879
  "normalized": true,
880
  "rstrip": false,
@@ -882,7 +882,7 @@
882
  "special": false
883
  },
884
  "32107": {
885
- "content": "Translate",
886
  "lstrip": false,
887
  "normalized": true,
888
  "rstrip": false,
@@ -890,7 +890,7 @@
890
  "special": false
891
  },
892
  "32108": {
893
- "content": "suen",
894
  "lstrip": false,
895
  "normalized": true,
896
  "rstrip": false,
@@ -898,7 +898,7 @@
898
  "special": false
899
  },
900
  "32109": {
901
- "content": "Elamite",
902
  "lstrip": false,
903
  "normalized": true,
904
  "rstrip": false,
@@ -906,7 +906,7 @@
906
  "special": false
907
  },
908
  "32110": {
909
- "content": "sz",
910
  "lstrip": false,
911
  "normalized": true,
912
  "rstrip": false,
@@ -914,7 +914,7 @@
914
  "special": false
915
  },
916
  "32111": {
917
- "content": "bi2",
918
  "lstrip": false,
919
  "normalized": true,
920
  "rstrip": false,
@@ -922,7 +922,7 @@
922
  "special": false
923
  },
924
  "32112": {
925
- "content": "urus",
926
  "lstrip": false,
927
  "normalized": true,
928
  "rstrip": false,
@@ -930,7 +930,7 @@
930
  "special": false
931
  },
932
  "32113": {
933
- "content": "pil2",
934
  "lstrip": false,
935
  "normalized": true,
936
  "rstrip": false,
@@ -938,7 +938,7 @@
938
  "special": false
939
  },
940
  "32114": {
941
- "content": "mmed",
942
  "lstrip": false,
943
  "normalized": true,
944
  "rstrip": false,
@@ -946,7 +946,7 @@
946
  "special": false
947
  },
948
  "32115": {
949
- "content": "gi4",
950
  "lstrip": false,
951
  "normalized": true,
952
  "rstrip": false,
@@ -954,7 +954,7 @@
954
  "special": false
955
  },
956
  "32116": {
957
- "content": "nn",
958
  "lstrip": false,
959
  "normalized": true,
960
  "rstrip": false,
@@ -962,7 +962,7 @@
962
  "special": false
963
  },
964
  "32117": {
965
- "content": "e11",
966
  "lstrip": false,
967
  "normalized": true,
968
  "rstrip": false,
@@ -970,7 +970,7 @@
970
  "special": false
971
  },
972
  "32118": {
973
- "content": "e2",
974
  "lstrip": false,
975
  "normalized": true,
976
  "rstrip": false,
@@ -978,7 +978,7 @@
978
  "special": false
979
  },
980
  "32119": {
981
- "content": "tu2",
982
  "lstrip": false,
983
  "normalized": true,
984
  "rstrip": false,
@@ -986,7 +986,7 @@
986
  "special": false
987
  },
988
  "32120": {
989
- "content": "English:",
990
  "lstrip": false,
991
  "normalized": true,
992
  "rstrip": false,
@@ -994,7 +994,7 @@
994
  "special": false
995
  },
996
  "32121": {
997
- "content": "uhaldi",
998
  "lstrip": false,
999
  "normalized": true,
1000
  "rstrip": false,
@@ -1002,7 +1002,7 @@
1002
  "special": false
1003
  },
1004
  "32122": {
1005
- "content": "cz",
1006
  "lstrip": false,
1007
  "normalized": true,
1008
  "rstrip": false,
@@ -1010,7 +1010,7 @@
1010
  "special": false
1011
  },
1012
  "32123": {
1013
- "content": "ai",
1014
  "lstrip": false,
1015
  "normalized": true,
1016
  "rstrip": false,
@@ -1018,7 +1018,7 @@
1018
  "special": false
1019
  },
1020
  "32124": {
1021
- "content": "si×sa",
1022
  "lstrip": false,
1023
  "normalized": true,
1024
  "rstrip": false,
@@ -1026,7 +1026,7 @@
1026
  "special": false
1027
  },
1028
  "32125": {
1029
- "content": "ga5",
1030
  "lstrip": false,
1031
  "normalized": true,
1032
  "rstrip": false,
@@ -1034,7 +1034,7 @@
1034
  "special": false
1035
  },
1036
  "32126": {
1037
- "content": "ummeda",
1038
  "lstrip": false,
1039
  "normalized": true,
1040
  "rstrip": false,
@@ -1042,7 +1042,7 @@
1042
  "special": false
1043
  },
1044
  "32127": {
1045
- "content": "qad",
1046
  "lstrip": false,
1047
  "normalized": true,
1048
  "rstrip": false,
@@ -1050,7 +1050,7 @@
1050
  "special": false
1051
  },
1052
  "32128": {
1053
- "content": "de3",
1054
  "lstrip": false,
1055
  "normalized": true,
1056
  "rstrip": false,
@@ -1058,7 +1058,7 @@
1058
  "special": false
1059
  },
1060
  "32129": {
1061
- "content": "sahar",
1062
  "lstrip": false,
1063
  "normalized": true,
1064
  "rstrip": false,
@@ -1066,7 +1066,7 @@
1066
  "special": false
1067
  },
1068
  "32130": {
1069
- "content": "szum",
1070
  "lstrip": false,
1071
  "normalized": true,
1072
  "rstrip": false,
@@ -1074,7 +1074,7 @@
1074
  "special": false
1075
  },
1076
  "32131": {
1077
- "content": "et9",
1078
  "lstrip": false,
1079
  "normalized": true,
1080
  "rstrip": false,
@@ -1082,7 +1082,7 @@
1082
  "special": false
1083
  },
1084
  "32132": {
1085
- "content": "complex",
1086
  "lstrip": false,
1087
  "normalized": true,
1088
  "rstrip": false,
@@ -1090,7 +1090,7 @@
1090
  "special": false
1091
  },
1092
  "32133": {
1093
- "content": "nis",
1094
  "lstrip": false,
1095
  "normalized": true,
1096
  "rstrip": false,
@@ -1098,7 +1098,7 @@
1098
  "special": false
1099
  },
1100
  "32134": {
1101
- "content": "ita",
1102
  "lstrip": false,
1103
  "normalized": true,
1104
  "rstrip": false,
@@ -1106,7 +1106,7 @@
1106
  "special": false
1107
  },
1108
  "32135": {
1109
- "content": "lut",
1110
  "lstrip": false,
1111
  "normalized": true,
1112
  "rstrip": false,
@@ -1114,7 +1114,7 @@
1114
  "special": false
1115
  },
1116
  "32136": {
1117
- "content": "Hittite",
1118
  "lstrip": false,
1119
  "normalized": true,
1120
  "rstrip": false,
@@ -1122,7 +1122,7 @@
1122
  "special": false
1123
  },
1124
  "32137": {
1125
- "content": "gestin'",
1126
  "lstrip": false,
1127
  "normalized": true,
1128
  "rstrip": false,
@@ -1130,7 +1130,7 @@
1130
  "special": false
1131
  },
1132
  "32138": {
1133
- "content": "transliteration",
1134
  "lstrip": false,
1135
  "normalized": true,
1136
  "rstrip": false,
@@ -1138,7 +1138,7 @@
1138
  "special": false
1139
  },
1140
  "32139": {
1141
- "content": "am3",
1142
  "lstrip": false,
1143
  "normalized": true,
1144
  "rstrip": false,
@@ -1146,7 +1146,7 @@
1146
  "special": false
1147
  },
1148
  "32140": {
1149
- "content": "bar8",
1150
  "lstrip": false,
1151
  "normalized": true,
1152
  "rstrip": false,
@@ -1154,7 +1154,7 @@
1154
  "special": false
1155
  },
1156
  "32141": {
1157
- "content": "ut2",
1158
  "lstrip": false,
1159
  "normalized": true,
1160
  "rstrip": false,
@@ -1162,7 +1162,7 @@
1162
  "special": false
1163
  },
1164
  "32142": {
1165
- "content": "szuszin",
1166
  "lstrip": false,
1167
  "normalized": true,
1168
  "rstrip": false,
@@ -1170,7 +1170,7 @@
1170
  "special": false
1171
  },
1172
  "32143": {
1173
- "content": "ket9",
1174
  "lstrip": false,
1175
  "normalized": true,
1176
  "rstrip": false,
@@ -1178,7 +1178,1607 @@
1178
  "special": false
1179
  },
1180
  "32144": {
1181
- "content": "ri2",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1182
  "lstrip": false,
1183
  "normalized": true,
1184
  "rstrip": false,
@@ -1288,11 +2888,11 @@
1288
  "<extra_id_98>",
1289
  "<extra_id_99>"
1290
  ],
1291
- "clean_up_tokenization_spaces": false,
1292
  "eos_token": "</s>",
1293
  "extra_ids": 100,
1294
  "extra_special_tokens": {},
1295
- "model_max_length": 1000000000000000019884624838656,
1296
  "pad_token": "<pad>",
1297
  "tokenizer_class": "T5Tokenizer",
1298
  "unk_token": "<unk>"
 
826
  "special": true
827
  },
828
  "32100": {
829
+ "content": "๐ƒž",
830
  "lstrip": false,
831
  "normalized": true,
832
  "rstrip": false,
 
834
  "special": false
835
  },
836
  "32101": {
837
+ "content": "→",
838
  "lstrip": false,
839
  "normalized": true,
840
  "rstrip": false,
 
842
  "special": false
843
  },
844
  "32102": {
845
+ "content": "๐ƒณ",
846
  "lstrip": false,
847
  "normalized": true,
848
  "rstrip": false,
 
850
  "special": false
851
  },
852
  "32103": {
853
+ "content": "๐„“",
854
  "lstrip": false,
855
  "normalized": true,
856
  "rstrip": false,
 
858
  "special": false
859
  },
860
  "32104": {
861
+ "content": "๐€š",
862
  "lstrip": false,
863
  "normalized": true,
864
  "rstrip": false,
 
866
  "special": false
867
  },
868
  "32105": {
869
+ "content": "๐•",
870
  "lstrip": false,
871
  "normalized": true,
872
  "rstrip": false,
 
874
  "special": false
875
  },
876
  "32106": {
877
+ "content": "๐€‰",
878
  "lstrip": false,
879
  "normalized": true,
880
  "rstrip": false,
 
882
  "special": false
883
  },
884
  "32107": {
885
+ "content": "๐‚",
886
  "lstrip": false,
887
  "normalized": true,
888
  "rstrip": false,
 
890
  "special": false
891
  },
892
  "32108": {
893
+ "content": "๐„",
894
  "lstrip": false,
895
  "normalized": true,
896
  "rstrip": false,
 
898
  "special": false
899
  },
900
  "32109": {
901
+ "content": "โ—",
902
  "lstrip": false,
903
  "normalized": true,
904
  "rstrip": false,
 
906
  "special": false
907
  },
908
  "32110": {
909
+ "content": "๐‚‹",
910
  "lstrip": false,
911
  "normalized": true,
912
  "rstrip": false,
 
914
  "special": false
915
  },
916
  "32111": {
917
+ "content": "๐„˜",
918
  "lstrip": false,
919
  "normalized": true,
920
  "rstrip": false,
 
922
  "special": false
923
  },
924
  "32112": {
925
+ "content": "๐€ฎ",
926
  "lstrip": false,
927
  "normalized": true,
928
  "rstrip": false,
 
930
  "special": false
931
  },
932
  "32113": {
933
+ "content": "๐„ซ",
934
  "lstrip": false,
935
  "normalized": true,
936
  "rstrip": false,
 
938
  "special": false
939
  },
940
  "32114": {
941
+ "content": "๐„น",
942
  "lstrip": false,
943
  "normalized": true,
944
  "rstrip": false,
 
946
  "special": false
947
  },
948
  "32115": {
949
+ "content": "๐€ก",
950
  "lstrip": false,
951
  "normalized": true,
952
  "rstrip": false,
 
954
  "special": false
955
  },
956
  "32116": {
957
+ "content": "๐„‰",
958
  "lstrip": false,
959
  "normalized": true,
960
  "rstrip": false,
 
962
  "special": false
963
  },
964
  "32117": {
965
+ "content": "๐ƒŸ",
966
  "lstrip": false,
967
  "normalized": true,
968
  "rstrip": false,
 
970
  "special": false
971
  },
972
  "32118": {
973
+ "content": "๐ƒŒ",
974
  "lstrip": false,
975
  "normalized": true,
976
  "rstrip": false,
 
978
  "special": false
979
  },
980
  "32119": {
981
+ "content": "๐€‹",
982
  "lstrip": false,
983
  "normalized": true,
984
  "rstrip": false,
 
986
  "special": false
987
  },
988
  "32120": {
989
+ "content": "๐€˜",
990
  "lstrip": false,
991
  "normalized": true,
992
  "rstrip": false,
 
994
  "special": false
995
  },
996
  "32121": {
997
+ "content": "๐€ฝ",
998
  "lstrip": false,
999
  "normalized": true,
1000
  "rstrip": false,
 
1002
  "special": false
1003
  },
1004
  "32122": {
1005
+ "content": "๐‚บ",
1006
  "lstrip": false,
1007
  "normalized": true,
1008
  "rstrip": false,
 
1010
  "special": false
1011
  },
1012
  "32123": {
1013
+ "content": "๐‚ฆ",
1014
  "lstrip": false,
1015
  "normalized": true,
1016
  "rstrip": false,
 
1018
  "special": false
1019
  },
1020
  "32124": {
1021
+ "content": "๐‚ผ",
1022
  "lstrip": false,
1023
  "normalized": true,
1024
  "rstrip": false,
 
1026
  "special": false
1027
  },
1028
  "32125": {
1029
+ "content": "๐ƒ",
1030
  "lstrip": false,
1031
  "normalized": true,
1032
  "rstrip": false,
 
1034
  "special": false
1035
  },
1036
  "32126": {
1037
+ "content": "๐‚›",
1038
  "lstrip": false,
1039
  "normalized": true,
1040
  "rstrip": false,
 
1042
  "special": false
1043
  },
1044
  "32127": {
1045
+ "content": "๐‚„",
1046
  "lstrip": false,
1047
  "normalized": true,
1048
  "rstrip": false,
 
1050
  "special": false
1051
  },
1052
  "32128": {
1053
+ "content": "๐„",
1054
  "lstrip": false,
1055
  "normalized": true,
1056
  "rstrip": false,
 
1058
  "special": false
1059
  },
1060
  "32129": {
1061
+ "content": "๐„•",
1062
  "lstrip": false,
1063
  "normalized": true,
1064
  "rstrip": false,
 
1066
  "special": false
1067
  },
1068
  "32130": {
1069
+ "content": "๐‚”",
1070
  "lstrip": false,
1071
  "normalized": true,
1072
  "rstrip": false,
 
1074
  "special": false
1075
  },
1076
  "32131": {
1077
+ "content": "๐‚ฎ",
1078
  "lstrip": false,
1079
  "normalized": true,
1080
  "rstrip": false,
 
1082
  "special": false
1083
  },
1084
  "32132": {
1085
+ "content": "๐Š",
1086
  "lstrip": false,
1087
  "normalized": true,
1088
  "rstrip": false,
 
1090
  "special": false
1091
  },
1092
  "32133": {
1093
+ "content": "๐€ผ",
1094
  "lstrip": false,
1095
  "normalized": true,
1096
  "rstrip": false,
 
1098
  "special": false
1099
  },
1100
  "32134": {
1101
+ "content": "๐",
1102
  "lstrip": false,
1103
  "normalized": true,
1104
  "rstrip": false,
 
1106
  "special": false
1107
  },
1108
  "32135": {
1109
+ "content": "๐ƒ",
1110
  "lstrip": false,
1111
  "normalized": true,
1112
  "rstrip": false,
 
1114
  "special": false
1115
  },
1116
  "32136": {
1117
+ "content": "๐ƒ‡",
1118
  "lstrip": false,
1119
  "normalized": true,
1120
  "rstrip": false,
 
1122
  "special": false
1123
  },
1124
  "32137": {
1125
+ "content": "๐„Œ",
1126
  "lstrip": false,
1127
  "normalized": true,
1128
  "rstrip": false,
 
1130
  "special": false
1131
  },
1132
  "32138": {
1133
+ "content": "๐‚‰",
1134
  "lstrip": false,
1135
  "normalized": true,
1136
  "rstrip": false,
 
1138
  "special": false
1139
  },
1140
  "32139": {
1141
+ "content": "๐ƒค",
1142
  "lstrip": false,
1143
  "normalized": true,
1144
  "rstrip": false,
 
1146
  "special": false
1147
  },
1148
  "32140": {
1149
+ "content": "๐€ฌ",
1150
  "lstrip": false,
1151
  "normalized": true,
1152
  "rstrip": false,
 
1154
  "special": false
1155
  },
1156
  "32141": {
1157
+ "content": "๐„™",
1158
  "lstrip": false,
1159
  "normalized": true,
1160
  "rstrip": false,
 
1162
  "special": false
1163
  },
1164
  "32142": {
1165
+ "content": "๐‚ฅ",
1166
  "lstrip": false,
1167
  "normalized": true,
1168
  "rstrip": false,
 
1170
  "special": false
1171
  },
1172
  "32143": {
1173
+ "content": "๐„ช",
1174
  "lstrip": false,
1175
  "normalized": true,
1176
  "rstrip": false,
 
1178
  "special": false
1179
  },
1180
  "32144": {
1181
+ "content": "๐‚ˆ",
1182
+ "lstrip": false,
1183
+ "normalized": true,
1184
+ "rstrip": false,
1185
+ "single_word": false,
1186
+ "special": false
1187
+ },
1188
+ "32145": {
1189
+ "content": "๐‚ž",
1190
+ "lstrip": false,
1191
+ "normalized": true,
1192
+ "rstrip": false,
1193
+ "single_word": false,
1194
+ "special": false
1195
+ },
1196
+ "32146": {
1197
+ "content": "๐™",
1198
+ "lstrip": false,
1199
+ "normalized": true,
1200
+ "rstrip": false,
1201
+ "single_word": false,
1202
+ "special": false
1203
+ },
1204
+ "32147": {
1205
+ "content": "๐ƒ•",
1206
+ "lstrip": false,
1207
+ "normalized": true,
1208
+ "rstrip": false,
1209
+ "single_word": false,
1210
+ "special": false
1211
+ },
1212
+ "32148": {
1213
+ "content": "๐„ท",
1214
+ "lstrip": false,
1215
+ "normalized": true,
1216
+ "rstrip": false,
1217
+ "single_word": false,
1218
+ "special": false
1219
+ },
1220
+ "32149": {
1221
+ "content": "๐‚Ÿ",
1222
+ "lstrip": false,
1223
+ "normalized": true,
1224
+ "rstrip": false,
1225
+ "single_word": false,
1226
+ "special": false
1227
+ },
1228
+ "32150": {
1229
+ "content": "๐ƒŠ",
1230
+ "lstrip": false,
1231
+ "normalized": true,
1232
+ "rstrip": false,
1233
+ "single_word": false,
1234
+ "special": false
1235
+ },
1236
+ "32151": {
1237
+ "content": "๐ƒก",
1238
+ "lstrip": false,
1239
+ "normalized": true,
1240
+ "rstrip": false,
1241
+ "single_word": false,
1242
+ "special": false
1243
+ },
1244
+ "32152": {
1245
+ "content": "๐€ฑ",
1246
+ "lstrip": false,
1247
+ "normalized": true,
1248
+ "rstrip": false,
1249
+ "single_word": false,
1250
+ "special": false
1251
+ },
1252
+ "32153": {
1253
+ "content": "๐‚ฐ",
1254
+ "lstrip": false,
1255
+ "normalized": true,
1256
+ "rstrip": false,
1257
+ "single_word": false,
1258
+ "special": false
1259
+ },
1260
+ "32154": {
1261
+ "content": "๐‚",
1262
+ "lstrip": false,
1263
+ "normalized": true,
1264
+ "rstrip": false,
1265
+ "single_word": false,
1266
+ "special": false
1267
+ },
1268
+ "32155": {
1269
+ "content": "๐„ง",
1270
+ "lstrip": false,
1271
+ "normalized": true,
1272
+ "rstrip": false,
1273
+ "single_word": false,
1274
+ "special": false
1275
+ },
1276
+ "32156": {
1277
+ "content": "๐ƒ„",
1278
+ "lstrip": false,
1279
+ "normalized": true,
1280
+ "rstrip": false,
1281
+ "single_word": false,
1282
+ "special": false
1283
+ },
1284
+ "32157": {
1285
+ "content": "๐€ฆ",
1286
+ "lstrip": false,
1287
+ "normalized": true,
1288
+ "rstrip": false,
1289
+ "single_word": false,
1290
+ "special": false
1291
+ },
1292
+ "32158": {
1293
+ "content": "๐‚ฟ",
1294
+ "lstrip": false,
1295
+ "normalized": true,
1296
+ "rstrip": false,
1297
+ "single_word": false,
1298
+ "special": false
1299
+ },
1300
+ "32159": {
1301
+ "content": "๐ˆ",
1302
+ "lstrip": false,
1303
+ "normalized": true,
1304
+ "rstrip": false,
1305
+ "single_word": false,
1306
+ "special": false
1307
+ },
1308
+ "32160": {
1309
+ "content": "๐š",
1310
+ "lstrip": false,
1311
+ "normalized": true,
1312
+ "rstrip": false,
1313
+ "single_word": false,
1314
+ "special": false
1315
+ },
1316
+ "32161": {
1317
+ "content": "๐ƒด",
1318
+ "lstrip": false,
1319
+ "normalized": true,
1320
+ "rstrip": false,
1321
+ "single_word": false,
1322
+ "special": false
1323
+ },
1324
+ "32162": {
1325
+ "content": "๐ƒฉ",
1326
+ "lstrip": false,
1327
+ "normalized": true,
1328
+ "rstrip": false,
1329
+ "single_word": false,
1330
+ "special": false
1331
+ },
1332
+ "32163": {
1333
+ "content": "๐‚‘",
1334
+ "lstrip": false,
1335
+ "normalized": true,
1336
+ "rstrip": false,
1337
+ "single_word": false,
1338
+ "special": false
1339
+ },
1340
+ "32164": {
1341
+ "content": "๐ƒฃ",
1342
+ "lstrip": false,
1343
+ "normalized": true,
1344
+ "rstrip": false,
1345
+ "single_word": false,
1346
+ "special": false
1347
+ },
1348
+ "32165": {
1349
+ "content": "๐€ฉ",
1350
+ "lstrip": false,
1351
+ "normalized": true,
1352
+ "rstrip": false,
1353
+ "single_word": false,
1354
+ "special": false
1355
+ },
1356
+ "32166": {
1357
+ "content": "๐€—",
1358
+ "lstrip": false,
1359
+ "normalized": true,
1360
+ "rstrip": false,
1361
+ "single_word": false,
1362
+ "special": false
1363
+ },
1364
+ "32167": {
1365
+ "content": "๐„’",
1366
+ "lstrip": false,
1367
+ "normalized": true,
1368
+ "rstrip": false,
1369
+ "single_word": false,
1370
+ "special": false
1371
+ },
1372
+ "32168": {
1373
+ "content": "๐ƒœ",
1374
+ "lstrip": false,
1375
+ "normalized": true,
1376
+ "rstrip": false,
1377
+ "single_word": false,
1378
+ "special": false
1379
+ },
1380
+ "32169": {
1381
+ "content": "๐€…",
1382
+ "lstrip": false,
1383
+ "normalized": true,
1384
+ "rstrip": false,
1385
+ "single_word": false,
1386
+ "special": false
1387
+ },
1388
+ "32170": {
1389
+ "content": "๐„‹",
1390
+ "lstrip": false,
1391
+ "normalized": true,
1392
+ "rstrip": false,
1393
+ "single_word": false,
1394
+ "special": false
1395
+ },
1396
+ "32171": {
1397
+ "content": "๐‚ง",
1398
+ "lstrip": false,
1399
+ "normalized": true,
1400
+ "rstrip": false,
1401
+ "single_word": false,
1402
+ "special": false
1403
+ },
1404
+ "32172": {
1405
+ "content": "๐€€",
1406
+ "lstrip": false,
1407
+ "normalized": true,
1408
+ "rstrip": false,
1409
+ "single_word": false,
1410
+ "special": false
1411
+ },
1412
+ "32173": {
1413
+ "content": "๐‚‚",
1414
+ "lstrip": false,
1415
+ "normalized": true,
1416
+ "rstrip": false,
1417
+ "single_word": false,
1418
+ "special": false
1419
+ },
1420
+ "32174": {
1421
+ "content": "๐€ ",
1422
+ "lstrip": false,
1423
+ "normalized": true,
1424
+ "rstrip": false,
1425
+ "single_word": false,
1426
+ "special": false
1427
+ },
1428
+ "32175": {
1429
+ "content": "๐„ฝ",
1430
+ "lstrip": false,
1431
+ "normalized": true,
1432
+ "rstrip": false,
1433
+ "single_word": false,
1434
+ "special": false
1435
+ },
1436
+ "32176": {
1437
+ "content": "๐ƒš",
1438
+ "lstrip": false,
1439
+ "normalized": true,
1440
+ "rstrip": false,
1441
+ "single_word": false,
1442
+ "special": false
1443
+ },
1444
+ "32177": {
1445
+ "content": "๐†",
1446
+ "lstrip": false,
1447
+ "normalized": true,
1448
+ "rstrip": false,
1449
+ "single_word": false,
1450
+ "special": false
1451
+ },
1452
+ "32178": {
1453
+ "content": "๐„",
1454
+ "lstrip": false,
1455
+ "normalized": true,
1456
+ "rstrip": false,
1457
+ "single_word": false,
1458
+ "special": false
1459
+ },
1460
+ "32179": {
1461
+ "content": "๐ƒ›",
1462
+ "lstrip": false,
1463
+ "normalized": true,
1464
+ "rstrip": false,
1465
+ "single_word": false,
1466
+ "special": false
1467
+ },
1468
+ "32180": {
1469
+ "content": "๐ƒ‘",
1470
+ "lstrip": false,
1471
+ "normalized": true,
1472
+ "rstrip": false,
1473
+ "single_word": false,
1474
+ "special": false
1475
+ },
1476
+ "32181": {
1477
+ "content": "๐‚ฌ",
1478
+ "lstrip": false,
1479
+ "normalized": true,
1480
+ "rstrip": false,
1481
+ "single_word": false,
1482
+ "special": false
1483
+ },
1484
+ "32182": {
1485
+ "content": "๐‚ท",
1486
+ "lstrip": false,
1487
+ "normalized": true,
1488
+ "rstrip": false,
1489
+ "single_word": false,
1490
+ "special": false
1491
+ },
1492
+ "32183": {
1493
+ "content": "๐€›",
1494
+ "lstrip": false,
1495
+ "normalized": true,
1496
+ "rstrip": false,
1497
+ "single_word": false,
1498
+ "special": false
1499
+ },
1500
+ "32184": {
1501
+ "content": "๐œ",
1502
+ "lstrip": false,
1503
+ "normalized": true,
1504
+ "rstrip": false,
1505
+ "single_word": false,
1506
+ "special": false
1507
+ },
1508
+ "32185": {
1509
+ "content": "๐„”",
1510
+ "lstrip": false,
1511
+ "normalized": true,
1512
+ "rstrip": false,
1513
+ "single_word": false,
1514
+ "special": false
1515
+ },
1516
+ "32186": {
1517
+ "content": "๐‚ข",
1518
+ "lstrip": false,
1519
+ "normalized": true,
1520
+ "rstrip": false,
1521
+ "single_word": false,
1522
+ "special": false
1523
+ },
1524
+ "32187": {
1525
+ "content": "๐€Ž",
1526
+ "lstrip": false,
1527
+ "normalized": true,
1528
+ "rstrip": false,
1529
+ "single_word": false,
1530
+ "special": false
1531
+ },
1532
+ "32188": {
1533
+ "content": "๐€ธ",
1534
+ "lstrip": false,
1535
+ "normalized": true,
1536
+ "rstrip": false,
1537
+ "single_word": false,
1538
+ "special": false
1539
+ },
1540
+ "32189": {
1541
+ "content": "๐€",
1542
+ "lstrip": false,
1543
+ "normalized": true,
1544
+ "rstrip": false,
1545
+ "single_word": false,
1546
+ "special": false
1547
+ },
1548
+ "32190": {
1549
+ "content": "๐“",
1550
+ "lstrip": false,
1551
+ "normalized": true,
1552
+ "rstrip": false,
1553
+ "single_word": false,
1554
+ "special": false
1555
+ },
1556
+ "32191": {
1557
+ "content": "๐‰",
1558
+ "lstrip": false,
1559
+ "normalized": true,
1560
+ "rstrip": false,
1561
+ "single_word": false,
1562
+ "special": false
1563
+ },
1564
+ "32192": {
1565
+ "content": "๐‚…",
1566
+ "lstrip": false,
1567
+ "normalized": true,
1568
+ "rstrip": false,
1569
+ "single_word": false,
1570
+ "special": false
1571
+ },
1572
+ "32193": {
1573
+ "content": "๐ƒ”",
1574
+ "lstrip": false,
1575
+ "normalized": true,
1576
+ "rstrip": false,
1577
+ "single_word": false,
1578
+ "special": false
1579
+ },
1580
+ "32194": {
1581
+ "content": "โŒ",
1582
+ "lstrip": false,
1583
+ "normalized": true,
1584
+ "rstrip": false,
1585
+ "single_word": false,
1586
+ "special": false
1587
+ },
1588
+ "32195": {
1589
+ "content": "๐ƒ€",
1590
+ "lstrip": false,
1591
+ "normalized": true,
1592
+ "rstrip": false,
1593
+ "single_word": false,
1594
+ "special": false
1595
+ },
1596
+ "32196": {
1597
+ "content": "๐ƒช",
1598
+ "lstrip": false,
1599
+ "normalized": true,
1600
+ "rstrip": false,
1601
+ "single_word": false,
1602
+ "special": false
1603
+ },
1604
+ "32197": {
1605
+ "content": "๐„ž",
1606
+ "lstrip": false,
1607
+ "normalized": true,
1608
+ "rstrip": false,
1609
+ "single_word": false,
1610
+ "special": false
1611
+ },
1612
+ "32198": {
1613
+ "content": "๐€ถ",
1614
+ "lstrip": false,
1615
+ "normalized": true,
1616
+ "rstrip": false,
1617
+ "single_word": false,
1618
+ "special": false
1619
+ },
1620
+ "32199": {
1621
+ "content": "๐‚",
1622
+ "lstrip": false,
1623
+ "normalized": true,
1624
+ "rstrip": false,
1625
+ "single_word": false,
1626
+ "special": false
1627
+ },
1628
+ "32200": {
1629
+ "content": "๐„ก",
1630
+ "lstrip": false,
1631
+ "normalized": true,
1632
+ "rstrip": false,
1633
+ "single_word": false,
1634
+ "special": false
1635
+ },
1636
+ "32201": {
1637
+ "content": "๐ƒฌ",
1638
+ "lstrip": false,
1639
+ "normalized": true,
1640
+ "rstrip": false,
1641
+ "single_word": false,
1642
+ "special": false
1643
+ },
1644
+ "32202": {
1645
+ "content": "๐„œ",
1646
+ "lstrip": false,
1647
+ "normalized": true,
1648
+ "rstrip": false,
1649
+ "single_word": false,
1650
+ "special": false
1651
+ },
1652
+ "32203": {
1653
+ "content": "๐„",
1654
+ "lstrip": false,
1655
+ "normalized": true,
1656
+ "rstrip": false,
1657
+ "single_word": false,
1658
+ "special": false
1659
+ },
1660
+ "32204": {
1661
+ "content": "๐€ฃ",
1662
+ "lstrip": false,
1663
+ "normalized": true,
1664
+ "rstrip": false,
1665
+ "single_word": false,
1666
+ "special": false
1667
+ },
1668
+ "32205": {
1669
+ "content": "๐€ช",
1670
+ "lstrip": false,
1671
+ "normalized": true,
1672
+ "rstrip": false,
1673
+ "single_word": false,
1674
+ "special": false
1675
+ },
1676
+ "32206": {
1677
+ "content": "๐ƒน",
1678
+ "lstrip": false,
1679
+ "normalized": true,
1680
+ "rstrip": false,
1681
+ "single_word": false,
1682
+ "special": false
1683
+ },
1684
+ "32207": {
1685
+ "content": "๐€ฐ",
1686
+ "lstrip": false,
1687
+ "normalized": true,
1688
+ "rstrip": false,
1689
+ "single_word": false,
1690
+ "special": false
1691
+ },
1692
+ "32208": {
1693
+ "content": "๐€น",
1694
+ "lstrip": false,
1695
+ "normalized": true,
1696
+ "rstrip": false,
1697
+ "single_word": false,
1698
+ "special": false
1699
+ },
1700
+ "32209": {
1701
+ "content": "๐‚ถ",
1702
+ "lstrip": false,
1703
+ "normalized": true,
1704
+ "rstrip": false,
1705
+ "single_word": false,
1706
+ "special": false
1707
+ },
1708
+ "32210": {
1709
+ "content": "๐€„",
1710
+ "lstrip": false,
1711
+ "normalized": true,
1712
+ "rstrip": false,
1713
+ "single_word": false,
1714
+ "special": false
1715
+ },
1716
+ "32211": {
1717
+ "content": "ยฑ",
1718
+ "lstrip": false,
1719
+ "normalized": true,
1720
+ "rstrip": false,
1721
+ "single_word": false,
1722
+ "special": false
1723
+ },
1724
+ "32212": {
1725
+ "content": "๐‚—",
1726
+ "lstrip": false,
1727
+ "normalized": true,
1728
+ "rstrip": false,
1729
+ "single_word": false,
1730
+ "special": false
1731
+ },
1732
+ "32213": {
1733
+ "content": "๐€ฒ",
1734
+ "lstrip": false,
1735
+ "normalized": true,
1736
+ "rstrip": false,
1737
+ "single_word": false,
1738
+ "special": false
1739
+ },
1740
+ "32214": {
1741
+ "content": "๐„ค",
1742
+ "lstrip": false,
1743
+ "normalized": true,
1744
+ "rstrip": false,
1745
+ "single_word": false,
1746
+ "special": false
1747
+ },
1748
+ "32215": {
1749
+ "content": "๐ƒ‚",
1750
+ "lstrip": false,
1751
+ "normalized": true,
1752
+ "rstrip": false,
1753
+ "single_word": false,
1754
+ "special": false
1755
+ },
1756
+ "32216": {
1757
+ "content": "๐‚ญ",
1758
+ "lstrip": false,
1759
+ "normalized": true,
1760
+ "rstrip": false,
1761
+ "single_word": false,
1762
+ "special": false
1763
+ },
1764
+ "32217": {
1765
+ "content": "๐€ž",
1766
+ "lstrip": false,
1767
+ "normalized": true,
1768
+ "rstrip": false,
1769
+ "single_word": false,
1770
+ "special": false
1771
+ },
1772
+ "32218": {
1773
+ "content": "๐‚ฏ",
1774
+ "lstrip": false,
1775
+ "normalized": true,
1776
+ "rstrip": false,
1777
+ "single_word": false,
1778
+ "special": false
1779
+ },
1780
+ "32219": {
1781
+ "content": "๐„›",
1782
+ "lstrip": false,
1783
+ "normalized": true,
1784
+ "rstrip": false,
1785
+ "single_word": false,
1786
+ "special": false
1787
+ },
1788
+ "32220": {
1789
+ "content": "๐ƒ“",
1790
+ "lstrip": false,
1791
+ "normalized": true,
1792
+ "rstrip": false,
1793
+ "single_word": false,
1794
+ "special": false
1795
+ },
1796
+ "32221": {
1797
+ "content": "๐€ณ",
1798
+ "lstrip": false,
1799
+ "normalized": true,
1800
+ "rstrip": false,
1801
+ "single_word": false,
1802
+ "special": false
1803
+ },
1804
+ "32222": {
1805
+ "content": "๐„บ",
1806
+ "lstrip": false,
1807
+ "normalized": true,
1808
+ "rstrip": false,
1809
+ "single_word": false,
1810
+ "special": false
1811
+ },
1812
+ "32223": {
1813
+ "content": "๐‚€",
1814
+ "lstrip": false,
1815
+ "normalized": true,
1816
+ "rstrip": false,
1817
+ "single_word": false,
1818
+ "special": false
1819
+ },
1820
+ "32224": {
1821
+ "content": "๐’",
1822
+ "lstrip": false,
1823
+ "normalized": true,
1824
+ "rstrip": false,
1825
+ "single_word": false,
1826
+ "special": false
1827
+ },
1828
+ "32225": {
1829
+ "content": "๐‚ป",
1830
+ "lstrip": false,
1831
+ "normalized": true,
1832
+ "rstrip": false,
1833
+ "single_word": false,
1834
+ "special": false
1835
+ },
1836
+ "32226": {
1837
+ "content": "๐„Ž",
1838
+ "lstrip": false,
1839
+ "normalized": true,
1840
+ "rstrip": false,
1841
+ "single_word": false,
1842
+ "special": false
1843
+ },
1844
+ "32227": {
1845
+ "content": "๐‚ต",
1846
+ "lstrip": false,
1847
+ "normalized": true,
1848
+ "rstrip": false,
1849
+ "single_word": false,
1850
+ "special": false
1851
+ },
1852
+ "32228": {
1853
+ "content": "๐€†",
1854
+ "lstrip": false,
1855
+ "normalized": true,
1856
+ "rstrip": false,
1857
+ "single_word": false,
1858
+ "special": false
1859
+ },
1860
+ "32229": {
1861
+ "content": "๐‚",
1862
+ "lstrip": false,
1863
+ "normalized": true,
1864
+ "rstrip": false,
1865
+ "single_word": false,
1866
+ "special": false
1867
+ },
1868
+ "32230": {
1869
+ "content": "๐›",
1870
+ "lstrip": false,
1871
+ "normalized": true,
1872
+ "rstrip": false,
1873
+ "single_word": false,
1874
+ "special": false
1875
+ },
1876
+ "32231": {
1877
+ "content": "๐ƒถ",
1878
+ "lstrip": false,
1879
+ "normalized": true,
1880
+ "rstrip": false,
1881
+ "single_word": false,
1882
+ "special": false
1883
+ },
1884
+ "32232": {
1885
+ "content": "๐€ญ",
1886
+ "lstrip": false,
1887
+ "normalized": true,
1888
+ "rstrip": false,
1889
+ "single_word": false,
1890
+ "special": false
1891
+ },
1892
+ "32233": {
1893
+ "content": "๐‚จ",
1894
+ "lstrip": false,
1895
+ "normalized": true,
1896
+ "rstrip": false,
1897
+ "single_word": false,
1898
+ "special": false
1899
+ },
1900
+ "32234": {
1901
+ "content": "๐‹",
1902
+ "lstrip": false,
1903
+ "normalized": true,
1904
+ "rstrip": false,
1905
+ "single_word": false,
1906
+ "special": false
1907
+ },
1908
+ "32235": {
1909
+ "content": "๐„—",
1910
+ "lstrip": false,
1911
+ "normalized": true,
1912
+ "rstrip": false,
1913
+ "single_word": false,
1914
+ "special": false
1915
+ },
1916
+ "32236": {
1917
+ "content": "๐‚Ž",
1918
+ "lstrip": false,
1919
+ "normalized": true,
1920
+ "rstrip": false,
1921
+ "single_word": false,
1922
+ "special": false
1923
+ },
1924
+ "32237": {
1925
+ "content": "๐€",
1926
+ "lstrip": false,
1927
+ "normalized": true,
1928
+ "rstrip": false,
1929
+ "single_word": false,
1930
+ "special": false
1931
+ },
1932
+ "32238": {
1933
+ "content": "๐€ˆ",
1934
+ "lstrip": false,
1935
+ "normalized": true,
1936
+ "rstrip": false,
1937
+ "single_word": false,
1938
+ "special": false
1939
+ },
1940
+ "32239": {
1941
+ "content": "๐ƒท",
1942
+ "lstrip": false,
1943
+ "normalized": true,
1944
+ "rstrip": false,
1945
+ "single_word": false,
1946
+ "special": false
1947
+ },
1948
+ "32240": {
1949
+ "content": "๐‚น",
1950
+ "lstrip": false,
1951
+ "normalized": true,
1952
+ "rstrip": false,
1953
+ "single_word": false,
1954
+ "special": false
1955
+ },
1956
+ "32241": {
1957
+ "content": "๐€ท",
1958
+ "lstrip": false,
1959
+ "normalized": true,
1960
+ "rstrip": false,
1961
+ "single_word": false,
1962
+ "special": false
1963
+ },
1964
+ "32242": {
1965
+ "content": "๐€œ",
1966
+ "lstrip": false,
1967
+ "normalized": true,
1968
+ "rstrip": false,
1969
+ "single_word": false,
1970
+ "special": false
1971
+ },
1972
+ "32243": {
1973
+ "content": "๐€",
1974
+ "lstrip": false,
1975
+ "normalized": true,
1976
+ "rstrip": false,
1977
+ "single_word": false,
1978
+ "special": false
1979
+ },
1980
+ "32244": {
1981
+ "content": "๐€ƒ",
1982
+ "lstrip": false,
1983
+ "normalized": true,
1984
+ "rstrip": false,
1985
+ "single_word": false,
1986
+ "special": false
1987
+ },
1988
+ "32245": {
1989
+ "content": "๐‚ณ",
1990
+ "lstrip": false,
1991
+ "normalized": true,
1992
+ "rstrip": false,
1993
+ "single_word": false,
1994
+ "special": false
1995
+ },
1996
+ "32246": {
1997
+ "content": "โŒœ",
1998
+ "lstrip": false,
1999
+ "normalized": true,
2000
+ "rstrip": false,
2001
+ "single_word": false,
2002
+ "special": false
2003
+ },
2004
+ "32247": {
2005
+ "content": "๐ƒ†",
2006
+ "lstrip": false,
2007
+ "normalized": true,
2008
+ "rstrip": false,
2009
+ "single_word": false,
2010
+ "special": false
2011
+ },
2012
+ "32248": {
2013
+ "content": "๐‚ฝ",
2014
+ "lstrip": false,
2015
+ "normalized": true,
2016
+ "rstrip": false,
2017
+ "single_word": false,
2018
+ "special": false
2019
+ },
2020
+ "32249": {
2021
+ "content": "๐‚œ",
2022
+ "lstrip": false,
2023
+ "normalized": true,
2024
+ "rstrip": false,
2025
+ "single_word": false,
2026
+ "special": false
2027
+ },
2028
+ "32250": {
2029
+ "content": "๐„",
2030
+ "lstrip": false,
2031
+ "normalized": true,
2032
+ "rstrip": false,
2033
+ "single_word": false,
2034
+ "special": false
2035
+ },
2036
+ "32251": {
2037
+ "content": "๐€”",
2038
+ "lstrip": false,
2039
+ "normalized": true,
2040
+ "rstrip": false,
2041
+ "single_word": false,
2042
+ "special": false
2043
+ },
2044
+ "32252": {
2045
+ "content": "๐ƒ™",
2046
+ "lstrip": false,
2047
+ "normalized": true,
2048
+ "rstrip": false,
2049
+ "single_word": false,
2050
+ "special": false
2051
+ },
2052
+ "32253": {
2053
+ "content": "๐„พ",
2054
+ "lstrip": false,
2055
+ "normalized": true,
2056
+ "rstrip": false,
2057
+ "single_word": false,
2058
+ "special": false
2059
+ },
2060
+ "32254": {
2061
+ "content": "๐‚š",
2062
+ "lstrip": false,
2063
+ "normalized": true,
2064
+ "rstrip": false,
2065
+ "single_word": false,
2066
+ "special": false
2067
+ },
2068
+ "32255": {
2069
+ "content": "๐‚ฒ",
2070
+ "lstrip": false,
2071
+ "normalized": true,
2072
+ "rstrip": false,
2073
+ "single_word": false,
2074
+ "special": false
2075
+ },
2076
+ "32256": {
2077
+ "content": "๐ƒŽ",
2078
+ "lstrip": false,
2079
+ "normalized": true,
2080
+ "rstrip": false,
2081
+ "single_word": false,
2082
+ "special": false
2083
+ },
2084
+ "32257": {
2085
+ "content": "๐‚’",
2086
+ "lstrip": false,
2087
+ "normalized": true,
2088
+ "rstrip": false,
2089
+ "single_word": false,
2090
+ "special": false
2091
+ },
2092
+ "32258": {
2093
+ "content": "๐‚ƒ",
2094
+ "lstrip": false,
2095
+ "normalized": true,
2096
+ "rstrip": false,
2097
+ "single_word": false,
2098
+ "special": false
2099
+ },
2100
+ "32259": {
2101
+ "content": "๐",
2102
+ "lstrip": false,
2103
+ "normalized": true,
2104
+ "rstrip": false,
2105
+ "single_word": false,
2106
+ "special": false
2107
+ },
2108
+ "32260": {
2109
+ "content": "๐—",
2110
+ "lstrip": false,
2111
+ "normalized": true,
2112
+ "rstrip": false,
2113
+ "single_word": false,
2114
+ "special": false
2115
+ },
2116
+ "32261": {
2117
+ "content": "๐”",
2118
+ "lstrip": false,
2119
+ "normalized": true,
2120
+ "rstrip": false,
2121
+ "single_word": false,
2122
+ "special": false
2123
+ },
2124
+ "32262": {
2125
+ "content": "๐‚พ",
2126
+ "lstrip": false,
2127
+ "normalized": true,
2128
+ "rstrip": false,
2129
+ "single_word": false,
2130
+ "special": false
2131
+ },
2132
+ "32263": {
2133
+ "content": "๐„ธ",
2134
+ "lstrip": false,
2135
+ "normalized": true,
2136
+ "rstrip": false,
2137
+ "single_word": false,
2138
+ "special": false
2139
+ },
2140
+ "32264": {
2141
+ "content": "๐ƒง",
2142
+ "lstrip": false,
2143
+ "normalized": true,
2144
+ "rstrip": false,
2145
+ "single_word": false,
2146
+ "special": false
2147
+ },
2148
+ "32265": {
2149
+ "content": "๐‚†",
2150
+ "lstrip": false,
2151
+ "normalized": true,
2152
+ "rstrip": false,
2153
+ "single_word": false,
2154
+ "special": false
2155
+ },
2156
+ "32266": {
2157
+ "content": "๐„ฟ",
2158
+ "lstrip": false,
2159
+ "normalized": true,
2160
+ "rstrip": false,
2161
+ "single_word": false,
2162
+ "special": false
2163
+ },
2164
+ "32267": {
2165
+ "content": "๐‚ด",
2166
+ "lstrip": false,
2167
+ "normalized": true,
2168
+ "rstrip": false,
2169
+ "single_word": false,
2170
+ "special": false
2171
+ },
2172
+ "32268": {
2173
+ "content": "๐‚ฉ",
2174
+ "lstrip": false,
2175
+ "normalized": true,
2176
+ "rstrip": false,
2177
+ "single_word": false,
2178
+ "special": false
2179
+ },
2180
+ "32269": {
2181
+ "content": "โŸง",
2182
+ "lstrip": false,
2183
+ "normalized": true,
2184
+ "rstrip": false,
2185
+ "single_word": false,
2186
+ "special": false
2187
+ },
2188
+ "32270": {
2189
+ "content": "๐ƒธ",
2190
+ "lstrip": false,
2191
+ "normalized": true,
2192
+ "rstrip": false,
2193
+ "single_word": false,
2194
+ "special": false
2195
+ },
2196
+ "32271": {
2197
+ "content": "๐ƒญ",
2198
+ "lstrip": false,
2199
+ "normalized": true,
2200
+ "rstrip": false,
2201
+ "single_word": false,
2202
+ "special": false
2203
+ },
2204
+ "32272": {
2205
+ "content": "๐€Ÿ",
2206
+ "lstrip": false,
2207
+ "normalized": true,
2208
+ "rstrip": false,
2209
+ "single_word": false,
2210
+ "special": false
2211
+ },
2212
+ "32273": {
2213
+ "content": "๐Œ",
2214
+ "lstrip": false,
2215
+ "normalized": true,
2216
+ "rstrip": false,
2217
+ "single_word": false,
2218
+ "special": false
2219
+ },
2220
+ "32274": {
2221
+ "content": "๐€–",
2222
+ "lstrip": false,
2223
+ "normalized": true,
2224
+ "rstrip": false,
2225
+ "single_word": false,
2226
+ "special": false
2227
+ },
2228
+ "32275": {
2229
+ "content": "๐€’",
2230
+ "lstrip": false,
2231
+ "normalized": true,
2232
+ "rstrip": false,
2233
+ "single_word": false,
2234
+ "special": false
2235
+ },
2236
+ "32276": {
2237
+ "content": "๐€•",
2238
+ "lstrip": false,
2239
+ "normalized": true,
2240
+ "rstrip": false,
2241
+ "single_word": false,
2242
+ "special": false
2243
+ },
2244
+ "32277": {
2245
+ "content": "๐€ฅ",
2246
+ "lstrip": false,
2247
+ "normalized": true,
2248
+ "rstrip": false,
2249
+ "single_word": false,
2250
+ "special": false
2251
+ },
2252
+ "32278": {
2253
+ "content": "๐‚",
2254
+ "lstrip": false,
2255
+ "normalized": true,
2256
+ "rstrip": false,
2257
+ "single_word": false,
2258
+ "special": false
2259
+ },
2260
+ "32279": {
2261
+ "content": "๐",
2262
+ "lstrip": false,
2263
+ "normalized": true,
2264
+ "rstrip": false,
2265
+ "single_word": false,
2266
+ "special": false
2267
+ },
2268
+ "32280": {
2269
+ "content": "๐ƒฐ",
2270
+ "lstrip": false,
2271
+ "normalized": true,
2272
+ "rstrip": false,
2273
+ "single_word": false,
2274
+ "special": false
2275
+ },
2276
+ "32281": {
2277
+ "content": "โŸฆ",
2278
+ "lstrip": false,
2279
+ "normalized": true,
2280
+ "rstrip": false,
2281
+ "single_word": false,
2282
+ "special": false
2283
+ },
2284
+ "32282": {
2285
+ "content": "๐‚•",
2286
+ "lstrip": false,
2287
+ "normalized": true,
2288
+ "rstrip": false,
2289
+ "single_word": false,
2290
+ "special": false
2291
+ },
2292
+ "32283": {
2293
+ "content": "๐€จ",
2294
+ "lstrip": false,
2295
+ "normalized": true,
2296
+ "rstrip": false,
2297
+ "single_word": false,
2298
+ "special": false
2299
+ },
2300
+ "32284": {
2301
+ "content": "๐€",
2302
+ "lstrip": false,
2303
+ "normalized": true,
2304
+ "rstrip": false,
2305
+ "single_word": false,
2306
+ "special": false
2307
+ },
2308
+ "32285": {
2309
+ "content": "๐–",
2310
+ "lstrip": false,
2311
+ "normalized": true,
2312
+ "rstrip": false,
2313
+ "single_word": false,
2314
+ "special": false
2315
+ },
2316
+ "32286": {
2317
+ "content": "๐…",
2318
+ "lstrip": false,
2319
+ "normalized": true,
2320
+ "rstrip": false,
2321
+ "single_word": false,
2322
+ "special": false
2323
+ },
2324
+ "32287": {
2325
+ "content": "๐ƒฑ",
2326
+ "lstrip": false,
2327
+ "normalized": true,
2328
+ "rstrip": false,
2329
+ "single_word": false,
2330
+ "special": false
2331
+ },
2332
+ "32288": {
2333
+ "content": "๐ƒ",
2334
+ "lstrip": false,
2335
+ "normalized": true,
2336
+ "rstrip": false,
2337
+ "single_word": false,
2338
+ "special": false
2339
+ },
2340
+ "32289": {
2341
+ "content": "๐€ซ",
2342
+ "lstrip": false,
2343
+ "normalized": true,
2344
+ "rstrip": false,
2345
+ "single_word": false,
2346
+ "special": false
2347
+ },
2348
+ "32290": {
2349
+ "content": "๐ƒ‰",
2350
+ "lstrip": false,
2351
+ "normalized": true,
2352
+ "rstrip": false,
2353
+ "single_word": false,
2354
+ "special": false
2355
+ },
2356
+ "32291": {
2357
+ "content": "๐",
2358
+ "lstrip": false,
2359
+ "normalized": true,
2360
+ "rstrip": false,
2361
+ "single_word": false,
2362
+ "special": false
2363
+ },
2364
+ "32292": {
2365
+ "content": "๐ƒˆ",
2366
+ "lstrip": false,
2367
+ "normalized": true,
2368
+ "rstrip": false,
2369
+ "single_word": false,
2370
+ "special": false
2371
+ },
2372
+ "32293": {
2373
+ "content": "๐‘",
2374
+ "lstrip": false,
2375
+ "normalized": true,
2376
+ "rstrip": false,
2377
+ "single_word": false,
2378
+ "special": false
2379
+ },
2380
+ "32294": {
2381
+ "content": "๐„Š",
2382
+ "lstrip": false,
2383
+ "normalized": true,
2384
+ "rstrip": false,
2385
+ "single_word": false,
2386
+ "special": false
2387
+ },
2388
+ "32295": {
2389
+ "content": "๐€",
2390
+ "lstrip": false,
2391
+ "normalized": true,
2392
+ "rstrip": false,
2393
+ "single_word": false,
2394
+ "special": false
2395
+ },
2396
+ "32296": {
2397
+ "content": "๐„š",
2398
+ "lstrip": false,
2399
+ "normalized": true,
2400
+ "rstrip": false,
2401
+ "single_word": false,
2402
+ "special": false
2403
+ },
2404
+ "32297": {
2405
+ "content": "๐‚–",
2406
+ "lstrip": false,
2407
+ "normalized": true,
2408
+ "rstrip": false,
2409
+ "single_word": false,
2410
+ "special": false
2411
+ },
2412
+ "32298": {
2413
+ "content": "๐€",
2414
+ "lstrip": false,
2415
+ "normalized": true,
2416
+ "rstrip": false,
2417
+ "single_word": false,
2418
+ "special": false
2419
+ },
2420
+ "32299": {
2421
+ "content": "๐„–",
2422
+ "lstrip": false,
2423
+ "normalized": true,
2424
+ "rstrip": false,
2425
+ "single_word": false,
2426
+ "special": false
2427
+ },
2428
+ "32300": {
2429
+ "content": "๐€‚",
2430
+ "lstrip": false,
2431
+ "normalized": true,
2432
+ "rstrip": false,
2433
+ "single_word": false,
2434
+ "special": false
2435
+ },
2436
+ "32301": {
2437
+ "content": "๐€Š",
2438
+ "lstrip": false,
2439
+ "normalized": true,
2440
+ "rstrip": false,
2441
+ "single_word": false,
2442
+ "special": false
2443
+ },
2444
+ "32302": {
2445
+ "content": "๐ƒฒ",
2446
+ "lstrip": false,
2447
+ "normalized": true,
2448
+ "rstrip": false,
2449
+ "single_word": false,
2450
+ "special": false
2451
+ },
2452
+ "32303": {
2453
+ "content": "๐„ข",
2454
+ "lstrip": false,
2455
+ "normalized": true,
2456
+ "rstrip": false,
2457
+ "single_word": false,
2458
+ "special": false
2459
+ },
2460
+ "32304": {
2461
+ "content": "๐ƒ",
2462
+ "lstrip": false,
2463
+ "normalized": true,
2464
+ "rstrip": false,
2465
+ "single_word": false,
2466
+ "special": false
2467
+ },
2468
+ "32305": {
2469
+ "content": "๐‚",
2470
+ "lstrip": false,
2471
+ "normalized": true,
2472
+ "rstrip": false,
2473
+ "single_word": false,
2474
+ "special": false
2475
+ },
2476
+ "32306": {
2477
+ "content": "๐ƒ—",
2478
+ "lstrip": false,
2479
+ "normalized": true,
2480
+ "rstrip": false,
2481
+ "single_word": false,
2482
+ "special": false
2483
+ },
2484
+ "32307": {
2485
+ "content": "๐ƒฆ",
2486
+ "lstrip": false,
2487
+ "normalized": true,
2488
+ "rstrip": false,
2489
+ "single_word": false,
2490
+ "special": false
2491
+ },
2492
+ "32308": {
2493
+ "content": "๐‚ช",
2494
+ "lstrip": false,
2495
+ "normalized": true,
2496
+ "rstrip": false,
2497
+ "single_word": false,
2498
+ "special": false
2499
+ },
2500
+ "32309": {
2501
+ "content": "๐ƒฅ",
2502
+ "lstrip": false,
2503
+ "normalized": true,
2504
+ "rstrip": false,
2505
+ "single_word": false,
2506
+ "special": false
2507
+ },
2508
+ "32310": {
2509
+ "content": "๐€ต",
2510
+ "lstrip": false,
2511
+ "normalized": true,
2512
+ "rstrip": false,
2513
+ "single_word": false,
2514
+ "special": false
2515
+ },
2516
+ "32311": {
2517
+ "content": "๐€™",
2518
+ "lstrip": false,
2519
+ "normalized": true,
2520
+ "rstrip": false,
2521
+ "single_word": false,
2522
+ "special": false
2523
+ },
2524
+ "32312": {
2525
+ "content": "๐ƒ ",
2526
+ "lstrip": false,
2527
+ "normalized": true,
2528
+ "rstrip": false,
2529
+ "single_word": false,
2530
+ "special": false
2531
+ },
2532
+ "32313": {
2533
+ "content": "๐‚‡",
2534
+ "lstrip": false,
2535
+ "normalized": true,
2536
+ "rstrip": false,
2537
+ "single_word": false,
2538
+ "special": false
2539
+ },
2540
+ "32314": {
2541
+ "content": "๐‡",
2542
+ "lstrip": false,
2543
+ "normalized": true,
2544
+ "rstrip": false,
2545
+ "single_word": false,
2546
+ "special": false
2547
+ },
2548
+ "32315": {
2549
+ "content": "๐€ค",
2550
+ "lstrip": false,
2551
+ "normalized": true,
2552
+ "rstrip": false,
2553
+ "single_word": false,
2554
+ "special": false
2555
+ },
2556
+ "32316": {
2557
+ "content": "๐‚ธ",
2558
+ "lstrip": false,
2559
+ "normalized": true,
2560
+ "rstrip": false,
2561
+ "single_word": false,
2562
+ "special": false
2563
+ },
2564
+ "32317": {
2565
+ "content": "๐„ˆ",
2566
+ "lstrip": false,
2567
+ "normalized": true,
2568
+ "rstrip": false,
2569
+ "single_word": false,
2570
+ "special": false
2571
+ },
2572
+ "32318": {
2573
+ "content": "๐„ฃ",
2574
+ "lstrip": false,
2575
+ "normalized": true,
2576
+ "rstrip": false,
2577
+ "single_word": false,
2578
+ "special": false
2579
+ },
2580
+ "32319": {
2581
+ "content": "๐„Ÿ",
2582
+ "lstrip": false,
2583
+ "normalized": true,
2584
+ "rstrip": false,
2585
+ "single_word": false,
2586
+ "special": false
2587
+ },
2588
+ "32320": {
2589
+ "content": "๐€ข",
2590
+ "lstrip": false,
2591
+ "normalized": true,
2592
+ "rstrip": false,
2593
+ "single_word": false,
2594
+ "special": false
2595
+ },
2596
+ "32321": {
2597
+ "content": "๐€ด",
2598
+ "lstrip": false,
2599
+ "normalized": true,
2600
+ "rstrip": false,
2601
+ "single_word": false,
2602
+ "special": false
2603
+ },
2604
+ "32322": {
2605
+ "content": "๐„ฅ",
2606
+ "lstrip": false,
2607
+ "normalized": true,
2608
+ "rstrip": false,
2609
+ "single_word": false,
2610
+ "special": false
2611
+ },
2612
+ "32323": {
2613
+ "content": "๐ƒ",
2614
+ "lstrip": false,
2615
+ "normalized": true,
2616
+ "rstrip": false,
2617
+ "single_word": false,
2618
+ "special": false
2619
+ },
2620
+ "32324": {
2621
+ "content": "๐€บ",
2622
+ "lstrip": false,
2623
+ "normalized": true,
2624
+ "rstrip": false,
2625
+ "single_word": false,
2626
+ "special": false
2627
+ },
2628
+ "32325": {
2629
+ "content": "๐€ฟ",
2630
+ "lstrip": false,
2631
+ "normalized": true,
2632
+ "rstrip": false,
2633
+ "single_word": false,
2634
+ "special": false
2635
+ },
2636
+ "32326": {
2637
+ "content": "๐‚ก",
2638
+ "lstrip": false,
2639
+ "normalized": true,
2640
+ "rstrip": false,
2641
+ "single_word": false,
2642
+ "special": false
2643
+ },
2644
+ "32327": {
2645
+ "content": "๐€‡",
2646
+ "lstrip": false,
2647
+ "normalized": true,
2648
+ "rstrip": false,
2649
+ "single_word": false,
2650
+ "special": false
2651
+ },
2652
+ "32328": {
2653
+ "content": "๐ƒจ",
2654
+ "lstrip": false,
2655
+ "normalized": true,
2656
+ "rstrip": false,
2657
+ "single_word": false,
2658
+ "special": false
2659
+ },
2660
+ "32329": {
2661
+ "content": "๐ƒต",
2662
+ "lstrip": false,
2663
+ "normalized": true,
2664
+ "rstrip": false,
2665
+ "single_word": false,
2666
+ "special": false
2667
+ },
2668
+ "32330": {
2669
+ "content": "๐‚Š",
2670
+ "lstrip": false,
2671
+ "normalized": true,
2672
+ "rstrip": false,
2673
+ "single_word": false,
2674
+ "special": false
2675
+ },
2676
+ "32331": {
2677
+ "content": "๐ƒข",
2678
+ "lstrip": false,
2679
+ "normalized": true,
2680
+ "rstrip": false,
2681
+ "single_word": false,
2682
+ "special": false
2683
+ },
2684
+ "32332": {
2685
+ "content": "๐‚ฑ",
2686
+ "lstrip": false,
2687
+ "normalized": true,
2688
+ "rstrip": false,
2689
+ "single_word": false,
2690
+ "special": false
2691
+ },
2692
+ "32333": {
2693
+ "content": "๐€“",
2694
+ "lstrip": false,
2695
+ "normalized": true,
2696
+ "rstrip": false,
2697
+ "single_word": false,
2698
+ "special": false
2699
+ },
2700
+ "32334": {
2701
+ "content": "๐˜",
2702
+ "lstrip": false,
2703
+ "normalized": true,
2704
+ "rstrip": false,
2705
+ "single_word": false,
2706
+ "special": false
2707
+ },
2708
+ "32335": {
2709
+ "content": "๐‚ฃ",
2710
+ "lstrip": false,
2711
+ "normalized": true,
2712
+ "rstrip": false,
2713
+ "single_word": false,
2714
+ "special": false
2715
+ },
2716
+ "32336": {
2717
+ "content": "๐„‘",
2718
+ "lstrip": false,
2719
+ "normalized": true,
2720
+ "rstrip": false,
2721
+ "single_word": false,
2722
+ "special": false
2723
+ },
2724
+ "32337": {
2725
+ "content": "๐‚Œ",
2726
+ "lstrip": false,
2727
+ "normalized": true,
2728
+ "rstrip": false,
2729
+ "single_word": false,
2730
+ "special": false
2731
+ },
2732
+ "32338": {
2733
+ "content": "๐ƒซ",
2734
+ "lstrip": false,
2735
+ "normalized": true,
2736
+ "rstrip": false,
2737
+ "single_word": false,
2738
+ "special": false
2739
+ },
2740
+ "32339": {
2741
+ "content": "๐€‘",
2742
+ "lstrip": false,
2743
+ "normalized": true,
2744
+ "rstrip": false,
2745
+ "single_word": false,
2746
+ "special": false
2747
+ },
2748
+ "32340": {
2749
+ "content": "๐‚ซ",
2750
+ "lstrip": false,
2751
+ "normalized": true,
2752
+ "rstrip": false,
2753
+ "single_word": false,
2754
+ "special": false
2755
+ },
2756
+ "32341": {
2757
+ "content": "๐€ฏ",
2758
+ "lstrip": false,
2759
+ "normalized": true,
2760
+ "rstrip": false,
2761
+ "single_word": false,
2762
+ "special": false
2763
+ },
2764
+ "32342": {
2765
+ "content": "๐ƒฎ",
2766
+ "lstrip": false,
2767
+ "normalized": true,
2768
+ "rstrip": false,
2769
+ "single_word": false,
2770
+ "special": false
2771
+ },
2772
+ "32343": {
2773
+ "content": "๐ƒฏ",
2774
+ "lstrip": false,
2775
+ "normalized": true,
2776
+ "rstrip": false,
2777
+ "single_word": false,
2778
+ "special": false
2779
+ },
2780
+ "32344": {
2781
+ "content": "๐ƒ",
2782
  "lstrip": false,
2783
  "normalized": true,
2784
  "rstrip": false,
 
2888
  "<extra_id_98>",
2889
  "<extra_id_99>"
2890
  ],
2891
+ "clean_up_tokenization_spaces": true,
2892
  "eos_token": "</s>",
2893
  "extra_ids": 100,
2894
  "extra_special_tokens": {},
2895
+ "model_max_length": 512,
2896
  "pad_token": "<pad>",
2897
  "tokenizer_class": "T5Tokenizer",
2898
  "unk_token": "<unk>"
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8a92891584bf869ae6fcdc9272477ed521d4bd4c81af5a95c4818269dec3d69
3
  size 5969
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6411eabd7ab053f58f1ad50c273d1ced6ddce181a1053baed6c4fab8f72d7c85
3
  size 5969