gpol13 committed on
Commit
d5d745c
·
verified ·
1 Parent(s): 138f96f

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -199,4 +199,4 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
199
  [More Information Needed]
200
  ### Framework versions
201
 
202
- - PEFT 0.14.0
 
199
  [More Information Needed]
200
  ### Framework versions
201
 
202
+ - PEFT 0.12.0
adapter_config.json CHANGED
@@ -3,8 +3,6 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Salesforce/codet5-base",
5
  "bias": "none",
6
- "eva_config": null,
7
- "exclude_modules": null,
8
  "fan_in_fan_out": false,
9
  "inference_mode": true,
10
  "init_lora_weights": true,
@@ -13,7 +11,6 @@
13
  "layers_to_transform": null,
14
  "loftq_config": {},
15
  "lora_alpha": 16,
16
- "lora_bias": false,
17
  "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
@@ -24,7 +21,9 @@
24
  "revision": null,
25
  "target_modules": [
26
  "q",
27
- "v"
 
 
28
  ],
29
  "task_type": "SEQ_2_SEQ_LM",
30
  "use_dora": false,
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "Salesforce/codet5-base",
5
  "bias": "none",
 
 
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
 
11
  "layers_to_transform": null,
12
  "loftq_config": {},
13
  "lora_alpha": 16,
 
14
  "lora_dropout": 0.1,
15
  "megatron_config": null,
16
  "megatron_core": "megatron.core",
 
21
  "revision": null,
22
  "target_modules": [
23
  "q",
24
+ "v",
25
+ "k",
26
+ "o"
27
  ],
28
  "task_type": "SEQ_2_SEQ_LM",
29
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:626aff5650b6dcfb6222236d07bcc5b0b087d26230196dfb68526f0dc5e7275a
3
- size 3558888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b87fd4500c6c9300429679f9f63df6321344be4518b290be0dfce13c896cff96
3
+ size 7117824
checkpoint-9213/README.md ADDED
@@ -0,0 +1,202 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: Salesforce/codet5-base
3
+ library_name: peft
4
+ ---
5
+
6
+ # Model Card for Model ID
7
+
8
+ <!-- Provide a quick summary of what the model is/does. -->
9
+
10
+
11
+
12
+ ## Model Details
13
+
14
+ ### Model Description
15
+
16
+ <!-- Provide a longer summary of what this model is. -->
17
+
18
+
19
+
20
+ - **Developed by:** [More Information Needed]
21
+ - **Funded by [optional]:** [More Information Needed]
22
+ - **Shared by [optional]:** [More Information Needed]
23
+ - **Model type:** [More Information Needed]
24
+ - **Language(s) (NLP):** [More Information Needed]
25
+ - **License:** [More Information Needed]
26
+ - **Finetuned from model [optional]:** [More Information Needed]
27
+
28
+ ### Model Sources [optional]
29
+
30
+ <!-- Provide the basic links for the model. -->
31
+
32
+ - **Repository:** [More Information Needed]
33
+ - **Paper [optional]:** [More Information Needed]
34
+ - **Demo [optional]:** [More Information Needed]
35
+
36
+ ## Uses
37
+
38
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
39
+
40
+ ### Direct Use
41
+
42
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
43
+
44
+ [More Information Needed]
45
+
46
+ ### Downstream Use [optional]
47
+
48
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Out-of-Scope Use
53
+
54
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
55
+
56
+ [More Information Needed]
57
+
58
+ ## Bias, Risks, and Limitations
59
+
60
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ### Recommendations
65
+
66
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
67
+
68
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
69
+
70
+ ## How to Get Started with the Model
71
+
72
+ Use the code below to get started with the model.
73
+
74
+ [More Information Needed]
75
+
76
+ ## Training Details
77
+
78
+ ### Training Data
79
+
80
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
81
+
82
+ [More Information Needed]
83
+
84
+ ### Training Procedure
85
+
86
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
87
+
88
+ #### Preprocessing [optional]
89
+
90
+ [More Information Needed]
91
+
92
+
93
+ #### Training Hyperparameters
94
+
95
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
96
+
97
+ #### Speeds, Sizes, Times [optional]
98
+
99
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
100
+
101
+ [More Information Needed]
102
+
103
+ ## Evaluation
104
+
105
+ <!-- This section describes the evaluation protocols and provides the results. -->
106
+
107
+ ### Testing Data, Factors & Metrics
108
+
109
+ #### Testing Data
110
+
111
+ <!-- This should link to a Dataset Card if possible. -->
112
+
113
+ [More Information Needed]
114
+
115
+ #### Factors
116
+
117
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Metrics
122
+
123
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
124
+
125
+ [More Information Needed]
126
+
127
+ ### Results
128
+
129
+ [More Information Needed]
130
+
131
+ #### Summary
132
+
133
+
134
+
135
+ ## Model Examination [optional]
136
+
137
+ <!-- Relevant interpretability work for the model goes here -->
138
+
139
+ [More Information Needed]
140
+
141
+ ## Environmental Impact
142
+
143
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
144
+
145
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
146
+
147
+ - **Hardware Type:** [More Information Needed]
148
+ - **Hours used:** [More Information Needed]
149
+ - **Cloud Provider:** [More Information Needed]
150
+ - **Compute Region:** [More Information Needed]
151
+ - **Carbon Emitted:** [More Information Needed]
152
+
153
+ ## Technical Specifications [optional]
154
+
155
+ ### Model Architecture and Objective
156
+
157
+ [More Information Needed]
158
+
159
+ ### Compute Infrastructure
160
+
161
+ [More Information Needed]
162
+
163
+ #### Hardware
164
+
165
+ [More Information Needed]
166
+
167
+ #### Software
168
+
169
+ [More Information Needed]
170
+
171
+ ## Citation [optional]
172
+
173
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
174
+
175
+ **BibTeX:**
176
+
177
+ [More Information Needed]
178
+
179
+ **APA:**
180
+
181
+ [More Information Needed]
182
+
183
+ ## Glossary [optional]
184
+
185
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
186
+
187
+ [More Information Needed]
188
+
189
+ ## More Information [optional]
190
+
191
+ [More Information Needed]
192
+
193
+ ## Model Card Authors [optional]
194
+
195
+ [More Information Needed]
196
+
197
+ ## Model Card Contact
198
+
199
+ [More Information Needed]
200
+ ### Framework versions
201
+
202
+ - PEFT 0.12.0
checkpoint-9213/adapter_config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "Salesforce/codet5-base",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layer_replication": null,
10
+ "layers_pattern": null,
11
+ "layers_to_transform": null,
12
+ "loftq_config": {},
13
+ "lora_alpha": 16,
14
+ "lora_dropout": 0.1,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
+ "modules_to_save": null,
18
+ "peft_type": "LORA",
19
+ "r": 8,
20
+ "rank_pattern": {},
21
+ "revision": null,
22
+ "target_modules": [
23
+ "q",
24
+ "v",
25
+ "k",
26
+ "o"
27
+ ],
28
+ "task_type": "SEQ_2_SEQ_LM",
29
+ "use_dora": false,
30
+ "use_rslora": false
31
+ }
checkpoint-9213/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b87fd4500c6c9300429679f9f63df6321344be4518b290be0dfce13c896cff96
3
+ size 7117824
checkpoint-9213/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c20c3421f0b146d60025b0b2185ba0b8930533f1dab202a1b41b5b3c01d2f78f
3
+ size 14397434
checkpoint-9213/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be754dba0c3662c12f8b07c5fd72ef60160e13708e25173bb6b57ab26d1fc1b8
3
+ size 14244
checkpoint-9213/scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbdb7492a0661aca7d7ba8026bad4935918d9a2cd6ddeb5e7d11db4707b6d6a7
3
+ size 988
checkpoint-9213/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86f76c2ec4b565b492a4eb45c2841a642f13f08f818fe4b2b9aace67ef4630b6
3
+ size 1064
checkpoint-9213/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-9213/tokenizer_config.json ADDED
@@ -0,0 +1,719 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "additional_special_tokens": [
4
+ {
5
+ "content": "<extra_id_99>",
6
+ "lstrip": true,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ {
12
+ "content": "<extra_id_98>",
13
+ "lstrip": true,
14
+ "normalized": true,
15
+ "rstrip": false,
16
+ "single_word": false
17
+ },
18
+ {
19
+ "content": "<extra_id_97>",
20
+ "lstrip": true,
21
+ "normalized": true,
22
+ "rstrip": false,
23
+ "single_word": false
24
+ },
25
+ {
26
+ "content": "<extra_id_96>",
27
+ "lstrip": true,
28
+ "normalized": true,
29
+ "rstrip": false,
30
+ "single_word": false
31
+ },
32
+ {
33
+ "content": "<extra_id_95>",
34
+ "lstrip": true,
35
+ "normalized": true,
36
+ "rstrip": false,
37
+ "single_word": false
38
+ },
39
+ {
40
+ "content": "<extra_id_94>",
41
+ "lstrip": true,
42
+ "normalized": true,
43
+ "rstrip": false,
44
+ "single_word": false
45
+ },
46
+ {
47
+ "content": "<extra_id_93>",
48
+ "lstrip": true,
49
+ "normalized": true,
50
+ "rstrip": false,
51
+ "single_word": false
52
+ },
53
+ {
54
+ "content": "<extra_id_92>",
55
+ "lstrip": true,
56
+ "normalized": true,
57
+ "rstrip": false,
58
+ "single_word": false
59
+ },
60
+ {
61
+ "content": "<extra_id_91>",
62
+ "lstrip": true,
63
+ "normalized": true,
64
+ "rstrip": false,
65
+ "single_word": false
66
+ },
67
+ {
68
+ "content": "<extra_id_90>",
69
+ "lstrip": true,
70
+ "normalized": true,
71
+ "rstrip": false,
72
+ "single_word": false
73
+ },
74
+ {
75
+ "content": "<extra_id_89>",
76
+ "lstrip": true,
77
+ "normalized": true,
78
+ "rstrip": false,
79
+ "single_word": false
80
+ },
81
+ {
82
+ "content": "<extra_id_88>",
83
+ "lstrip": true,
84
+ "normalized": true,
85
+ "rstrip": false,
86
+ "single_word": false
87
+ },
88
+ {
89
+ "content": "<extra_id_87>",
90
+ "lstrip": true,
91
+ "normalized": true,
92
+ "rstrip": false,
93
+ "single_word": false
94
+ },
95
+ {
96
+ "content": "<extra_id_86>",
97
+ "lstrip": true,
98
+ "normalized": true,
99
+ "rstrip": false,
100
+ "single_word": false
101
+ },
102
+ {
103
+ "content": "<extra_id_85>",
104
+ "lstrip": true,
105
+ "normalized": true,
106
+ "rstrip": false,
107
+ "single_word": false
108
+ },
109
+ {
110
+ "content": "<extra_id_84>",
111
+ "lstrip": true,
112
+ "normalized": true,
113
+ "rstrip": false,
114
+ "single_word": false
115
+ },
116
+ {
117
+ "content": "<extra_id_83>",
118
+ "lstrip": true,
119
+ "normalized": true,
120
+ "rstrip": false,
121
+ "single_word": false
122
+ },
123
+ {
124
+ "content": "<extra_id_82>",
125
+ "lstrip": true,
126
+ "normalized": true,
127
+ "rstrip": false,
128
+ "single_word": false
129
+ },
130
+ {
131
+ "content": "<extra_id_81>",
132
+ "lstrip": true,
133
+ "normalized": true,
134
+ "rstrip": false,
135
+ "single_word": false
136
+ },
137
+ {
138
+ "content": "<extra_id_80>",
139
+ "lstrip": true,
140
+ "normalized": true,
141
+ "rstrip": false,
142
+ "single_word": false
143
+ },
144
+ {
145
+ "content": "<extra_id_79>",
146
+ "lstrip": true,
147
+ "normalized": true,
148
+ "rstrip": false,
149
+ "single_word": false
150
+ },
151
+ {
152
+ "content": "<extra_id_78>",
153
+ "lstrip": true,
154
+ "normalized": true,
155
+ "rstrip": false,
156
+ "single_word": false
157
+ },
158
+ {
159
+ "content": "<extra_id_77>",
160
+ "lstrip": true,
161
+ "normalized": true,
162
+ "rstrip": false,
163
+ "single_word": false
164
+ },
165
+ {
166
+ "content": "<extra_id_76>",
167
+ "lstrip": true,
168
+ "normalized": true,
169
+ "rstrip": false,
170
+ "single_word": false
171
+ },
172
+ {
173
+ "content": "<extra_id_75>",
174
+ "lstrip": true,
175
+ "normalized": true,
176
+ "rstrip": false,
177
+ "single_word": false
178
+ },
179
+ {
180
+ "content": "<extra_id_74>",
181
+ "lstrip": true,
182
+ "normalized": true,
183
+ "rstrip": false,
184
+ "single_word": false
185
+ },
186
+ {
187
+ "content": "<extra_id_73>",
188
+ "lstrip": true,
189
+ "normalized": true,
190
+ "rstrip": false,
191
+ "single_word": false
192
+ },
193
+ {
194
+ "content": "<extra_id_72>",
195
+ "lstrip": true,
196
+ "normalized": true,
197
+ "rstrip": false,
198
+ "single_word": false
199
+ },
200
+ {
201
+ "content": "<extra_id_71>",
202
+ "lstrip": true,
203
+ "normalized": true,
204
+ "rstrip": false,
205
+ "single_word": false
206
+ },
207
+ {
208
+ "content": "<extra_id_70>",
209
+ "lstrip": true,
210
+ "normalized": true,
211
+ "rstrip": false,
212
+ "single_word": false
213
+ },
214
+ {
215
+ "content": "<extra_id_69>",
216
+ "lstrip": true,
217
+ "normalized": true,
218
+ "rstrip": false,
219
+ "single_word": false
220
+ },
221
+ {
222
+ "content": "<extra_id_68>",
223
+ "lstrip": true,
224
+ "normalized": true,
225
+ "rstrip": false,
226
+ "single_word": false
227
+ },
228
+ {
229
+ "content": "<extra_id_67>",
230
+ "lstrip": true,
231
+ "normalized": true,
232
+ "rstrip": false,
233
+ "single_word": false
234
+ },
235
+ {
236
+ "content": "<extra_id_66>",
237
+ "lstrip": true,
238
+ "normalized": true,
239
+ "rstrip": false,
240
+ "single_word": false
241
+ },
242
+ {
243
+ "content": "<extra_id_65>",
244
+ "lstrip": true,
245
+ "normalized": true,
246
+ "rstrip": false,
247
+ "single_word": false
248
+ },
249
+ {
250
+ "content": "<extra_id_64>",
251
+ "lstrip": true,
252
+ "normalized": true,
253
+ "rstrip": false,
254
+ "single_word": false
255
+ },
256
+ {
257
+ "content": "<extra_id_63>",
258
+ "lstrip": true,
259
+ "normalized": true,
260
+ "rstrip": false,
261
+ "single_word": false
262
+ },
263
+ {
264
+ "content": "<extra_id_62>",
265
+ "lstrip": true,
266
+ "normalized": true,
267
+ "rstrip": false,
268
+ "single_word": false
269
+ },
270
+ {
271
+ "content": "<extra_id_61>",
272
+ "lstrip": true,
273
+ "normalized": true,
274
+ "rstrip": false,
275
+ "single_word": false
276
+ },
277
+ {
278
+ "content": "<extra_id_60>",
279
+ "lstrip": true,
280
+ "normalized": true,
281
+ "rstrip": false,
282
+ "single_word": false
283
+ },
284
+ {
285
+ "content": "<extra_id_59>",
286
+ "lstrip": true,
287
+ "normalized": true,
288
+ "rstrip": false,
289
+ "single_word": false
290
+ },
291
+ {
292
+ "content": "<extra_id_58>",
293
+ "lstrip": true,
294
+ "normalized": true,
295
+ "rstrip": false,
296
+ "single_word": false
297
+ },
298
+ {
299
+ "content": "<extra_id_57>",
300
+ "lstrip": true,
301
+ "normalized": true,
302
+ "rstrip": false,
303
+ "single_word": false
304
+ },
305
+ {
306
+ "content": "<extra_id_56>",
307
+ "lstrip": true,
308
+ "normalized": true,
309
+ "rstrip": false,
310
+ "single_word": false
311
+ },
312
+ {
313
+ "content": "<extra_id_55>",
314
+ "lstrip": true,
315
+ "normalized": true,
316
+ "rstrip": false,
317
+ "single_word": false
318
+ },
319
+ {
320
+ "content": "<extra_id_54>",
321
+ "lstrip": true,
322
+ "normalized": true,
323
+ "rstrip": false,
324
+ "single_word": false
325
+ },
326
+ {
327
+ "content": "<extra_id_53>",
328
+ "lstrip": true,
329
+ "normalized": true,
330
+ "rstrip": false,
331
+ "single_word": false
332
+ },
333
+ {
334
+ "content": "<extra_id_52>",
335
+ "lstrip": true,
336
+ "normalized": true,
337
+ "rstrip": false,
338
+ "single_word": false
339
+ },
340
+ {
341
+ "content": "<extra_id_51>",
342
+ "lstrip": true,
343
+ "normalized": true,
344
+ "rstrip": false,
345
+ "single_word": false
346
+ },
347
+ {
348
+ "content": "<extra_id_50>",
349
+ "lstrip": true,
350
+ "normalized": true,
351
+ "rstrip": false,
352
+ "single_word": false
353
+ },
354
+ {
355
+ "content": "<extra_id_49>",
356
+ "lstrip": true,
357
+ "normalized": true,
358
+ "rstrip": false,
359
+ "single_word": false
360
+ },
361
+ {
362
+ "content": "<extra_id_48>",
363
+ "lstrip": true,
364
+ "normalized": true,
365
+ "rstrip": false,
366
+ "single_word": false
367
+ },
368
+ {
369
+ "content": "<extra_id_47>",
370
+ "lstrip": true,
371
+ "normalized": true,
372
+ "rstrip": false,
373
+ "single_word": false
374
+ },
375
+ {
376
+ "content": "<extra_id_46>",
377
+ "lstrip": true,
378
+ "normalized": true,
379
+ "rstrip": false,
380
+ "single_word": false
381
+ },
382
+ {
383
+ "content": "<extra_id_45>",
384
+ "lstrip": true,
385
+ "normalized": true,
386
+ "rstrip": false,
387
+ "single_word": false
388
+ },
389
+ {
390
+ "content": "<extra_id_44>",
391
+ "lstrip": true,
392
+ "normalized": true,
393
+ "rstrip": false,
394
+ "single_word": false
395
+ },
396
+ {
397
+ "content": "<extra_id_43>",
398
+ "lstrip": true,
399
+ "normalized": true,
400
+ "rstrip": false,
401
+ "single_word": false
402
+ },
403
+ {
404
+ "content": "<extra_id_42>",
405
+ "lstrip": true,
406
+ "normalized": true,
407
+ "rstrip": false,
408
+ "single_word": false
409
+ },
410
+ {
411
+ "content": "<extra_id_41>",
412
+ "lstrip": true,
413
+ "normalized": true,
414
+ "rstrip": false,
415
+ "single_word": false
416
+ },
417
+ {
418
+ "content": "<extra_id_40>",
419
+ "lstrip": true,
420
+ "normalized": true,
421
+ "rstrip": false,
422
+ "single_word": false
423
+ },
424
+ {
425
+ "content": "<extra_id_39>",
426
+ "lstrip": true,
427
+ "normalized": true,
428
+ "rstrip": false,
429
+ "single_word": false
430
+ },
431
+ {
432
+ "content": "<extra_id_38>",
433
+ "lstrip": true,
434
+ "normalized": true,
435
+ "rstrip": false,
436
+ "single_word": false
437
+ },
438
+ {
439
+ "content": "<extra_id_37>",
440
+ "lstrip": true,
441
+ "normalized": true,
442
+ "rstrip": false,
443
+ "single_word": false
444
+ },
445
+ {
446
+ "content": "<extra_id_36>",
447
+ "lstrip": true,
448
+ "normalized": true,
449
+ "rstrip": false,
450
+ "single_word": false
451
+ },
452
+ {
453
+ "content": "<extra_id_35>",
454
+ "lstrip": true,
455
+ "normalized": true,
456
+ "rstrip": false,
457
+ "single_word": false
458
+ },
459
+ {
460
+ "content": "<extra_id_34>",
461
+ "lstrip": true,
462
+ "normalized": true,
463
+ "rstrip": false,
464
+ "single_word": false
465
+ },
466
+ {
467
+ "content": "<extra_id_33>",
468
+ "lstrip": true,
469
+ "normalized": true,
470
+ "rstrip": false,
471
+ "single_word": false
472
+ },
473
+ {
474
+ "content": "<extra_id_32>",
475
+ "lstrip": true,
476
+ "normalized": true,
477
+ "rstrip": false,
478
+ "single_word": false
479
+ },
480
+ {
481
+ "content": "<extra_id_31>",
482
+ "lstrip": true,
483
+ "normalized": true,
484
+ "rstrip": false,
485
+ "single_word": false
486
+ },
487
+ {
488
+ "content": "<extra_id_30>",
489
+ "lstrip": true,
490
+ "normalized": true,
491
+ "rstrip": false,
492
+ "single_word": false
493
+ },
494
+ {
495
+ "content": "<extra_id_29>",
496
+ "lstrip": true,
497
+ "normalized": true,
498
+ "rstrip": false,
499
+ "single_word": false
500
+ },
501
+ {
502
+ "content": "<extra_id_28>",
503
+ "lstrip": true,
504
+ "normalized": true,
505
+ "rstrip": false,
506
+ "single_word": false
507
+ },
508
+ {
509
+ "content": "<extra_id_27>",
510
+ "lstrip": true,
511
+ "normalized": true,
512
+ "rstrip": false,
513
+ "single_word": false
514
+ },
515
+ {
516
+ "content": "<extra_id_26>",
517
+ "lstrip": true,
518
+ "normalized": true,
519
+ "rstrip": false,
520
+ "single_word": false
521
+ },
522
+ {
523
+ "content": "<extra_id_25>",
524
+ "lstrip": true,
525
+ "normalized": true,
526
+ "rstrip": false,
527
+ "single_word": false
528
+ },
529
+ {
530
+ "content": "<extra_id_24>",
531
+ "lstrip": true,
532
+ "normalized": true,
533
+ "rstrip": false,
534
+ "single_word": false
535
+ },
536
+ {
537
+ "content": "<extra_id_23>",
538
+ "lstrip": true,
539
+ "normalized": true,
540
+ "rstrip": false,
541
+ "single_word": false
542
+ },
543
+ {
544
+ "content": "<extra_id_22>",
545
+ "lstrip": true,
546
+ "normalized": true,
547
+ "rstrip": false,
548
+ "single_word": false
549
+ },
550
+ {
551
+ "content": "<extra_id_21>",
552
+ "lstrip": true,
553
+ "normalized": true,
554
+ "rstrip": false,
555
+ "single_word": false
556
+ },
557
+ {
558
+ "content": "<extra_id_20>",
559
+ "lstrip": true,
560
+ "normalized": true,
561
+ "rstrip": false,
562
+ "single_word": false
563
+ },
564
+ {
565
+ "content": "<extra_id_19>",
566
+ "lstrip": true,
567
+ "normalized": true,
568
+ "rstrip": false,
569
+ "single_word": false
570
+ },
571
+ {
572
+ "content": "<extra_id_18>",
573
+ "lstrip": true,
574
+ "normalized": true,
575
+ "rstrip": false,
576
+ "single_word": false
577
+ },
578
+ {
579
+ "content": "<extra_id_17>",
580
+ "lstrip": true,
581
+ "normalized": true,
582
+ "rstrip": false,
583
+ "single_word": false
584
+ },
585
+ {
586
+ "content": "<extra_id_16>",
587
+ "lstrip": true,
588
+ "normalized": true,
589
+ "rstrip": false,
590
+ "single_word": false
591
+ },
592
+ {
593
+ "content": "<extra_id_15>",
594
+ "lstrip": true,
595
+ "normalized": true,
596
+ "rstrip": false,
597
+ "single_word": false
598
+ },
599
+ {
600
+ "content": "<extra_id_14>",
601
+ "lstrip": true,
602
+ "normalized": true,
603
+ "rstrip": false,
604
+ "single_word": false
605
+ },
606
+ {
607
+ "content": "<extra_id_13>",
608
+ "lstrip": true,
609
+ "normalized": true,
610
+ "rstrip": false,
611
+ "single_word": false
612
+ },
613
+ {
614
+ "content": "<extra_id_12>",
615
+ "lstrip": true,
616
+ "normalized": true,
617
+ "rstrip": false,
618
+ "single_word": false
619
+ },
620
+ {
621
+ "content": "<extra_id_11>",
622
+ "lstrip": true,
623
+ "normalized": true,
624
+ "rstrip": false,
625
+ "single_word": false
626
+ },
627
+ {
628
+ "content": "<extra_id_10>",
629
+ "lstrip": true,
630
+ "normalized": true,
631
+ "rstrip": false,
632
+ "single_word": false
633
+ },
634
+ {
635
+ "content": "<extra_id_9>",
636
+ "lstrip": true,
637
+ "normalized": true,
638
+ "rstrip": false,
639
+ "single_word": false
640
+ },
641
+ {
642
+ "content": "<extra_id_8>",
643
+ "lstrip": true,
644
+ "normalized": true,
645
+ "rstrip": false,
646
+ "single_word": false
647
+ },
648
+ {
649
+ "content": "<extra_id_7>",
650
+ "lstrip": true,
651
+ "normalized": true,
652
+ "rstrip": false,
653
+ "single_word": false
654
+ },
655
+ {
656
+ "content": "<extra_id_6>",
657
+ "lstrip": true,
658
+ "normalized": true,
659
+ "rstrip": false,
660
+ "single_word": false
661
+ },
662
+ {
663
+ "content": "<extra_id_5>",
664
+ "lstrip": true,
665
+ "normalized": true,
666
+ "rstrip": false,
667
+ "single_word": false
668
+ },
669
+ {
670
+ "content": "<extra_id_4>",
671
+ "lstrip": true,
672
+ "normalized": true,
673
+ "rstrip": false,
674
+ "single_word": false
675
+ },
676
+ {
677
+ "content": "<extra_id_3>",
678
+ "lstrip": true,
679
+ "normalized": true,
680
+ "rstrip": false,
681
+ "single_word": false
682
+ },
683
+ {
684
+ "content": "<extra_id_2>",
685
+ "lstrip": true,
686
+ "normalized": true,
687
+ "rstrip": false,
688
+ "single_word": false
689
+ },
690
+ {
691
+ "content": "<extra_id_1>",
692
+ "lstrip": true,
693
+ "normalized": true,
694
+ "rstrip": false,
695
+ "single_word": false
696
+ },
697
+ {
698
+ "content": "<extra_id_0>",
699
+ "lstrip": true,
700
+ "normalized": true,
701
+ "rstrip": false,
702
+ "single_word": false
703
+ }
704
+ ],
705
+ "backend": "tokenizers",
706
+ "bos_token": "<s>",
707
+ "cls_token": "<s>",
708
+ "eos_token": "</s>",
709
+ "errors": "replace",
710
+ "extra_special_tokens": [],
711
+ "is_local": false,
712
+ "mask_token": "<mask>",
713
+ "model_max_length": 512,
714
+ "pad_token": "<pad>",
715
+ "sep_token": "</s>",
716
+ "tokenizer_class": "RobertaTokenizer",
717
+ "trim_offsets": true,
718
+ "unk_token": "<unk>"
719
+ }
checkpoint-9213/trainer_state.json ADDED
@@ -0,0 +1,1361 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 3.0,
6
+ "eval_steps": 500,
7
+ "global_step": 9213,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.0162813415825464,
14
+ "grad_norm": 1.3799059391021729,
15
+ "learning_rate": 4.974492564854011e-05,
16
+ "loss": 4.366279296875,
17
+ "step": 50
18
+ },
19
+ {
20
+ "epoch": 0.0325626831650928,
21
+ "grad_norm": null,
22
+ "learning_rate": 4.9473569955497666e-05,
23
+ "loss": 3.2682159423828123,
24
+ "step": 100
25
+ },
26
+ {
27
+ "epoch": 0.04884402474763921,
28
+ "grad_norm": 1.1759626865386963,
29
+ "learning_rate": 4.9207641376316076e-05,
30
+ "loss": 2.121284637451172,
31
+ "step": 150
32
+ },
33
+ {
34
+ "epoch": 0.0651253663301856,
35
+ "grad_norm": 1.299229383468628,
36
+ "learning_rate": 4.8936285683273635e-05,
37
+ "loss": 1.8733770751953125,
38
+ "step": 200
39
+ },
40
+ {
41
+ "epoch": 0.08140670791273201,
42
+ "grad_norm": 1.3079231977462769,
43
+ "learning_rate": 4.8664929990231194e-05,
44
+ "loss": 1.8073320007324218,
45
+ "step": 250
46
+ },
47
+ {
48
+ "epoch": 0.09768804949527841,
49
+ "grad_norm": 1.5056711435317993,
50
+ "learning_rate": 4.839357429718876e-05,
51
+ "loss": 1.7036862182617187,
52
+ "step": 300
53
+ },
54
+ {
55
+ "epoch": 0.11396939107782482,
56
+ "grad_norm": 1.5221471786499023,
57
+ "learning_rate": 4.812221860414632e-05,
58
+ "loss": 1.6605093383789062,
59
+ "step": 350
60
+ },
61
+ {
62
+ "epoch": 0.1302507326603712,
63
+ "grad_norm": 1.4612085819244385,
64
+ "learning_rate": 4.785086291110388e-05,
65
+ "loss": 1.582379608154297,
66
+ "step": 400
67
+ },
68
+ {
69
+ "epoch": 0.14653207424291761,
70
+ "grad_norm": 1.3166944980621338,
71
+ "learning_rate": 4.7579507218061436e-05,
72
+ "loss": 1.5711520385742188,
73
+ "step": 450
74
+ },
75
+ {
76
+ "epoch": 0.16281341582546402,
77
+ "grad_norm": 1.8040547370910645,
78
+ "learning_rate": 4.7308151525018995e-05,
79
+ "loss": 1.436278076171875,
80
+ "step": 500
81
+ },
82
+ {
83
+ "epoch": 0.17909475740801042,
84
+ "grad_norm": 1.7718613147735596,
85
+ "learning_rate": 4.7036795831976553e-05,
86
+ "loss": 1.4956285095214843,
87
+ "step": 550
88
+ },
89
+ {
90
+ "epoch": 0.19537609899055683,
91
+ "grad_norm": 2.499027967453003,
92
+ "learning_rate": 4.676544013893412e-05,
93
+ "loss": 1.3423948669433594,
94
+ "step": 600
95
+ },
96
+ {
97
+ "epoch": 0.21165744057310323,
98
+ "grad_norm": 1.7684857845306396,
99
+ "learning_rate": 4.649408444589168e-05,
100
+ "loss": 1.358212432861328,
101
+ "step": 650
102
+ },
103
+ {
104
+ "epoch": 0.22793878215564964,
105
+ "grad_norm": 1.8858190774917603,
106
+ "learning_rate": 4.622815586671009e-05,
107
+ "loss": 1.3155609130859376,
108
+ "step": 700
109
+ },
110
+ {
111
+ "epoch": 0.24422012373819602,
112
+ "grad_norm": 1.708154559135437,
113
+ "learning_rate": 4.5956800173667646e-05,
114
+ "loss": 1.204995346069336,
115
+ "step": 750
116
+ },
117
+ {
118
+ "epoch": 0.2605014653207424,
119
+ "grad_norm": 2.377797842025757,
120
+ "learning_rate": 4.5685444480625205e-05,
121
+ "loss": 1.2155376434326173,
122
+ "step": 800
123
+ },
124
+ {
125
+ "epoch": 0.2767828069032888,
126
+ "grad_norm": 2.3532145023345947,
127
+ "learning_rate": 4.5414088787582764e-05,
128
+ "loss": 1.2571015930175782,
129
+ "step": 850
130
+ },
131
+ {
132
+ "epoch": 0.29306414848583523,
133
+ "grad_norm": 2.745908498764038,
134
+ "learning_rate": 4.514273309454032e-05,
135
+ "loss": 1.1259475708007813,
136
+ "step": 900
137
+ },
138
+ {
139
+ "epoch": 0.30934549006838163,
140
+ "grad_norm": 4.180660247802734,
141
+ "learning_rate": 4.487137740149789e-05,
142
+ "loss": 1.1778811645507812,
143
+ "step": 950
144
+ },
145
+ {
146
+ "epoch": 0.32562683165092804,
147
+ "grad_norm": 2.554922103881836,
148
+ "learning_rate": 4.460002170845545e-05,
149
+ "loss": 1.144913787841797,
150
+ "step": 1000
151
+ },
152
+ {
153
+ "epoch": 0.34190817323347444,
154
+ "grad_norm": 2.6831798553466797,
155
+ "learning_rate": 4.4328666015413006e-05,
156
+ "loss": 1.1192340850830078,
157
+ "step": 1050
158
+ },
159
+ {
160
+ "epoch": 0.35818951481602085,
161
+ "grad_norm": 2.5000758171081543,
162
+ "learning_rate": 4.4057310322370565e-05,
163
+ "loss": 1.0886085510253907,
164
+ "step": 1100
165
+ },
166
+ {
167
+ "epoch": 0.37447085639856725,
168
+ "grad_norm": 2.5406346321105957,
169
+ "learning_rate": 4.3785954629328124e-05,
170
+ "loss": 1.0647865295410157,
171
+ "step": 1150
172
+ },
173
+ {
174
+ "epoch": 0.39075219798111366,
175
+ "grad_norm": 2.5966973304748535,
176
+ "learning_rate": 4.351459893628568e-05,
177
+ "loss": 1.0138130187988281,
178
+ "step": 1200
179
+ },
180
+ {
181
+ "epoch": 0.40703353956366006,
182
+ "grad_norm": 2.9423012733459473,
183
+ "learning_rate": 4.324324324324325e-05,
184
+ "loss": 0.971071548461914,
185
+ "step": 1250
186
+ },
187
+ {
188
+ "epoch": 0.42331488114620647,
189
+ "grad_norm": 2.9763288497924805,
190
+ "learning_rate": 4.297188755020081e-05,
191
+ "loss": 0.9740264129638672,
192
+ "step": 1300
193
+ },
194
+ {
195
+ "epoch": 0.4395962227287529,
196
+ "grad_norm": 2.0831127166748047,
197
+ "learning_rate": 4.270595897101922e-05,
198
+ "loss": 1.0225084686279298,
199
+ "step": 1350
200
+ },
201
+ {
202
+ "epoch": 0.4558775643112993,
203
+ "grad_norm": 3.093662977218628,
204
+ "learning_rate": 4.2434603277976776e-05,
205
+ "loss": 0.9085057830810547,
206
+ "step": 1400
207
+ },
208
+ {
209
+ "epoch": 0.4721589058938456,
210
+ "grad_norm": 3.1048061847686768,
211
+ "learning_rate": 4.2163247584934335e-05,
212
+ "loss": 0.9657279968261718,
213
+ "step": 1450
214
+ },
215
+ {
216
+ "epoch": 0.48844024747639203,
217
+ "grad_norm": 89.80404663085938,
218
+ "learning_rate": 4.189189189189189e-05,
219
+ "loss": 0.9195979309082031,
220
+ "step": 1500
221
+ },
222
+ {
223
+ "epoch": 0.5047215890589385,
224
+ "grad_norm": 2.7518820762634277,
225
+ "learning_rate": 4.162053619884945e-05,
226
+ "loss": 0.8844217681884765,
227
+ "step": 1550
228
+ },
229
+ {
230
+ "epoch": 0.5210029306414848,
231
+ "grad_norm": 2.216895818710327,
232
+ "learning_rate": 4.134918050580701e-05,
233
+ "loss": 0.9437327575683594,
234
+ "step": 1600
235
+ },
236
+ {
237
+ "epoch": 0.5372842722240313,
238
+ "grad_norm": 2.756894826889038,
239
+ "learning_rate": 4.1077824812764577e-05,
240
+ "loss": 0.9072888946533203,
241
+ "step": 1650
242
+ },
243
+ {
244
+ "epoch": 0.5535656138065776,
245
+ "grad_norm": 2.630861759185791,
246
+ "learning_rate": 4.0806469119722135e-05,
247
+ "loss": 0.9133613586425782,
248
+ "step": 1700
249
+ },
250
+ {
251
+ "epoch": 0.5698469553891241,
252
+ "grad_norm": 2.3018958568573,
253
+ "learning_rate": 4.0535113426679694e-05,
254
+ "loss": 0.9179753875732422,
255
+ "step": 1750
256
+ },
257
+ {
258
+ "epoch": 0.5861282969716705,
259
+ "grad_norm": 2.2267212867736816,
260
+ "learning_rate": 4.026375773363725e-05,
261
+ "loss": 0.8736819458007813,
262
+ "step": 1800
263
+ },
264
+ {
265
+ "epoch": 0.6024096385542169,
266
+ "grad_norm": 3.817021369934082,
267
+ "learning_rate": 3.999240204059481e-05,
268
+ "loss": 0.8818047332763672,
269
+ "step": 1850
270
+ },
271
+ {
272
+ "epoch": 0.6186909801367633,
273
+ "grad_norm": 2.8244123458862305,
274
+ "learning_rate": 3.972104634755237e-05,
275
+ "loss": 0.8710990142822266,
276
+ "step": 1900
277
+ },
278
+ {
279
+ "epoch": 0.6349723217193096,
280
+ "grad_norm": 2.787409782409668,
281
+ "learning_rate": 3.9449690654509936e-05,
282
+ "loss": 0.791876220703125,
283
+ "step": 1950
284
+ },
285
+ {
286
+ "epoch": 0.6512536633018561,
287
+ "grad_norm": 2.5339832305908203,
288
+ "learning_rate": 3.9178334961467495e-05,
289
+ "loss": 0.8330724334716797,
290
+ "step": 2000
291
+ },
292
+ {
293
+ "epoch": 0.6675350048844024,
294
+ "grad_norm": 2.2571518421173096,
295
+ "learning_rate": 3.8906979268425054e-05,
296
+ "loss": 0.8065113067626953,
297
+ "step": 2050
298
+ },
299
+ {
300
+ "epoch": 0.6838163464669489,
301
+ "grad_norm": 3.3255224227905273,
302
+ "learning_rate": 3.863562357538261e-05,
303
+ "loss": 0.7839543151855469,
304
+ "step": 2100
305
+ },
306
+ {
307
+ "epoch": 0.7000976880494952,
308
+ "grad_norm": 2.493654727935791,
309
+ "learning_rate": 3.836426788234017e-05,
310
+ "loss": 0.7902137756347656,
311
+ "step": 2150
312
+ },
313
+ {
314
+ "epoch": 0.7163790296320417,
315
+ "grad_norm": 2.943366527557373,
316
+ "learning_rate": 3.809291218929774e-05,
317
+ "loss": 0.9532376861572266,
318
+ "step": 2200
319
+ },
320
+ {
321
+ "epoch": 0.732660371214588,
322
+ "grad_norm": 2.404705762863159,
323
+ "learning_rate": 3.7821556496255296e-05,
324
+ "loss": 0.8227187347412109,
325
+ "step": 2250
326
+ },
327
+ {
328
+ "epoch": 0.7489417127971345,
329
+ "grad_norm": 8.06905460357666,
330
+ "learning_rate": 3.7550200803212855e-05,
331
+ "loss": 0.7640556335449219,
332
+ "step": 2300
333
+ },
334
+ {
335
+ "epoch": 0.7652230543796809,
336
+ "grad_norm": 3.540977954864502,
337
+ "learning_rate": 3.7278845110170414e-05,
338
+ "loss": 0.8362091064453125,
339
+ "step": 2350
340
+ },
341
+ {
342
+ "epoch": 0.7815043959622273,
343
+ "grad_norm": 2.233323574066162,
344
+ "learning_rate": 3.700748941712797e-05,
345
+ "loss": 0.6893608093261718,
346
+ "step": 2400
347
+ },
348
+ {
349
+ "epoch": 0.7977857375447737,
350
+ "grad_norm": 2.947315216064453,
351
+ "learning_rate": 3.673613372408553e-05,
352
+ "loss": 0.7564961242675782,
353
+ "step": 2450
354
+ },
355
+ {
356
+ "epoch": 0.8140670791273201,
357
+ "grad_norm": 2.9839603900909424,
358
+ "learning_rate": 3.64647780310431e-05,
359
+ "loss": 0.7726463317871094,
360
+ "step": 2500
361
+ },
362
+ {
363
+ "epoch": 0.8303484207098665,
364
+ "grad_norm": 2.638998508453369,
365
+ "learning_rate": 3.6193422338000656e-05,
366
+ "loss": 0.7850227355957031,
367
+ "step": 2550
368
+ },
369
+ {
370
+ "epoch": 0.8466297622924129,
371
+ "grad_norm": 2.203768730163574,
372
+ "learning_rate": 3.5922066644958215e-05,
373
+ "loss": 0.7540821838378906,
374
+ "step": 2600
375
+ },
376
+ {
377
+ "epoch": 0.8629111038749593,
378
+ "grad_norm": 2.7057082653045654,
379
+ "learning_rate": 3.565071095191577e-05,
380
+ "loss": 0.6677760314941407,
381
+ "step": 2650
382
+ },
383
+ {
384
+ "epoch": 0.8791924454575057,
385
+ "grad_norm": 3.2892088890075684,
386
+ "learning_rate": 3.537935525887333e-05,
387
+ "loss": 0.74295654296875,
388
+ "step": 2700
389
+ },
390
+ {
391
+ "epoch": 0.8954737870400521,
392
+ "grad_norm": 2.8778061866760254,
393
+ "learning_rate": 3.510799956583089e-05,
394
+ "loss": 0.7150550842285156,
395
+ "step": 2750
396
+ },
397
+ {
398
+ "epoch": 0.9117551286225986,
399
+ "grad_norm": 1.9023234844207764,
400
+ "learning_rate": 3.483664387278846e-05,
401
+ "loss": 0.7367278289794922,
402
+ "step": 2800
403
+ },
404
+ {
405
+ "epoch": 0.9280364702051449,
406
+ "grad_norm": 3.3899879455566406,
407
+ "learning_rate": 3.4565288179746015e-05,
408
+ "loss": 0.7095525360107422,
409
+ "step": 2850
410
+ },
411
+ {
412
+ "epoch": 0.9443178117876913,
413
+ "grad_norm": 3.202036142349243,
414
+ "learning_rate": 3.4293932486703574e-05,
415
+ "loss": 0.7237194061279297,
416
+ "step": 2900
417
+ },
418
+ {
419
+ "epoch": 0.9605991533702377,
420
+ "grad_norm": 2.44712233543396,
421
+ "learning_rate": 3.402257679366113e-05,
422
+ "loss": 0.710773696899414,
423
+ "step": 2950
424
+ },
425
+ {
426
+ "epoch": 0.9768804949527841,
427
+ "grad_norm": 3.5873775482177734,
428
+ "learning_rate": 3.375122110061869e-05,
429
+ "loss": 0.6593586730957032,
430
+ "step": 3000
431
+ },
432
+ {
433
+ "epoch": 0.9931618365353305,
434
+ "grad_norm": 2.8714234828948975,
435
+ "learning_rate": 3.347986540757626e-05,
436
+ "loss": 0.7627605438232422,
437
+ "step": 3050
438
+ },
439
+ {
440
+ "epoch": 1.0,
441
+ "eval_bertscore_f1": 0.9653369394064688,
442
+ "eval_bleu": 0.6270834635129311,
443
+ "eval_loss": 0.48991522192955017,
444
+ "eval_meteor": 0.7251021230424122,
445
+ "eval_rouge1": 0.8465042416762141,
446
+ "eval_rouge2": 0.738163460778114,
447
+ "eval_runtime": 68.0737,
448
+ "eval_samples_per_second": 18.979,
449
+ "eval_steps_per_second": 2.38,
450
+ "step": 3071
451
+ },
452
+ {
453
+ "epoch": 1.009443178117877,
454
+ "grad_norm": 3.2640202045440674,
455
+ "learning_rate": 3.3208509714533816e-05,
456
+ "loss": 0.5927775573730468,
457
+ "step": 3100
458
+ },
459
+ {
460
+ "epoch": 1.0257245197004232,
461
+ "grad_norm": 3.130765914916992,
462
+ "learning_rate": 3.2937154021491375e-05,
463
+ "loss": 0.5853068161010743,
464
+ "step": 3150
465
+ },
466
+ {
467
+ "epoch": 1.0420058612829697,
468
+ "grad_norm": 3.2238473892211914,
469
+ "learning_rate": 3.2665798328448934e-05,
470
+ "loss": 0.6931375885009765,
471
+ "step": 3200
472
+ },
473
+ {
474
+ "epoch": 1.0582872028655161,
475
+ "grad_norm": 4.1798176765441895,
476
+ "learning_rate": 3.239444263540649e-05,
477
+ "loss": 0.6535150146484375,
478
+ "step": 3250
479
+ },
480
+ {
481
+ "epoch": 1.0745685444480626,
482
+ "grad_norm": 3.4835116863250732,
483
+ "learning_rate": 3.212308694236405e-05,
484
+ "loss": 0.6570293426513671,
485
+ "step": 3300
486
+ },
487
+ {
488
+ "epoch": 1.0908498860306088,
489
+ "grad_norm": 3.2468245029449463,
490
+ "learning_rate": 3.185173124932162e-05,
491
+ "loss": 0.6235344696044922,
492
+ "step": 3350
493
+ },
494
+ {
495
+ "epoch": 1.1071312276131553,
496
+ "grad_norm": 2.503023862838745,
497
+ "learning_rate": 3.1580375556279176e-05,
498
+ "loss": 0.6021703720092774,
499
+ "step": 3400
500
+ },
501
+ {
502
+ "epoch": 1.1234125691957018,
503
+ "grad_norm": 3.5487520694732666,
504
+ "learning_rate": 3.1309019863236735e-05,
505
+ "loss": 0.6459141540527343,
506
+ "step": 3450
507
+ },
508
+ {
509
+ "epoch": 1.1396939107782482,
510
+ "grad_norm": 2.8496859073638916,
511
+ "learning_rate": 3.1037664170194294e-05,
512
+ "loss": 0.5954633712768554,
513
+ "step": 3500
514
+ },
515
+ {
516
+ "epoch": 1.1559752523607945,
517
+ "grad_norm": 2.746445894241333,
518
+ "learning_rate": 3.076630847715185e-05,
519
+ "loss": 0.5743134689331054,
520
+ "step": 3550
521
+ },
522
+ {
523
+ "epoch": 1.172256593943341,
524
+ "grad_norm": 3.843780517578125,
525
+ "learning_rate": 3.0494952784109408e-05,
526
+ "loss": 0.7025726318359375,
527
+ "step": 3600
528
+ },
529
+ {
530
+ "epoch": 1.1885379355258874,
531
+ "grad_norm": 2.3990111351013184,
532
+ "learning_rate": 3.0223597091066974e-05,
533
+ "loss": 0.6482646942138672,
534
+ "step": 3650
535
+ },
536
+ {
537
+ "epoch": 1.2048192771084336,
538
+ "grad_norm": 3.495655059814453,
539
+ "learning_rate": 2.9952241398024532e-05,
540
+ "loss": 0.6225572967529297,
541
+ "step": 3700
542
+ },
543
+ {
544
+ "epoch": 1.22110061869098,
545
+ "grad_norm": 3.0918631553649902,
546
+ "learning_rate": 2.968088570498209e-05,
547
+ "loss": 0.6018490982055664,
548
+ "step": 3750
549
+ },
550
+ {
551
+ "epoch": 1.2373819602735265,
552
+ "grad_norm": 3.54016375541687,
553
+ "learning_rate": 2.940953001193965e-05,
554
+ "loss": 0.6204871749877929,
555
+ "step": 3800
556
+ },
557
+ {
558
+ "epoch": 1.253663301856073,
559
+ "grad_norm": 3.330631971359253,
560
+ "learning_rate": 2.913817431889721e-05,
561
+ "loss": 0.5625830459594726,
562
+ "step": 3850
563
+ },
564
+ {
565
+ "epoch": 1.2699446434386195,
566
+ "grad_norm": 3.4091968536376953,
567
+ "learning_rate": 2.8866818625854774e-05,
568
+ "loss": 0.6275486755371094,
569
+ "step": 3900
570
+ },
571
+ {
572
+ "epoch": 1.2862259850211657,
573
+ "grad_norm": 3.535207748413086,
574
+ "learning_rate": 2.8595462932812333e-05,
575
+ "loss": 0.6113796997070312,
576
+ "step": 3950
577
+ },
578
+ {
579
+ "epoch": 1.3025073266037122,
580
+ "grad_norm": 2.739208459854126,
581
+ "learning_rate": 2.8324107239769892e-05,
582
+ "loss": 0.6166405487060547,
583
+ "step": 4000
584
+ },
585
+ {
586
+ "epoch": 1.3187886681862586,
587
+ "grad_norm": 2.3887178897857666,
588
+ "learning_rate": 2.805275154672745e-05,
589
+ "loss": 0.6348526000976562,
590
+ "step": 4050
591
+ },
592
+ {
593
+ "epoch": 1.3350700097688049,
594
+ "grad_norm": 3.2300209999084473,
595
+ "learning_rate": 2.778139585368501e-05,
596
+ "loss": 0.6592056274414062,
597
+ "step": 4100
598
+ },
599
+ {
600
+ "epoch": 1.3513513513513513,
601
+ "grad_norm": 2.4417901039123535,
602
+ "learning_rate": 2.751004016064257e-05,
603
+ "loss": 0.5736191177368164,
604
+ "step": 4150
605
+ },
606
+ {
607
+ "epoch": 1.3676326929338978,
608
+ "grad_norm": 4.1886467933654785,
609
+ "learning_rate": 2.7238684467600134e-05,
610
+ "loss": 0.5781734466552735,
611
+ "step": 4200
612
+ },
613
+ {
614
+ "epoch": 1.3839140345164442,
615
+ "grad_norm": 2.7025551795959473,
616
+ "learning_rate": 2.6967328774557693e-05,
617
+ "loss": 0.5421427917480469,
618
+ "step": 4250
619
+ },
620
+ {
621
+ "epoch": 1.4001953760989905,
622
+ "grad_norm": 3.4467735290527344,
623
+ "learning_rate": 2.6695973081515252e-05,
624
+ "loss": 0.6328504180908203,
625
+ "step": 4300
626
+ },
627
+ {
628
+ "epoch": 1.416476717681537,
629
+ "grad_norm": 2.252255916595459,
630
+ "learning_rate": 2.642461738847281e-05,
631
+ "loss": 0.565279884338379,
632
+ "step": 4350
633
+ },
634
+ {
635
+ "epoch": 1.4327580592640834,
636
+ "grad_norm": 2.3594324588775635,
637
+ "learning_rate": 2.615326169543037e-05,
638
+ "loss": 0.585950927734375,
639
+ "step": 4400
640
+ },
641
+ {
642
+ "epoch": 1.4490394008466296,
643
+ "grad_norm": 3.1787843704223633,
644
+ "learning_rate": 2.5881906002387928e-05,
645
+ "loss": 0.6461568450927735,
646
+ "step": 4450
647
+ },
648
+ {
649
+ "epoch": 1.465320742429176,
650
+ "grad_norm": 9.052631378173828,
651
+ "learning_rate": 2.5610550309345494e-05,
652
+ "loss": 0.5787173461914062,
653
+ "step": 4500
654
+ },
655
+ {
656
+ "epoch": 1.4816020840117226,
657
+ "grad_norm": 3.1000287532806396,
658
+ "learning_rate": 2.5339194616303053e-05,
659
+ "loss": 0.5753350830078126,
660
+ "step": 4550
661
+ },
662
+ {
663
+ "epoch": 1.497883425594269,
664
+ "grad_norm": 2.160932779312134,
665
+ "learning_rate": 2.506783892326061e-05,
666
+ "loss": 0.6055181503295899,
667
+ "step": 4600
668
+ },
669
+ {
670
+ "epoch": 1.5141647671768155,
671
+ "grad_norm": 5.498105525970459,
672
+ "learning_rate": 2.479648323021817e-05,
673
+ "loss": 0.5424030303955079,
674
+ "step": 4650
675
+ },
676
+ {
677
+ "epoch": 1.530446108759362,
678
+ "grad_norm": 2.4782474040985107,
679
+ "learning_rate": 2.4525127537175733e-05,
680
+ "loss": 0.6082788848876953,
681
+ "step": 4700
682
+ },
683
+ {
684
+ "epoch": 1.5467274503419082,
685
+ "grad_norm": 2.7400150299072266,
686
+ "learning_rate": 2.425377184413329e-05,
687
+ "loss": 0.5984983444213867,
688
+ "step": 4750
689
+ },
690
+ {
691
+ "epoch": 1.5630087919244544,
692
+ "grad_norm": 3.0426690578460693,
693
+ "learning_rate": 2.398241615109085e-05,
694
+ "loss": 0.6066116333007813,
695
+ "step": 4800
696
+ },
697
+ {
698
+ "epoch": 1.5792901335070009,
699
+ "grad_norm": 3.5095133781433105,
700
+ "learning_rate": 2.3711060458048412e-05,
701
+ "loss": 0.605382080078125,
702
+ "step": 4850
703
+ },
704
+ {
705
+ "epoch": 1.5955714750895473,
706
+ "grad_norm": 3.64323091506958,
707
+ "learning_rate": 2.343970476500597e-05,
708
+ "loss": 0.5372691726684571,
709
+ "step": 4900
710
+ },
711
+ {
712
+ "epoch": 1.6118528166720938,
713
+ "grad_norm": 6.410864353179932,
714
+ "learning_rate": 2.316834907196353e-05,
715
+ "loss": 0.4930916976928711,
716
+ "step": 4950
717
+ },
718
+ {
719
+ "epoch": 1.6281341582546403,
720
+ "grad_norm": 2.9752631187438965,
721
+ "learning_rate": 2.2896993378921092e-05,
722
+ "loss": 0.49088024139404296,
723
+ "step": 5000
724
+ },
725
+ {
726
+ "epoch": 1.6444154998371867,
727
+ "grad_norm": 2.8982131481170654,
728
+ "learning_rate": 2.262563768587865e-05,
729
+ "loss": 0.5840103912353516,
730
+ "step": 5050
731
+ },
732
+ {
733
+ "epoch": 1.660696841419733,
734
+ "grad_norm": 3.7222821712493896,
735
+ "learning_rate": 2.235428199283621e-05,
736
+ "loss": 0.5301944732666015,
737
+ "step": 5100
738
+ },
739
+ {
740
+ "epoch": 1.6769781830022794,
741
+ "grad_norm": 3.526601791381836,
742
+ "learning_rate": 2.2082926299793772e-05,
743
+ "loss": 0.4781329345703125,
744
+ "step": 5150
745
+ },
746
+ {
747
+ "epoch": 1.6932595245848256,
748
+ "grad_norm": 3.4005913734436035,
749
+ "learning_rate": 2.181157060675133e-05,
750
+ "loss": 0.5219943237304687,
751
+ "step": 5200
752
+ },
753
+ {
754
+ "epoch": 1.709540866167372,
755
+ "grad_norm": 3.9888486862182617,
756
+ "learning_rate": 2.154021491370889e-05,
757
+ "loss": 0.5756942367553711,
758
+ "step": 5250
759
+ },
760
+ {
761
+ "epoch": 1.7258222077499186,
762
+ "grad_norm": 3.6952855587005615,
763
+ "learning_rate": 2.1268859220666452e-05,
764
+ "loss": 0.5279730606079102,
765
+ "step": 5300
766
+ },
767
+ {
768
+ "epoch": 1.742103549332465,
769
+ "grad_norm": 3.1715617179870605,
770
+ "learning_rate": 2.099750352762401e-05,
771
+ "loss": 0.5441674423217774,
772
+ "step": 5350
773
+ },
774
+ {
775
+ "epoch": 1.7583848909150115,
776
+ "grad_norm": 3.5982584953308105,
777
+ "learning_rate": 2.0726147834581573e-05,
778
+ "loss": 0.46869205474853515,
779
+ "step": 5400
780
+ },
781
+ {
782
+ "epoch": 1.774666232497558,
783
+ "grad_norm": 3.594470977783203,
784
+ "learning_rate": 2.0454792141539132e-05,
785
+ "loss": 0.5004570388793945,
786
+ "step": 5450
787
+ },
788
+ {
789
+ "epoch": 1.7909475740801042,
790
+ "grad_norm": 3.198012351989746,
791
+ "learning_rate": 2.018343644849669e-05,
792
+ "loss": 0.49389095306396485,
793
+ "step": 5500
794
+ },
795
+ {
796
+ "epoch": 1.8072289156626506,
797
+ "grad_norm": 2.3895151615142822,
798
+ "learning_rate": 1.9912080755454253e-05,
799
+ "loss": 0.5188541793823243,
800
+ "step": 5550
801
+ },
802
+ {
803
+ "epoch": 1.8235102572451969,
804
+ "grad_norm": 2.874993085861206,
805
+ "learning_rate": 1.964072506241181e-05,
806
+ "loss": 0.4755914306640625,
807
+ "step": 5600
808
+ },
809
+ {
810
+ "epoch": 1.8397915988277433,
811
+ "grad_norm": 4.330140590667725,
812
+ "learning_rate": 1.936936936936937e-05,
813
+ "loss": 0.49986125946044924,
814
+ "step": 5650
815
+ },
816
+ {
817
+ "epoch": 1.8560729404102898,
818
+ "grad_norm": 3.2301809787750244,
819
+ "learning_rate": 1.9098013676326933e-05,
820
+ "loss": 0.5472452163696289,
821
+ "step": 5700
822
+ },
823
+ {
824
+ "epoch": 1.8723542819928363,
825
+ "grad_norm": 2.056736946105957,
826
+ "learning_rate": 1.883208509714534e-05,
827
+ "loss": 0.5061603164672852,
828
+ "step": 5750
829
+ },
830
+ {
831
+ "epoch": 1.8886356235753827,
832
+ "grad_norm": 4.6902031898498535,
833
+ "learning_rate": 1.85607294041029e-05,
834
+ "loss": 0.4669316101074219,
835
+ "step": 5800
836
+ },
837
+ {
838
+ "epoch": 1.904916965157929,
839
+ "grad_norm": 3.790092945098877,
840
+ "learning_rate": 1.828937371106046e-05,
841
+ "loss": 0.561137809753418,
842
+ "step": 5850
843
+ },
844
+ {
845
+ "epoch": 1.9211983067404754,
846
+ "grad_norm": 4.152039527893066,
847
+ "learning_rate": 1.801801801801802e-05,
848
+ "loss": 0.4813918304443359,
849
+ "step": 5900
850
+ },
851
+ {
852
+ "epoch": 1.9374796483230217,
853
+ "grad_norm": 3.3476598262786865,
854
+ "learning_rate": 1.774666232497558e-05,
855
+ "loss": 0.5630344390869141,
856
+ "step": 5950
857
+ },
858
+ {
859
+ "epoch": 1.9537609899055681,
860
+ "grad_norm": 4.2672810554504395,
861
+ "learning_rate": 1.747530663193314e-05,
862
+ "loss": 0.48508411407470703,
863
+ "step": 6000
864
+ },
865
+ {
866
+ "epoch": 1.9700423314881146,
867
+ "grad_norm": 4.236985206604004,
868
+ "learning_rate": 1.72039509388907e-05,
869
+ "loss": 0.5445558929443359,
870
+ "step": 6050
871
+ },
872
+ {
873
+ "epoch": 1.986323673070661,
874
+ "grad_norm": 2.686180591583252,
875
+ "learning_rate": 1.693259524584826e-05,
876
+ "loss": 0.5194969558715821,
877
+ "step": 6100
878
+ },
879
+ {
880
+ "epoch": 2.0,
881
+ "eval_bertscore_f1": 0.9755530517905858,
882
+ "eval_bleu": 0.7363057302997511,
883
+ "eval_loss": 0.3618590235710144,
884
+ "eval_meteor": 0.813260581053782,
885
+ "eval_rouge1": 0.8844645577727277,
886
+ "eval_rouge2": 0.8050353100012327,
887
+ "eval_runtime": 70.0732,
888
+ "eval_samples_per_second": 18.438,
889
+ "eval_steps_per_second": 2.312,
890
+ "step": 6142
891
+ },
892
+ {
893
+ "epoch": 2.0026050146532075,
894
+ "grad_norm": 2.022204637527466,
895
+ "learning_rate": 1.666123955280582e-05,
896
+ "loss": 0.48952743530273435,
897
+ "step": 6150
898
+ },
899
+ {
900
+ "epoch": 2.018886356235754,
901
+ "grad_norm": 4.96242094039917,
902
+ "learning_rate": 1.638988385976338e-05,
903
+ "loss": 0.5839331436157227,
904
+ "step": 6200
905
+ },
906
+ {
907
+ "epoch": 2.0351676978183004,
908
+ "grad_norm": 3.4074771404266357,
909
+ "learning_rate": 1.611852816672094e-05,
910
+ "loss": 0.5070013427734374,
911
+ "step": 6250
912
+ },
913
+ {
914
+ "epoch": 2.0514490394008464,
915
+ "grad_norm": 3.10239577293396,
916
+ "learning_rate": 1.58471724736785e-05,
917
+ "loss": 0.4913197708129883,
918
+ "step": 6300
919
+ },
920
+ {
921
+ "epoch": 2.067730380983393,
922
+ "grad_norm": 3.764558792114258,
923
+ "learning_rate": 1.557581678063606e-05,
924
+ "loss": 0.4683738327026367,
925
+ "step": 6350
926
+ },
927
+ {
928
+ "epoch": 2.0840117225659394,
929
+ "grad_norm": 4.150667667388916,
930
+ "learning_rate": 1.5304461087593617e-05,
931
+ "loss": 0.4650471878051758,
932
+ "step": 6400
933
+ },
934
+ {
935
+ "epoch": 2.100293064148486,
936
+ "grad_norm": 3.9944324493408203,
937
+ "learning_rate": 1.5033105394551178e-05,
938
+ "loss": 0.5024824905395507,
939
+ "step": 6450
940
+ },
941
+ {
942
+ "epoch": 2.1165744057310323,
943
+ "grad_norm": 2.410952568054199,
944
+ "learning_rate": 1.476174970150874e-05,
945
+ "loss": 0.5205254745483399,
946
+ "step": 6500
947
+ },
948
+ {
949
+ "epoch": 2.1328557473135787,
950
+ "grad_norm": 4.4830098152160645,
951
+ "learning_rate": 1.4490394008466299e-05,
952
+ "loss": 0.5458049011230469,
953
+ "step": 6550
954
+ },
955
+ {
956
+ "epoch": 2.149137088896125,
957
+ "grad_norm": 3.420327663421631,
958
+ "learning_rate": 1.4219038315423858e-05,
959
+ "loss": 0.544830436706543,
960
+ "step": 6600
961
+ },
962
+ {
963
+ "epoch": 2.165418430478671,
964
+ "grad_norm": 4.262825012207031,
965
+ "learning_rate": 1.394768262238142e-05,
966
+ "loss": 0.4901109313964844,
967
+ "step": 6650
968
+ },
969
+ {
970
+ "epoch": 2.1816997720612177,
971
+ "grad_norm": 2.969730854034424,
972
+ "learning_rate": 1.3676326929338979e-05,
973
+ "loss": 0.48183216094970704,
974
+ "step": 6700
975
+ },
976
+ {
977
+ "epoch": 2.197981113643764,
978
+ "grad_norm": 2.7617075443267822,
979
+ "learning_rate": 1.3404971236296538e-05,
980
+ "loss": 0.5208282470703125,
981
+ "step": 6750
982
+ },
983
+ {
984
+ "epoch": 2.2142624552263106,
985
+ "grad_norm": 2.8121178150177,
986
+ "learning_rate": 1.31336155432541e-05,
987
+ "loss": 0.47464847564697266,
988
+ "step": 6800
989
+ },
990
+ {
991
+ "epoch": 2.230543796808857,
992
+ "grad_norm": 2.1643424034118652,
993
+ "learning_rate": 1.2862259850211659e-05,
994
+ "loss": 0.5135415267944335,
995
+ "step": 6850
996
+ },
997
+ {
998
+ "epoch": 2.2468251383914035,
999
+ "grad_norm": 3.0597665309906006,
1000
+ "learning_rate": 1.2590904157169217e-05,
1001
+ "loss": 0.48383502960205077,
1002
+ "step": 6900
1003
+ },
1004
+ {
1005
+ "epoch": 2.26310647997395,
1006
+ "grad_norm": 3.4192488193511963,
1007
+ "learning_rate": 1.2319548464126778e-05,
1008
+ "loss": 0.5295528411865235,
1009
+ "step": 6950
1010
+ },
1011
+ {
1012
+ "epoch": 2.2793878215564964,
1013
+ "grad_norm": 3.485333204269409,
1014
+ "learning_rate": 1.2048192771084338e-05,
1015
+ "loss": 0.5490006637573243,
1016
+ "step": 7000
1017
+ },
1018
+ {
1019
+ "epoch": 2.295669163139043,
1020
+ "grad_norm": 3.5061099529266357,
1021
+ "learning_rate": 1.1776837078041899e-05,
1022
+ "loss": 0.444782600402832,
1023
+ "step": 7050
1024
+ },
1025
+ {
1026
+ "epoch": 2.311950504721589,
1027
+ "grad_norm": 4.059643745422363,
1028
+ "learning_rate": 1.1505481384999458e-05,
1029
+ "loss": 0.4735762786865234,
1030
+ "step": 7100
1031
+ },
1032
+ {
1033
+ "epoch": 2.3282318463041354,
1034
+ "grad_norm": 3.1162891387939453,
1035
+ "learning_rate": 1.1234125691957018e-05,
1036
+ "loss": 0.5211288452148437,
1037
+ "step": 7150
1038
+ },
1039
+ {
1040
+ "epoch": 2.344513187886682,
1041
+ "grad_norm": 1.198476791381836,
1042
+ "learning_rate": 1.0962769998914577e-05,
1043
+ "loss": 0.5121672439575196,
1044
+ "step": 7200
1045
+ },
1046
+ {
1047
+ "epoch": 2.3607945294692283,
1048
+ "grad_norm": 3.9411354064941406,
1049
+ "learning_rate": 1.0691414305872138e-05,
1050
+ "loss": 0.5504902267456054,
1051
+ "step": 7250
1052
+ },
1053
+ {
1054
+ "epoch": 2.3770758710517748,
1055
+ "grad_norm": 3.590696334838867,
1056
+ "learning_rate": 1.0420058612829696e-05,
1057
+ "loss": 0.4592051315307617,
1058
+ "step": 7300
1059
+ },
1060
+ {
1061
+ "epoch": 2.393357212634321,
1062
+ "grad_norm": 2.1098175048828125,
1063
+ "learning_rate": 1.0148702919787257e-05,
1064
+ "loss": 0.4932923126220703,
1065
+ "step": 7350
1066
+ },
1067
+ {
1068
+ "epoch": 2.4096385542168672,
1069
+ "grad_norm": 4.837367057800293,
1070
+ "learning_rate": 9.877347226744818e-06,
1071
+ "loss": 0.45726318359375,
1072
+ "step": 7400
1073
+ },
1074
+ {
1075
+ "epoch": 2.4259198957994137,
1076
+ "grad_norm": 2.808544874191284,
1077
+ "learning_rate": 9.605991533702376e-06,
1078
+ "loss": 0.4931900787353516,
1079
+ "step": 7450
1080
+ },
1081
+ {
1082
+ "epoch": 2.44220123738196,
1083
+ "grad_norm": 2.6487984657287598,
1084
+ "learning_rate": 9.334635840659937e-06,
1085
+ "loss": 0.4715615844726562,
1086
+ "step": 7500
1087
+ },
1088
+ {
1089
+ "epoch": 2.4584825789645066,
1090
+ "grad_norm": 4.251109600067139,
1091
+ "learning_rate": 9.063280147617497e-06,
1092
+ "loss": 0.5373792266845703,
1093
+ "step": 7550
1094
+ },
1095
+ {
1096
+ "epoch": 2.474763920547053,
1097
+ "grad_norm": 3.84010648727417,
1098
+ "learning_rate": 8.791924454575056e-06,
1099
+ "loss": 0.44632495880126954,
1100
+ "step": 7600
1101
+ },
1102
+ {
1103
+ "epoch": 2.4910452621295995,
1104
+ "grad_norm": 1.9418392181396484,
1105
+ "learning_rate": 8.520568761532617e-06,
1106
+ "loss": 0.48151702880859376,
1107
+ "step": 7650
1108
+ },
1109
+ {
1110
+ "epoch": 2.507326603712146,
1111
+ "grad_norm": 4.140622138977051,
1112
+ "learning_rate": 8.249213068490177e-06,
1113
+ "loss": 0.4063055419921875,
1114
+ "step": 7700
1115
+ },
1116
+ {
1117
+ "epoch": 2.5236079452946925,
1118
+ "grad_norm": 3.0216522216796875,
1119
+ "learning_rate": 7.977857375447738e-06,
1120
+ "loss": 0.4796050262451172,
1121
+ "step": 7750
1122
+ },
1123
+ {
1124
+ "epoch": 2.539889286877239,
1125
+ "grad_norm": 4.727103233337402,
1126
+ "learning_rate": 7.706501682405297e-06,
1127
+ "loss": 0.46068046569824217,
1128
+ "step": 7800
1129
+ },
1130
+ {
1131
+ "epoch": 2.556170628459785,
1132
+ "grad_norm": 4.281773567199707,
1133
+ "learning_rate": 7.435145989362857e-06,
1134
+ "loss": 0.44071575164794924,
1135
+ "step": 7850
1136
+ },
1137
+ {
1138
+ "epoch": 2.5724519700423314,
1139
+ "grad_norm": 3.134763479232788,
1140
+ "learning_rate": 7.163790296320418e-06,
1141
+ "loss": 0.4763399887084961,
1142
+ "step": 7900
1143
+ },
1144
+ {
1145
+ "epoch": 2.588733311624878,
1146
+ "grad_norm": 3.584044933319092,
1147
+ "learning_rate": 6.8924346032779764e-06,
1148
+ "loss": 0.4629644012451172,
1149
+ "step": 7950
1150
+ },
1151
+ {
1152
+ "epoch": 2.6050146532074243,
1153
+ "grad_norm": 2.601400852203369,
1154
+ "learning_rate": 6.621078910235537e-06,
1155
+ "loss": 0.4727302551269531,
1156
+ "step": 8000
1157
+ },
1158
+ {
1159
+ "epoch": 2.6212959947899708,
1160
+ "grad_norm": 3.5354995727539062,
1161
+ "learning_rate": 6.3497232171930975e-06,
1162
+ "loss": 0.42160026550292967,
1163
+ "step": 8050
1164
+ },
1165
+ {
1166
+ "epoch": 2.6375773363725172,
1167
+ "grad_norm": 2.9206888675689697,
1168
+ "learning_rate": 6.078367524150657e-06,
1169
+ "loss": 0.4754294204711914,
1170
+ "step": 8100
1171
+ },
1172
+ {
1173
+ "epoch": 2.6538586779550632,
1174
+ "grad_norm": 2.4927732944488525,
1175
+ "learning_rate": 5.807011831108217e-06,
1176
+ "loss": 0.5114262390136719,
1177
+ "step": 8150
1178
+ },
1179
+ {
1180
+ "epoch": 2.6701400195376097,
1181
+ "grad_norm": 4.378971099853516,
1182
+ "learning_rate": 5.535656138065777e-06,
1183
+ "loss": 0.5084254837036133,
1184
+ "step": 8200
1185
+ },
1186
+ {
1187
+ "epoch": 2.686421361120156,
1188
+ "grad_norm": 2.4034016132354736,
1189
+ "learning_rate": 5.264300445023337e-06,
1190
+ "loss": 0.527303466796875,
1191
+ "step": 8250
1192
+ },
1193
+ {
1194
+ "epoch": 2.7027027027027026,
1195
+ "grad_norm": 3.7141177654266357,
1196
+ "learning_rate": 4.9929447519808975e-06,
1197
+ "loss": 0.4662747573852539,
1198
+ "step": 8300
1199
+ },
1200
+ {
1201
+ "epoch": 2.718984044285249,
1202
+ "grad_norm": 3.871277332305908,
1203
+ "learning_rate": 4.721589058938457e-06,
1204
+ "loss": 0.5126468276977539,
1205
+ "step": 8350
1206
+ },
1207
+ {
1208
+ "epoch": 2.7352653858677956,
1209
+ "grad_norm": 2.500791072845459,
1210
+ "learning_rate": 4.450233365896017e-06,
1211
+ "loss": 0.47957534790039064,
1212
+ "step": 8400
1213
+ },
1214
+ {
1215
+ "epoch": 2.751546727450342,
1216
+ "grad_norm": 5.441941738128662,
1217
+ "learning_rate": 4.1788776728535765e-06,
1218
+ "loss": 0.38029510498046876,
1219
+ "step": 8450
1220
+ },
1221
+ {
1222
+ "epoch": 2.7678280690328885,
1223
+ "grad_norm": 3.3940446376800537,
1224
+ "learning_rate": 3.907521979811136e-06,
1225
+ "loss": 0.4626531219482422,
1226
+ "step": 8500
1227
+ },
1228
+ {
1229
+ "epoch": 2.784109410615435,
1230
+ "grad_norm": 4.125059127807617,
1231
+ "learning_rate": 3.6361662867686967e-06,
1232
+ "loss": 0.4890303039550781,
1233
+ "step": 8550
1234
+ },
1235
+ {
1236
+ "epoch": 2.800390752197981,
1237
+ "grad_norm": 2.758863687515259,
1238
+ "learning_rate": 3.3648105937262564e-06,
1239
+ "loss": 0.4689041519165039,
1240
+ "step": 8600
1241
+ },
1242
+ {
1243
+ "epoch": 2.8166720937805274,
1244
+ "grad_norm": 4.864498138427734,
1245
+ "learning_rate": 3.0934549006838165e-06,
1246
+ "loss": 0.46032047271728516,
1247
+ "step": 8650
1248
+ },
1249
+ {
1250
+ "epoch": 2.832953435363074,
1251
+ "grad_norm": 3.3108010292053223,
1252
+ "learning_rate": 2.8220992076413766e-06,
1253
+ "loss": 0.43362377166748045,
1254
+ "step": 8700
1255
+ },
1256
+ {
1257
+ "epoch": 2.8492347769456203,
1258
+ "grad_norm": 2.3421084880828857,
1259
+ "learning_rate": 2.5507435145989362e-06,
1260
+ "loss": 0.44478134155273436,
1261
+ "step": 8750
1262
+ },
1263
+ {
1264
+ "epoch": 2.865516118528167,
1265
+ "grad_norm": 3.283203601837158,
1266
+ "learning_rate": 2.2793878215564963e-06,
1267
+ "loss": 0.5047480392456055,
1268
+ "step": 8800
1269
+ },
1270
+ {
1271
+ "epoch": 2.8817974601107132,
1272
+ "grad_norm": 2.0124731063842773,
1273
+ "learning_rate": 2.0080321285140564e-06,
1274
+ "loss": 0.4658950424194336,
1275
+ "step": 8850
1276
+ },
1277
+ {
1278
+ "epoch": 2.8980788016932593,
1279
+ "grad_norm": 3.839552879333496,
1280
+ "learning_rate": 1.7366764354716163e-06,
1281
+ "loss": 0.45034191131591794,
1282
+ "step": 8900
1283
+ },
1284
+ {
1285
+ "epoch": 2.9143601432758057,
1286
+ "grad_norm": 4.701524257659912,
1287
+ "learning_rate": 1.4653207424291762e-06,
1288
+ "loss": 0.47517498016357423,
1289
+ "step": 8950
1290
+ },
1291
+ {
1292
+ "epoch": 2.930641484858352,
1293
+ "grad_norm": 6.58011531829834,
1294
+ "learning_rate": 1.1939650493867363e-06,
1295
+ "loss": 0.44451316833496096,
1296
+ "step": 9000
1297
+ },
1298
+ {
1299
+ "epoch": 2.9469228264408986,
1300
+ "grad_norm": 2.9627132415771484,
1301
+ "learning_rate": 9.226093563442963e-07,
1302
+ "loss": 0.41320926666259766,
1303
+ "step": 9050
1304
+ },
1305
+ {
1306
+ "epoch": 2.963204168023445,
1307
+ "grad_norm": 3.003753185272217,
1308
+ "learning_rate": 6.51253663301856e-07,
1309
+ "loss": 0.3974274444580078,
1310
+ "step": 9100
1311
+ },
1312
+ {
1313
+ "epoch": 2.9794855096059916,
1314
+ "grad_norm": 2.0012876987457275,
1315
+ "learning_rate": 3.7989797025941607e-07,
1316
+ "loss": 0.42885406494140627,
1317
+ "step": 9150
1318
+ },
1319
+ {
1320
+ "epoch": 2.995766851188538,
1321
+ "grad_norm": 3.7651121616363525,
1322
+ "learning_rate": 1.0854227721697602e-07,
1323
+ "loss": 0.4800850296020508,
1324
+ "step": 9200
1325
+ },
1326
+ {
1327
+ "epoch": 3.0,
1328
+ "eval_bertscore_f1": 0.9785511039727982,
1329
+ "eval_bleu": 0.7645620244248046,
1330
+ "eval_loss": 0.3346184194087982,
1331
+ "eval_meteor": 0.8355226256477348,
1332
+ "eval_rouge1": 0.8968326891869934,
1333
+ "eval_rouge2": 0.8250429516845066,
1334
+ "eval_runtime": 68.0941,
1335
+ "eval_samples_per_second": 18.974,
1336
+ "eval_steps_per_second": 2.379,
1337
+ "step": 9213
1338
+ }
1339
+ ],
1340
+ "logging_steps": 50,
1341
+ "max_steps": 9213,
1342
+ "num_input_tokens_seen": 0,
1343
+ "num_train_epochs": 3,
1344
+ "save_steps": 500,
1345
+ "stateful_callbacks": {
1346
+ "TrainerControl": {
1347
+ "args": {
1348
+ "should_epoch_stop": false,
1349
+ "should_evaluate": false,
1350
+ "should_log": false,
1351
+ "should_save": true,
1352
+ "should_training_stop": true
1353
+ },
1354
+ "attributes": {}
1355
+ }
1356
+ },
1357
+ "total_flos": 2.263887217557504e+16,
1358
+ "train_batch_size": 8,
1359
+ "trial_name": null,
1360
+ "trial_params": null
1361
+ }
checkpoint-9213/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbfa7bf50b61cfe7132d62e007366c9711e52c063135607d451ce0590569a343
3
+ size 4920
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 128,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 128
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
@@ -61,906 +61,6 @@
61
  "rstrip": false,
62
  "normalized": true,
63
  "special": true
64
- },
65
- {
66
- "id": 32000,
67
- "content": "<extra_id_99>",
68
- "single_word": false,
69
- "lstrip": true,
70
- "rstrip": false,
71
- "normalized": true,
72
- "special": true
73
- },
74
- {
75
- "id": 32001,
76
- "content": "<extra_id_98>",
77
- "single_word": false,
78
- "lstrip": true,
79
- "rstrip": false,
80
- "normalized": true,
81
- "special": true
82
- },
83
- {
84
- "id": 32002,
85
- "content": "<extra_id_97>",
86
- "single_word": false,
87
- "lstrip": true,
88
- "rstrip": false,
89
- "normalized": true,
90
- "special": true
91
- },
92
- {
93
- "id": 32003,
94
- "content": "<extra_id_96>",
95
- "single_word": false,
96
- "lstrip": true,
97
- "rstrip": false,
98
- "normalized": true,
99
- "special": true
100
- },
101
- {
102
- "id": 32004,
103
- "content": "<extra_id_95>",
104
- "single_word": false,
105
- "lstrip": true,
106
- "rstrip": false,
107
- "normalized": true,
108
- "special": true
109
- },
110
- {
111
- "id": 32005,
112
- "content": "<extra_id_94>",
113
- "single_word": false,
114
- "lstrip": true,
115
- "rstrip": false,
116
- "normalized": true,
117
- "special": true
118
- },
119
- {
120
- "id": 32006,
121
- "content": "<extra_id_93>",
122
- "single_word": false,
123
- "lstrip": true,
124
- "rstrip": false,
125
- "normalized": true,
126
- "special": true
127
- },
128
- {
129
- "id": 32007,
130
- "content": "<extra_id_92>",
131
- "single_word": false,
132
- "lstrip": true,
133
- "rstrip": false,
134
- "normalized": true,
135
- "special": true
136
- },
137
- {
138
- "id": 32008,
139
- "content": "<extra_id_91>",
140
- "single_word": false,
141
- "lstrip": true,
142
- "rstrip": false,
143
- "normalized": true,
144
- "special": true
145
- },
146
- {
147
- "id": 32009,
148
- "content": "<extra_id_90>",
149
- "single_word": false,
150
- "lstrip": true,
151
- "rstrip": false,
152
- "normalized": true,
153
- "special": true
154
- },
155
- {
156
- "id": 32010,
157
- "content": "<extra_id_89>",
158
- "single_word": false,
159
- "lstrip": true,
160
- "rstrip": false,
161
- "normalized": true,
162
- "special": true
163
- },
164
- {
165
- "id": 32011,
166
- "content": "<extra_id_88>",
167
- "single_word": false,
168
- "lstrip": true,
169
- "rstrip": false,
170
- "normalized": true,
171
- "special": true
172
- },
173
- {
174
- "id": 32012,
175
- "content": "<extra_id_87>",
176
- "single_word": false,
177
- "lstrip": true,
178
- "rstrip": false,
179
- "normalized": true,
180
- "special": true
181
- },
182
- {
183
- "id": 32013,
184
- "content": "<extra_id_86>",
185
- "single_word": false,
186
- "lstrip": true,
187
- "rstrip": false,
188
- "normalized": true,
189
- "special": true
190
- },
191
- {
192
- "id": 32014,
193
- "content": "<extra_id_85>",
194
- "single_word": false,
195
- "lstrip": true,
196
- "rstrip": false,
197
- "normalized": true,
198
- "special": true
199
- },
200
- {
201
- "id": 32015,
202
- "content": "<extra_id_84>",
203
- "single_word": false,
204
- "lstrip": true,
205
- "rstrip": false,
206
- "normalized": true,
207
- "special": true
208
- },
209
- {
210
- "id": 32016,
211
- "content": "<extra_id_83>",
212
- "single_word": false,
213
- "lstrip": true,
214
- "rstrip": false,
215
- "normalized": true,
216
- "special": true
217
- },
218
- {
219
- "id": 32017,
220
- "content": "<extra_id_82>",
221
- "single_word": false,
222
- "lstrip": true,
223
- "rstrip": false,
224
- "normalized": true,
225
- "special": true
226
- },
227
- {
228
- "id": 32018,
229
- "content": "<extra_id_81>",
230
- "single_word": false,
231
- "lstrip": true,
232
- "rstrip": false,
233
- "normalized": true,
234
- "special": true
235
- },
236
- {
237
- "id": 32019,
238
- "content": "<extra_id_80>",
239
- "single_word": false,
240
- "lstrip": true,
241
- "rstrip": false,
242
- "normalized": true,
243
- "special": true
244
- },
245
- {
246
- "id": 32020,
247
- "content": "<extra_id_79>",
248
- "single_word": false,
249
- "lstrip": true,
250
- "rstrip": false,
251
- "normalized": true,
252
- "special": true
253
- },
254
- {
255
- "id": 32021,
256
- "content": "<extra_id_78>",
257
- "single_word": false,
258
- "lstrip": true,
259
- "rstrip": false,
260
- "normalized": true,
261
- "special": true
262
- },
263
- {
264
- "id": 32022,
265
- "content": "<extra_id_77>",
266
- "single_word": false,
267
- "lstrip": true,
268
- "rstrip": false,
269
- "normalized": true,
270
- "special": true
271
- },
272
- {
273
- "id": 32023,
274
- "content": "<extra_id_76>",
275
- "single_word": false,
276
- "lstrip": true,
277
- "rstrip": false,
278
- "normalized": true,
279
- "special": true
280
- },
281
- {
282
- "id": 32024,
283
- "content": "<extra_id_75>",
284
- "single_word": false,
285
- "lstrip": true,
286
- "rstrip": false,
287
- "normalized": true,
288
- "special": true
289
- },
290
- {
291
- "id": 32025,
292
- "content": "<extra_id_74>",
293
- "single_word": false,
294
- "lstrip": true,
295
- "rstrip": false,
296
- "normalized": true,
297
- "special": true
298
- },
299
- {
300
- "id": 32026,
301
- "content": "<extra_id_73>",
302
- "single_word": false,
303
- "lstrip": true,
304
- "rstrip": false,
305
- "normalized": true,
306
- "special": true
307
- },
308
- {
309
- "id": 32027,
310
- "content": "<extra_id_72>",
311
- "single_word": false,
312
- "lstrip": true,
313
- "rstrip": false,
314
- "normalized": true,
315
- "special": true
316
- },
317
- {
318
- "id": 32028,
319
- "content": "<extra_id_71>",
320
- "single_word": false,
321
- "lstrip": true,
322
- "rstrip": false,
323
- "normalized": true,
324
- "special": true
325
- },
326
- {
327
- "id": 32029,
328
- "content": "<extra_id_70>",
329
- "single_word": false,
330
- "lstrip": true,
331
- "rstrip": false,
332
- "normalized": true,
333
- "special": true
334
- },
335
- {
336
- "id": 32030,
337
- "content": "<extra_id_69>",
338
- "single_word": false,
339
- "lstrip": true,
340
- "rstrip": false,
341
- "normalized": true,
342
- "special": true
343
- },
344
- {
345
- "id": 32031,
346
- "content": "<extra_id_68>",
347
- "single_word": false,
348
- "lstrip": true,
349
- "rstrip": false,
350
- "normalized": true,
351
- "special": true
352
- },
353
- {
354
- "id": 32032,
355
- "content": "<extra_id_67>",
356
- "single_word": false,
357
- "lstrip": true,
358
- "rstrip": false,
359
- "normalized": true,
360
- "special": true
361
- },
362
- {
363
- "id": 32033,
364
- "content": "<extra_id_66>",
365
- "single_word": false,
366
- "lstrip": true,
367
- "rstrip": false,
368
- "normalized": true,
369
- "special": true
370
- },
371
- {
372
- "id": 32034,
373
- "content": "<extra_id_65>",
374
- "single_word": false,
375
- "lstrip": true,
376
- "rstrip": false,
377
- "normalized": true,
378
- "special": true
379
- },
380
- {
381
- "id": 32035,
382
- "content": "<extra_id_64>",
383
- "single_word": false,
384
- "lstrip": true,
385
- "rstrip": false,
386
- "normalized": true,
387
- "special": true
388
- },
389
- {
390
- "id": 32036,
391
- "content": "<extra_id_63>",
392
- "single_word": false,
393
- "lstrip": true,
394
- "rstrip": false,
395
- "normalized": true,
396
- "special": true
397
- },
398
- {
399
- "id": 32037,
400
- "content": "<extra_id_62>",
401
- "single_word": false,
402
- "lstrip": true,
403
- "rstrip": false,
404
- "normalized": true,
405
- "special": true
406
- },
407
- {
408
- "id": 32038,
409
- "content": "<extra_id_61>",
410
- "single_word": false,
411
- "lstrip": true,
412
- "rstrip": false,
413
- "normalized": true,
414
- "special": true
415
- },
416
- {
417
- "id": 32039,
418
- "content": "<extra_id_60>",
419
- "single_word": false,
420
- "lstrip": true,
421
- "rstrip": false,
422
- "normalized": true,
423
- "special": true
424
- },
425
- {
426
- "id": 32040,
427
- "content": "<extra_id_59>",
428
- "single_word": false,
429
- "lstrip": true,
430
- "rstrip": false,
431
- "normalized": true,
432
- "special": true
433
- },
434
- {
435
- "id": 32041,
436
- "content": "<extra_id_58>",
437
- "single_word": false,
438
- "lstrip": true,
439
- "rstrip": false,
440
- "normalized": true,
441
- "special": true
442
- },
443
- {
444
- "id": 32042,
445
- "content": "<extra_id_57>",
446
- "single_word": false,
447
- "lstrip": true,
448
- "rstrip": false,
449
- "normalized": true,
450
- "special": true
451
- },
452
- {
453
- "id": 32043,
454
- "content": "<extra_id_56>",
455
- "single_word": false,
456
- "lstrip": true,
457
- "rstrip": false,
458
- "normalized": true,
459
- "special": true
460
- },
461
- {
462
- "id": 32044,
463
- "content": "<extra_id_55>",
464
- "single_word": false,
465
- "lstrip": true,
466
- "rstrip": false,
467
- "normalized": true,
468
- "special": true
469
- },
470
- {
471
- "id": 32045,
472
- "content": "<extra_id_54>",
473
- "single_word": false,
474
- "lstrip": true,
475
- "rstrip": false,
476
- "normalized": true,
477
- "special": true
478
- },
479
- {
480
- "id": 32046,
481
- "content": "<extra_id_53>",
482
- "single_word": false,
483
- "lstrip": true,
484
- "rstrip": false,
485
- "normalized": true,
486
- "special": true
487
- },
488
- {
489
- "id": 32047,
490
- "content": "<extra_id_52>",
491
- "single_word": false,
492
- "lstrip": true,
493
- "rstrip": false,
494
- "normalized": true,
495
- "special": true
496
- },
497
- {
498
- "id": 32048,
499
- "content": "<extra_id_51>",
500
- "single_word": false,
501
- "lstrip": true,
502
- "rstrip": false,
503
- "normalized": true,
504
- "special": true
505
- },
506
- {
507
- "id": 32049,
508
- "content": "<extra_id_50>",
509
- "single_word": false,
510
- "lstrip": true,
511
- "rstrip": false,
512
- "normalized": true,
513
- "special": true
514
- },
515
- {
516
- "id": 32050,
517
- "content": "<extra_id_49>",
518
- "single_word": false,
519
- "lstrip": true,
520
- "rstrip": false,
521
- "normalized": true,
522
- "special": true
523
- },
524
- {
525
- "id": 32051,
526
- "content": "<extra_id_48>",
527
- "single_word": false,
528
- "lstrip": true,
529
- "rstrip": false,
530
- "normalized": true,
531
- "special": true
532
- },
533
- {
534
- "id": 32052,
535
- "content": "<extra_id_47>",
536
- "single_word": false,
537
- "lstrip": true,
538
- "rstrip": false,
539
- "normalized": true,
540
- "special": true
541
- },
542
- {
543
- "id": 32053,
544
- "content": "<extra_id_46>",
545
- "single_word": false,
546
- "lstrip": true,
547
- "rstrip": false,
548
- "normalized": true,
549
- "special": true
550
- },
551
- {
552
- "id": 32054,
553
- "content": "<extra_id_45>",
554
- "single_word": false,
555
- "lstrip": true,
556
- "rstrip": false,
557
- "normalized": true,
558
- "special": true
559
- },
560
- {
561
- "id": 32055,
562
- "content": "<extra_id_44>",
563
- "single_word": false,
564
- "lstrip": true,
565
- "rstrip": false,
566
- "normalized": true,
567
- "special": true
568
- },
569
- {
570
- "id": 32056,
571
- "content": "<extra_id_43>",
572
- "single_word": false,
573
- "lstrip": true,
574
- "rstrip": false,
575
- "normalized": true,
576
- "special": true
577
- },
578
- {
579
- "id": 32057,
580
- "content": "<extra_id_42>",
581
- "single_word": false,
582
- "lstrip": true,
583
- "rstrip": false,
584
- "normalized": true,
585
- "special": true
586
- },
587
- {
588
- "id": 32058,
589
- "content": "<extra_id_41>",
590
- "single_word": false,
591
- "lstrip": true,
592
- "rstrip": false,
593
- "normalized": true,
594
- "special": true
595
- },
596
- {
597
- "id": 32059,
598
- "content": "<extra_id_40>",
599
- "single_word": false,
600
- "lstrip": true,
601
- "rstrip": false,
602
- "normalized": true,
603
- "special": true
604
- },
605
- {
606
- "id": 32060,
607
- "content": "<extra_id_39>",
608
- "single_word": false,
609
- "lstrip": true,
610
- "rstrip": false,
611
- "normalized": true,
612
- "special": true
613
- },
614
- {
615
- "id": 32061,
616
- "content": "<extra_id_38>",
617
- "single_word": false,
618
- "lstrip": true,
619
- "rstrip": false,
620
- "normalized": true,
621
- "special": true
622
- },
623
- {
624
- "id": 32062,
625
- "content": "<extra_id_37>",
626
- "single_word": false,
627
- "lstrip": true,
628
- "rstrip": false,
629
- "normalized": true,
630
- "special": true
631
- },
632
- {
633
- "id": 32063,
634
- "content": "<extra_id_36>",
635
- "single_word": false,
636
- "lstrip": true,
637
- "rstrip": false,
638
- "normalized": true,
639
- "special": true
640
- },
641
- {
642
- "id": 32064,
643
- "content": "<extra_id_35>",
644
- "single_word": false,
645
- "lstrip": true,
646
- "rstrip": false,
647
- "normalized": true,
648
- "special": true
649
- },
650
- {
651
- "id": 32065,
652
- "content": "<extra_id_34>",
653
- "single_word": false,
654
- "lstrip": true,
655
- "rstrip": false,
656
- "normalized": true,
657
- "special": true
658
- },
659
- {
660
- "id": 32066,
661
- "content": "<extra_id_33>",
662
- "single_word": false,
663
- "lstrip": true,
664
- "rstrip": false,
665
- "normalized": true,
666
- "special": true
667
- },
668
- {
669
- "id": 32067,
670
- "content": "<extra_id_32>",
671
- "single_word": false,
672
- "lstrip": true,
673
- "rstrip": false,
674
- "normalized": true,
675
- "special": true
676
- },
677
- {
678
- "id": 32068,
679
- "content": "<extra_id_31>",
680
- "single_word": false,
681
- "lstrip": true,
682
- "rstrip": false,
683
- "normalized": true,
684
- "special": true
685
- },
686
- {
687
- "id": 32069,
688
- "content": "<extra_id_30>",
689
- "single_word": false,
690
- "lstrip": true,
691
- "rstrip": false,
692
- "normalized": true,
693
- "special": true
694
- },
695
- {
696
- "id": 32070,
697
- "content": "<extra_id_29>",
698
- "single_word": false,
699
- "lstrip": true,
700
- "rstrip": false,
701
- "normalized": true,
702
- "special": true
703
- },
704
- {
705
- "id": 32071,
706
- "content": "<extra_id_28>",
707
- "single_word": false,
708
- "lstrip": true,
709
- "rstrip": false,
710
- "normalized": true,
711
- "special": true
712
- },
713
- {
714
- "id": 32072,
715
- "content": "<extra_id_27>",
716
- "single_word": false,
717
- "lstrip": true,
718
- "rstrip": false,
719
- "normalized": true,
720
- "special": true
721
- },
722
- {
723
- "id": 32073,
724
- "content": "<extra_id_26>",
725
- "single_word": false,
726
- "lstrip": true,
727
- "rstrip": false,
728
- "normalized": true,
729
- "special": true
730
- },
731
- {
732
- "id": 32074,
733
- "content": "<extra_id_25>",
734
- "single_word": false,
735
- "lstrip": true,
736
- "rstrip": false,
737
- "normalized": true,
738
- "special": true
739
- },
740
- {
741
- "id": 32075,
742
- "content": "<extra_id_24>",
743
- "single_word": false,
744
- "lstrip": true,
745
- "rstrip": false,
746
- "normalized": true,
747
- "special": true
748
- },
749
- {
750
- "id": 32076,
751
- "content": "<extra_id_23>",
752
- "single_word": false,
753
- "lstrip": true,
754
- "rstrip": false,
755
- "normalized": true,
756
- "special": true
757
- },
758
- {
759
- "id": 32077,
760
- "content": "<extra_id_22>",
761
- "single_word": false,
762
- "lstrip": true,
763
- "rstrip": false,
764
- "normalized": true,
765
- "special": true
766
- },
767
- {
768
- "id": 32078,
769
- "content": "<extra_id_21>",
770
- "single_word": false,
771
- "lstrip": true,
772
- "rstrip": false,
773
- "normalized": true,
774
- "special": true
775
- },
776
- {
777
- "id": 32079,
778
- "content": "<extra_id_20>",
779
- "single_word": false,
780
- "lstrip": true,
781
- "rstrip": false,
782
- "normalized": true,
783
- "special": true
784
- },
785
- {
786
- "id": 32080,
787
- "content": "<extra_id_19>",
788
- "single_word": false,
789
- "lstrip": true,
790
- "rstrip": false,
791
- "normalized": true,
792
- "special": true
793
- },
794
- {
795
- "id": 32081,
796
- "content": "<extra_id_18>",
797
- "single_word": false,
798
- "lstrip": true,
799
- "rstrip": false,
800
- "normalized": true,
801
- "special": true
802
- },
803
- {
804
- "id": 32082,
805
- "content": "<extra_id_17>",
806
- "single_word": false,
807
- "lstrip": true,
808
- "rstrip": false,
809
- "normalized": true,
810
- "special": true
811
- },
812
- {
813
- "id": 32083,
814
- "content": "<extra_id_16>",
815
- "single_word": false,
816
- "lstrip": true,
817
- "rstrip": false,
818
- "normalized": true,
819
- "special": true
820
- },
821
- {
822
- "id": 32084,
823
- "content": "<extra_id_15>",
824
- "single_word": false,
825
- "lstrip": true,
826
- "rstrip": false,
827
- "normalized": true,
828
- "special": true
829
- },
830
- {
831
- "id": 32085,
832
- "content": "<extra_id_14>",
833
- "single_word": false,
834
- "lstrip": true,
835
- "rstrip": false,
836
- "normalized": true,
837
- "special": true
838
- },
839
- {
840
- "id": 32086,
841
- "content": "<extra_id_13>",
842
- "single_word": false,
843
- "lstrip": true,
844
- "rstrip": false,
845
- "normalized": true,
846
- "special": true
847
- },
848
- {
849
- "id": 32087,
850
- "content": "<extra_id_12>",
851
- "single_word": false,
852
- "lstrip": true,
853
- "rstrip": false,
854
- "normalized": true,
855
- "special": true
856
- },
857
- {
858
- "id": 32088,
859
- "content": "<extra_id_11>",
860
- "single_word": false,
861
- "lstrip": true,
862
- "rstrip": false,
863
- "normalized": true,
864
- "special": true
865
- },
866
- {
867
- "id": 32089,
868
- "content": "<extra_id_10>",
869
- "single_word": false,
870
- "lstrip": true,
871
- "rstrip": false,
872
- "normalized": true,
873
- "special": true
874
- },
875
- {
876
- "id": 32090,
877
- "content": "<extra_id_9>",
878
- "single_word": false,
879
- "lstrip": true,
880
- "rstrip": false,
881
- "normalized": true,
882
- "special": true
883
- },
884
- {
885
- "id": 32091,
886
- "content": "<extra_id_8>",
887
- "single_word": false,
888
- "lstrip": true,
889
- "rstrip": false,
890
- "normalized": true,
891
- "special": true
892
- },
893
- {
894
- "id": 32092,
895
- "content": "<extra_id_7>",
896
- "single_word": false,
897
- "lstrip": true,
898
- "rstrip": false,
899
- "normalized": true,
900
- "special": true
901
- },
902
- {
903
- "id": 32093,
904
- "content": "<extra_id_6>",
905
- "single_word": false,
906
- "lstrip": true,
907
- "rstrip": false,
908
- "normalized": true,
909
- "special": true
910
- },
911
- {
912
- "id": 32094,
913
- "content": "<extra_id_5>",
914
- "single_word": false,
915
- "lstrip": true,
916
- "rstrip": false,
917
- "normalized": true,
918
- "special": true
919
- },
920
- {
921
- "id": 32095,
922
- "content": "<extra_id_4>",
923
- "single_word": false,
924
- "lstrip": true,
925
- "rstrip": false,
926
- "normalized": true,
927
- "special": true
928
- },
929
- {
930
- "id": 32096,
931
- "content": "<extra_id_3>",
932
- "single_word": false,
933
- "lstrip": true,
934
- "rstrip": false,
935
- "normalized": true,
936
- "special": true
937
- },
938
- {
939
- "id": 32097,
940
- "content": "<extra_id_2>",
941
- "single_word": false,
942
- "lstrip": true,
943
- "rstrip": false,
944
- "normalized": true,
945
- "special": true
946
- },
947
- {
948
- "id": 32098,
949
- "content": "<extra_id_1>",
950
- "single_word": false,
951
- "lstrip": true,
952
- "rstrip": false,
953
- "normalized": true,
954
- "special": true
955
- },
956
- {
957
- "id": 32099,
958
- "content": "<extra_id_0>",
959
- "single_word": false,
960
- "lstrip": true,
961
- "rstrip": false,
962
- "normalized": true,
963
- "special": true
964
  }
965
  ],
966
  "normalizer": null,
@@ -36813,10 +35913,6 @@
36813
  "pr",
36814
  "int"
36815
  ],
36816
- [
36817
- "#",
36818
- "#"
36819
- ],
36820
  [
36821
  "W",
36822
  "ith"
@@ -39937,10 +39033,6 @@
39937
  "b",
39938
  "ase"
39939
  ],
39940
- [
39941
- "##",
39942
- "##"
39943
- ],
39944
  [
39945
  "R",
39946
  "el"
@@ -44969,10 +44061,6 @@
44969
  "Ġre",
44970
  "trie"
44971
  ],
44972
- [
44973
- "####",
44974
- "####"
44975
- ],
44976
  [
44977
  "Ġmult",
44978
  "iple"
@@ -46625,10 +45713,6 @@
46625
  "At",
46626
  "om"
46627
  ],
46628
- [
46629
- "#",
46630
- "{"
46631
- ],
46632
  [
46633
  "Ġro",
46634
  "und"
@@ -54121,10 +53205,6 @@
54121
  "Ġex",
54122
  "plicit"
54123
  ],
54124
- [
54125
- "########",
54126
- "########"
54127
- ],
54128
  [
54129
  "Service",
54130
  "Response"
@@ -72209,10 +71289,6 @@
72209
  "el",
72210
  "em"
72211
  ],
72212
- [
72213
- "#",
72214
- "'"
72215
- ],
72216
  [
72217
  "Ġcon",
72218
  "versation"
@@ -72617,10 +71693,6 @@
72617
  "ĠPre",
72618
  "fix"
72619
  ],
72620
- [
72621
- "################",
72622
- "################"
72623
- ],
72624
  [
72625
  "s",
72626
  "ources"
@@ -84661,10 +83733,6 @@
84661
  "Ġh",
84662
  "el"
84663
  ],
84664
- [
84665
- "##",
84666
- "#"
84667
- ],
84668
  [
84669
  "And",
84670
  "Set"
@@ -100589,10 +99657,6 @@
100589
  "Ġrule",
100590
  "ValidID"
100591
  ],
100592
- [
100593
- "#",
100594
- "\""
100595
- ],
100596
  [
100597
  "^",
100598
  "\\"
@@ -116621,10 +115685,6 @@
116621
  "ĠUn",
116622
  "der"
116623
  ],
116624
- [
116625
- "#{",
116626
- "@"
116627
- ],
116628
  [
116629
  "ĠAct",
116630
  "or"
@@ -138005,10 +137065,6 @@
138005
  "Queue",
138006
  "Entry"
138007
  ],
138008
- [
138009
- "########",
138010
- "####"
138011
- ],
138012
  [
138013
  "alan",
138014
  "ces"
@@ -154045,10 +153101,6 @@
154045
  "SETT",
154046
  "ABLE"
154047
  ],
154048
- [
154049
- "#",
154050
- "$"
154051
- ],
154052
  [
154053
  "C",
154054
  "ores"
@@ -154449,10 +153501,6 @@
154449
  "ENDI",
154450
  "AN"
154451
  ],
154452
- [
154453
- "#",
154454
- "__"
154455
- ],
154456
  [
154457
  ">",
154458
  "`"
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 256,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 256
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
61
  "rstrip": false,
62
  "normalized": true,
63
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
64
  }
65
  ],
66
  "normalizer": null,
 
35913
  "pr",
35914
  "int"
35915
  ],
 
 
 
 
35916
  [
35917
  "W",
35918
  "ith"
 
39033
  "b",
39034
  "ase"
39035
  ],
 
 
 
 
39036
  [
39037
  "R",
39038
  "el"
 
44061
  "Ġre",
44062
  "trie"
44063
  ],
 
 
 
 
44064
  [
44065
  "Ġmult",
44066
  "iple"
 
45713
  "At",
45714
  "om"
45715
  ],
 
 
 
 
45716
  [
45717
  "Ġro",
45718
  "und"
 
53205
  "Ġex",
53206
  "plicit"
53207
  ],
 
 
 
 
53208
  [
53209
  "Service",
53210
  "Response"
 
71289
  "el",
71290
  "em"
71291
  ],
 
 
 
 
71292
  [
71293
  "Ġcon",
71294
  "versation"
 
71693
  "ĠPre",
71694
  "fix"
71695
  ],
 
 
 
 
71696
  [
71697
  "s",
71698
  "ources"
 
83733
  "Ġh",
83734
  "el"
83735
  ],
 
 
 
 
83736
  [
83737
  "And",
83738
  "Set"
 
99657
  "Ġrule",
99658
  "ValidID"
99659
  ],
 
 
 
 
99660
  [
99661
  "^",
99662
  "\\"
 
115685
  "ĠUn",
115686
  "der"
115687
  ],
 
 
 
 
115688
  [
115689
  "ĠAct",
115690
  "or"
 
137065
  "Queue",
137066
  "Entry"
137067
  ],
 
 
 
 
137068
  [
137069
  "alan",
137070
  "ces"
 
153101
  "SETT",
153102
  "ABLE"
153103
  ],
 
 
 
 
153104
  [
153105
  "C",
153106
  "ores"
 
153501
  "ENDI",
153502
  "AN"
153503
  ],
 
 
 
 
153504
  [
153505
  ">",
153506
  "`"
tokenizer_config.json CHANGED
@@ -1,955 +1,714 @@
1
  {
2
  "add_prefix_space": false,
3
- "added_tokens_decoder": {
4
- "0": {
5
- "content": "<pad>",
6
- "lstrip": false,
7
- "normalized": true,
8
- "rstrip": false,
9
- "single_word": false,
10
- "special": true
11
- },
12
- "1": {
13
- "content": "<s>",
14
- "lstrip": false,
15
- "normalized": true,
16
- "rstrip": false,
17
- "single_word": false,
18
- "special": true
19
- },
20
- "2": {
21
- "content": "</s>",
22
- "lstrip": false,
23
- "normalized": true,
24
- "rstrip": false,
25
- "single_word": false,
26
- "special": true
27
- },
28
- "3": {
29
- "content": "<unk>",
30
- "lstrip": false,
31
- "normalized": true,
32
- "rstrip": false,
33
- "single_word": false,
34
- "special": true
35
- },
36
- "4": {
37
- "content": "<mask>",
38
- "lstrip": true,
39
- "normalized": true,
40
- "rstrip": false,
41
- "single_word": false,
42
- "special": true
43
- },
44
- "32000": {
45
  "content": "<extra_id_99>",
46
  "lstrip": true,
47
  "normalized": true,
48
  "rstrip": false,
49
- "single_word": false,
50
- "special": true
51
  },
52
- "32001": {
53
  "content": "<extra_id_98>",
54
  "lstrip": true,
55
  "normalized": true,
56
  "rstrip": false,
57
- "single_word": false,
58
- "special": true
59
  },
60
- "32002": {
61
  "content": "<extra_id_97>",
62
  "lstrip": true,
63
  "normalized": true,
64
  "rstrip": false,
65
- "single_word": false,
66
- "special": true
67
  },
68
- "32003": {
69
  "content": "<extra_id_96>",
70
  "lstrip": true,
71
  "normalized": true,
72
  "rstrip": false,
73
- "single_word": false,
74
- "special": true
75
  },
76
- "32004": {
77
  "content": "<extra_id_95>",
78
  "lstrip": true,
79
  "normalized": true,
80
  "rstrip": false,
81
- "single_word": false,
82
- "special": true
83
  },
84
- "32005": {
85
  "content": "<extra_id_94>",
86
  "lstrip": true,
87
  "normalized": true,
88
  "rstrip": false,
89
- "single_word": false,
90
- "special": true
91
  },
92
- "32006": {
93
  "content": "<extra_id_93>",
94
  "lstrip": true,
95
  "normalized": true,
96
  "rstrip": false,
97
- "single_word": false,
98
- "special": true
99
  },
100
- "32007": {
101
  "content": "<extra_id_92>",
102
  "lstrip": true,
103
  "normalized": true,
104
  "rstrip": false,
105
- "single_word": false,
106
- "special": true
107
  },
108
- "32008": {
109
  "content": "<extra_id_91>",
110
  "lstrip": true,
111
  "normalized": true,
112
  "rstrip": false,
113
- "single_word": false,
114
- "special": true
115
  },
116
- "32009": {
117
  "content": "<extra_id_90>",
118
  "lstrip": true,
119
  "normalized": true,
120
  "rstrip": false,
121
- "single_word": false,
122
- "special": true
123
  },
124
- "32010": {
125
  "content": "<extra_id_89>",
126
  "lstrip": true,
127
  "normalized": true,
128
  "rstrip": false,
129
- "single_word": false,
130
- "special": true
131
  },
132
- "32011": {
133
  "content": "<extra_id_88>",
134
  "lstrip": true,
135
  "normalized": true,
136
  "rstrip": false,
137
- "single_word": false,
138
- "special": true
139
  },
140
- "32012": {
141
  "content": "<extra_id_87>",
142
  "lstrip": true,
143
  "normalized": true,
144
  "rstrip": false,
145
- "single_word": false,
146
- "special": true
147
  },
148
- "32013": {
149
  "content": "<extra_id_86>",
150
  "lstrip": true,
151
  "normalized": true,
152
  "rstrip": false,
153
- "single_word": false,
154
- "special": true
155
  },
156
- "32014": {
157
  "content": "<extra_id_85>",
158
  "lstrip": true,
159
  "normalized": true,
160
  "rstrip": false,
161
- "single_word": false,
162
- "special": true
163
  },
164
- "32015": {
165
  "content": "<extra_id_84>",
166
  "lstrip": true,
167
  "normalized": true,
168
  "rstrip": false,
169
- "single_word": false,
170
- "special": true
171
  },
172
- "32016": {
173
  "content": "<extra_id_83>",
174
  "lstrip": true,
175
  "normalized": true,
176
  "rstrip": false,
177
- "single_word": false,
178
- "special": true
179
  },
180
- "32017": {
181
  "content": "<extra_id_82>",
182
  "lstrip": true,
183
  "normalized": true,
184
  "rstrip": false,
185
- "single_word": false,
186
- "special": true
187
  },
188
- "32018": {
189
  "content": "<extra_id_81>",
190
  "lstrip": true,
191
  "normalized": true,
192
  "rstrip": false,
193
- "single_word": false,
194
- "special": true
195
  },
196
- "32019": {
197
  "content": "<extra_id_80>",
198
  "lstrip": true,
199
  "normalized": true,
200
  "rstrip": false,
201
- "single_word": false,
202
- "special": true
203
  },
204
- "32020": {
205
  "content": "<extra_id_79>",
206
  "lstrip": true,
207
  "normalized": true,
208
  "rstrip": false,
209
- "single_word": false,
210
- "special": true
211
  },
212
- "32021": {
213
  "content": "<extra_id_78>",
214
  "lstrip": true,
215
  "normalized": true,
216
  "rstrip": false,
217
- "single_word": false,
218
- "special": true
219
  },
220
- "32022": {
221
  "content": "<extra_id_77>",
222
  "lstrip": true,
223
  "normalized": true,
224
  "rstrip": false,
225
- "single_word": false,
226
- "special": true
227
  },
228
- "32023": {
229
  "content": "<extra_id_76>",
230
  "lstrip": true,
231
  "normalized": true,
232
  "rstrip": false,
233
- "single_word": false,
234
- "special": true
235
  },
236
- "32024": {
237
  "content": "<extra_id_75>",
238
  "lstrip": true,
239
  "normalized": true,
240
  "rstrip": false,
241
- "single_word": false,
242
- "special": true
243
  },
244
- "32025": {
245
  "content": "<extra_id_74>",
246
  "lstrip": true,
247
  "normalized": true,
248
  "rstrip": false,
249
- "single_word": false,
250
- "special": true
251
  },
252
- "32026": {
253
  "content": "<extra_id_73>",
254
  "lstrip": true,
255
  "normalized": true,
256
  "rstrip": false,
257
- "single_word": false,
258
- "special": true
259
  },
260
- "32027": {
261
  "content": "<extra_id_72>",
262
  "lstrip": true,
263
  "normalized": true,
264
  "rstrip": false,
265
- "single_word": false,
266
- "special": true
267
  },
268
- "32028": {
269
  "content": "<extra_id_71>",
270
  "lstrip": true,
271
  "normalized": true,
272
  "rstrip": false,
273
- "single_word": false,
274
- "special": true
275
  },
276
- "32029": {
277
  "content": "<extra_id_70>",
278
  "lstrip": true,
279
  "normalized": true,
280
  "rstrip": false,
281
- "single_word": false,
282
- "special": true
283
  },
284
- "32030": {
285
  "content": "<extra_id_69>",
286
  "lstrip": true,
287
  "normalized": true,
288
  "rstrip": false,
289
- "single_word": false,
290
- "special": true
291
  },
292
- "32031": {
293
  "content": "<extra_id_68>",
294
  "lstrip": true,
295
  "normalized": true,
296
  "rstrip": false,
297
- "single_word": false,
298
- "special": true
299
  },
300
- "32032": {
301
  "content": "<extra_id_67>",
302
  "lstrip": true,
303
  "normalized": true,
304
  "rstrip": false,
305
- "single_word": false,
306
- "special": true
307
  },
308
- "32033": {
309
  "content": "<extra_id_66>",
310
  "lstrip": true,
311
  "normalized": true,
312
  "rstrip": false,
313
- "single_word": false,
314
- "special": true
315
  },
316
- "32034": {
317
  "content": "<extra_id_65>",
318
  "lstrip": true,
319
  "normalized": true,
320
  "rstrip": false,
321
- "single_word": false,
322
- "special": true
323
  },
324
- "32035": {
325
  "content": "<extra_id_64>",
326
  "lstrip": true,
327
  "normalized": true,
328
  "rstrip": false,
329
- "single_word": false,
330
- "special": true
331
  },
332
- "32036": {
333
  "content": "<extra_id_63>",
334
  "lstrip": true,
335
  "normalized": true,
336
  "rstrip": false,
337
- "single_word": false,
338
- "special": true
339
  },
340
- "32037": {
341
  "content": "<extra_id_62>",
342
  "lstrip": true,
343
  "normalized": true,
344
  "rstrip": false,
345
- "single_word": false,
346
- "special": true
347
  },
348
- "32038": {
349
  "content": "<extra_id_61>",
350
  "lstrip": true,
351
  "normalized": true,
352
  "rstrip": false,
353
- "single_word": false,
354
- "special": true
355
  },
356
- "32039": {
357
  "content": "<extra_id_60>",
358
  "lstrip": true,
359
  "normalized": true,
360
  "rstrip": false,
361
- "single_word": false,
362
- "special": true
363
  },
364
- "32040": {
365
  "content": "<extra_id_59>",
366
  "lstrip": true,
367
  "normalized": true,
368
  "rstrip": false,
369
- "single_word": false,
370
- "special": true
371
  },
372
- "32041": {
373
  "content": "<extra_id_58>",
374
  "lstrip": true,
375
  "normalized": true,
376
  "rstrip": false,
377
- "single_word": false,
378
- "special": true
379
  },
380
- "32042": {
381
  "content": "<extra_id_57>",
382
  "lstrip": true,
383
  "normalized": true,
384
  "rstrip": false,
385
- "single_word": false,
386
- "special": true
387
  },
388
- "32043": {
389
  "content": "<extra_id_56>",
390
  "lstrip": true,
391
  "normalized": true,
392
  "rstrip": false,
393
- "single_word": false,
394
- "special": true
395
  },
396
- "32044": {
397
  "content": "<extra_id_55>",
398
  "lstrip": true,
399
  "normalized": true,
400
  "rstrip": false,
401
- "single_word": false,
402
- "special": true
403
  },
404
- "32045": {
405
  "content": "<extra_id_54>",
406
  "lstrip": true,
407
  "normalized": true,
408
  "rstrip": false,
409
- "single_word": false,
410
- "special": true
411
  },
412
- "32046": {
413
  "content": "<extra_id_53>",
414
  "lstrip": true,
415
  "normalized": true,
416
  "rstrip": false,
417
- "single_word": false,
418
- "special": true
419
  },
420
- "32047": {
421
  "content": "<extra_id_52>",
422
  "lstrip": true,
423
  "normalized": true,
424
  "rstrip": false,
425
- "single_word": false,
426
- "special": true
427
  },
428
- "32048": {
429
  "content": "<extra_id_51>",
430
  "lstrip": true,
431
  "normalized": true,
432
  "rstrip": false,
433
- "single_word": false,
434
- "special": true
435
  },
436
- "32049": {
437
  "content": "<extra_id_50>",
438
  "lstrip": true,
439
  "normalized": true,
440
  "rstrip": false,
441
- "single_word": false,
442
- "special": true
443
  },
444
- "32050": {
445
  "content": "<extra_id_49>",
446
  "lstrip": true,
447
  "normalized": true,
448
  "rstrip": false,
449
- "single_word": false,
450
- "special": true
451
  },
452
- "32051": {
453
  "content": "<extra_id_48>",
454
  "lstrip": true,
455
  "normalized": true,
456
  "rstrip": false,
457
- "single_word": false,
458
- "special": true
459
  },
460
- "32052": {
461
  "content": "<extra_id_47>",
462
  "lstrip": true,
463
  "normalized": true,
464
  "rstrip": false,
465
- "single_word": false,
466
- "special": true
467
  },
468
- "32053": {
469
  "content": "<extra_id_46>",
470
  "lstrip": true,
471
  "normalized": true,
472
  "rstrip": false,
473
- "single_word": false,
474
- "special": true
475
  },
476
- "32054": {
477
  "content": "<extra_id_45>",
478
  "lstrip": true,
479
  "normalized": true,
480
  "rstrip": false,
481
- "single_word": false,
482
- "special": true
483
  },
484
- "32055": {
485
  "content": "<extra_id_44>",
486
  "lstrip": true,
487
  "normalized": true,
488
  "rstrip": false,
489
- "single_word": false,
490
- "special": true
491
  },
492
- "32056": {
493
  "content": "<extra_id_43>",
494
  "lstrip": true,
495
  "normalized": true,
496
  "rstrip": false,
497
- "single_word": false,
498
- "special": true
499
  },
500
- "32057": {
501
  "content": "<extra_id_42>",
502
  "lstrip": true,
503
  "normalized": true,
504
  "rstrip": false,
505
- "single_word": false,
506
- "special": true
507
  },
508
- "32058": {
509
  "content": "<extra_id_41>",
510
  "lstrip": true,
511
  "normalized": true,
512
  "rstrip": false,
513
- "single_word": false,
514
- "special": true
515
  },
516
- "32059": {
517
  "content": "<extra_id_40>",
518
  "lstrip": true,
519
  "normalized": true,
520
  "rstrip": false,
521
- "single_word": false,
522
- "special": true
523
  },
524
- "32060": {
525
  "content": "<extra_id_39>",
526
  "lstrip": true,
527
  "normalized": true,
528
  "rstrip": false,
529
- "single_word": false,
530
- "special": true
531
  },
532
- "32061": {
533
  "content": "<extra_id_38>",
534
  "lstrip": true,
535
  "normalized": true,
536
  "rstrip": false,
537
- "single_word": false,
538
- "special": true
539
  },
540
- "32062": {
541
  "content": "<extra_id_37>",
542
  "lstrip": true,
543
  "normalized": true,
544
  "rstrip": false,
545
- "single_word": false,
546
- "special": true
547
  },
548
- "32063": {
549
  "content": "<extra_id_36>",
550
  "lstrip": true,
551
  "normalized": true,
552
  "rstrip": false,
553
- "single_word": false,
554
- "special": true
555
  },
556
- "32064": {
557
  "content": "<extra_id_35>",
558
  "lstrip": true,
559
  "normalized": true,
560
  "rstrip": false,
561
- "single_word": false,
562
- "special": true
563
  },
564
- "32065": {
565
  "content": "<extra_id_34>",
566
  "lstrip": true,
567
  "normalized": true,
568
  "rstrip": false,
569
- "single_word": false,
570
- "special": true
571
  },
572
- "32066": {
573
  "content": "<extra_id_33>",
574
  "lstrip": true,
575
  "normalized": true,
576
  "rstrip": false,
577
- "single_word": false,
578
- "special": true
579
  },
580
- "32067": {
581
  "content": "<extra_id_32>",
582
  "lstrip": true,
583
  "normalized": true,
584
  "rstrip": false,
585
- "single_word": false,
586
- "special": true
587
  },
588
- "32068": {
589
  "content": "<extra_id_31>",
590
  "lstrip": true,
591
  "normalized": true,
592
  "rstrip": false,
593
- "single_word": false,
594
- "special": true
595
  },
596
- "32069": {
597
  "content": "<extra_id_30>",
598
  "lstrip": true,
599
  "normalized": true,
600
  "rstrip": false,
601
- "single_word": false,
602
- "special": true
603
  },
604
- "32070": {
605
  "content": "<extra_id_29>",
606
  "lstrip": true,
607
  "normalized": true,
608
  "rstrip": false,
609
- "single_word": false,
610
- "special": true
611
  },
612
- "32071": {
613
  "content": "<extra_id_28>",
614
  "lstrip": true,
615
  "normalized": true,
616
  "rstrip": false,
617
- "single_word": false,
618
- "special": true
619
  },
620
- "32072": {
621
  "content": "<extra_id_27>",
622
  "lstrip": true,
623
  "normalized": true,
624
  "rstrip": false,
625
- "single_word": false,
626
- "special": true
627
  },
628
- "32073": {
629
  "content": "<extra_id_26>",
630
  "lstrip": true,
631
  "normalized": true,
632
  "rstrip": false,
633
- "single_word": false,
634
- "special": true
635
  },
636
- "32074": {
637
  "content": "<extra_id_25>",
638
  "lstrip": true,
639
  "normalized": true,
640
  "rstrip": false,
641
- "single_word": false,
642
- "special": true
643
  },
644
- "32075": {
645
  "content": "<extra_id_24>",
646
  "lstrip": true,
647
  "normalized": true,
648
  "rstrip": false,
649
- "single_word": false,
650
- "special": true
651
  },
652
- "32076": {
653
  "content": "<extra_id_23>",
654
  "lstrip": true,
655
  "normalized": true,
656
  "rstrip": false,
657
- "single_word": false,
658
- "special": true
659
  },
660
- "32077": {
661
  "content": "<extra_id_22>",
662
  "lstrip": true,
663
  "normalized": true,
664
  "rstrip": false,
665
- "single_word": false,
666
- "special": true
667
  },
668
- "32078": {
669
  "content": "<extra_id_21>",
670
  "lstrip": true,
671
  "normalized": true,
672
  "rstrip": false,
673
- "single_word": false,
674
- "special": true
675
  },
676
- "32079": {
677
  "content": "<extra_id_20>",
678
  "lstrip": true,
679
  "normalized": true,
680
  "rstrip": false,
681
- "single_word": false,
682
- "special": true
683
  },
684
- "32080": {
685
  "content": "<extra_id_19>",
686
  "lstrip": true,
687
  "normalized": true,
688
  "rstrip": false,
689
- "single_word": false,
690
- "special": true
691
  },
692
- "32081": {
693
  "content": "<extra_id_18>",
694
  "lstrip": true,
695
  "normalized": true,
696
  "rstrip": false,
697
- "single_word": false,
698
- "special": true
699
  },
700
- "32082": {
701
  "content": "<extra_id_17>",
702
  "lstrip": true,
703
  "normalized": true,
704
  "rstrip": false,
705
- "single_word": false,
706
- "special": true
707
  },
708
- "32083": {
709
  "content": "<extra_id_16>",
710
  "lstrip": true,
711
  "normalized": true,
712
  "rstrip": false,
713
- "single_word": false,
714
- "special": true
715
  },
716
- "32084": {
717
  "content": "<extra_id_15>",
718
  "lstrip": true,
719
  "normalized": true,
720
  "rstrip": false,
721
- "single_word": false,
722
- "special": true
723
  },
724
- "32085": {
725
  "content": "<extra_id_14>",
726
  "lstrip": true,
727
  "normalized": true,
728
  "rstrip": false,
729
- "single_word": false,
730
- "special": true
731
  },
732
- "32086": {
733
  "content": "<extra_id_13>",
734
  "lstrip": true,
735
  "normalized": true,
736
  "rstrip": false,
737
- "single_word": false,
738
- "special": true
739
  },
740
- "32087": {
741
  "content": "<extra_id_12>",
742
  "lstrip": true,
743
  "normalized": true,
744
  "rstrip": false,
745
- "single_word": false,
746
- "special": true
747
  },
748
- "32088": {
749
  "content": "<extra_id_11>",
750
  "lstrip": true,
751
  "normalized": true,
752
  "rstrip": false,
753
- "single_word": false,
754
- "special": true
755
  },
756
- "32089": {
757
  "content": "<extra_id_10>",
758
  "lstrip": true,
759
  "normalized": true,
760
  "rstrip": false,
761
- "single_word": false,
762
- "special": true
763
  },
764
- "32090": {
765
  "content": "<extra_id_9>",
766
  "lstrip": true,
767
  "normalized": true,
768
  "rstrip": false,
769
- "single_word": false,
770
- "special": true
771
  },
772
- "32091": {
773
  "content": "<extra_id_8>",
774
  "lstrip": true,
775
  "normalized": true,
776
  "rstrip": false,
777
- "single_word": false,
778
- "special": true
779
  },
780
- "32092": {
781
  "content": "<extra_id_7>",
782
  "lstrip": true,
783
  "normalized": true,
784
  "rstrip": false,
785
- "single_word": false,
786
- "special": true
787
  },
788
- "32093": {
789
  "content": "<extra_id_6>",
790
  "lstrip": true,
791
  "normalized": true,
792
  "rstrip": false,
793
- "single_word": false,
794
- "special": true
795
  },
796
- "32094": {
797
  "content": "<extra_id_5>",
798
  "lstrip": true,
799
  "normalized": true,
800
  "rstrip": false,
801
- "single_word": false,
802
- "special": true
803
  },
804
- "32095": {
805
  "content": "<extra_id_4>",
806
  "lstrip": true,
807
  "normalized": true,
808
  "rstrip": false,
809
- "single_word": false,
810
- "special": true
811
  },
812
- "32096": {
813
  "content": "<extra_id_3>",
814
  "lstrip": true,
815
  "normalized": true,
816
  "rstrip": false,
817
- "single_word": false,
818
- "special": true
819
  },
820
- "32097": {
821
  "content": "<extra_id_2>",
822
  "lstrip": true,
823
  "normalized": true,
824
  "rstrip": false,
825
- "single_word": false,
826
- "special": true
827
  },
828
- "32098": {
829
  "content": "<extra_id_1>",
830
  "lstrip": true,
831
  "normalized": true,
832
  "rstrip": false,
833
- "single_word": false,
834
- "special": true
835
  },
836
- "32099": {
837
  "content": "<extra_id_0>",
838
  "lstrip": true,
839
  "normalized": true,
840
  "rstrip": false,
841
- "single_word": false,
842
- "special": true
843
  }
844
- },
845
- "additional_special_tokens": [
846
- "<extra_id_99>",
847
- "<extra_id_98>",
848
- "<extra_id_97>",
849
- "<extra_id_96>",
850
- "<extra_id_95>",
851
- "<extra_id_94>",
852
- "<extra_id_93>",
853
- "<extra_id_92>",
854
- "<extra_id_91>",
855
- "<extra_id_90>",
856
- "<extra_id_89>",
857
- "<extra_id_88>",
858
- "<extra_id_87>",
859
- "<extra_id_86>",
860
- "<extra_id_85>",
861
- "<extra_id_84>",
862
- "<extra_id_83>",
863
- "<extra_id_82>",
864
- "<extra_id_81>",
865
- "<extra_id_80>",
866
- "<extra_id_79>",
867
- "<extra_id_78>",
868
- "<extra_id_77>",
869
- "<extra_id_76>",
870
- "<extra_id_75>",
871
- "<extra_id_74>",
872
- "<extra_id_73>",
873
- "<extra_id_72>",
874
- "<extra_id_71>",
875
- "<extra_id_70>",
876
- "<extra_id_69>",
877
- "<extra_id_68>",
878
- "<extra_id_67>",
879
- "<extra_id_66>",
880
- "<extra_id_65>",
881
- "<extra_id_64>",
882
- "<extra_id_63>",
883
- "<extra_id_62>",
884
- "<extra_id_61>",
885
- "<extra_id_60>",
886
- "<extra_id_59>",
887
- "<extra_id_58>",
888
- "<extra_id_57>",
889
- "<extra_id_56>",
890
- "<extra_id_55>",
891
- "<extra_id_54>",
892
- "<extra_id_53>",
893
- "<extra_id_52>",
894
- "<extra_id_51>",
895
- "<extra_id_50>",
896
- "<extra_id_49>",
897
- "<extra_id_48>",
898
- "<extra_id_47>",
899
- "<extra_id_46>",
900
- "<extra_id_45>",
901
- "<extra_id_44>",
902
- "<extra_id_43>",
903
- "<extra_id_42>",
904
- "<extra_id_41>",
905
- "<extra_id_40>",
906
- "<extra_id_39>",
907
- "<extra_id_38>",
908
- "<extra_id_37>",
909
- "<extra_id_36>",
910
- "<extra_id_35>",
911
- "<extra_id_34>",
912
- "<extra_id_33>",
913
- "<extra_id_32>",
914
- "<extra_id_31>",
915
- "<extra_id_30>",
916
- "<extra_id_29>",
917
- "<extra_id_28>",
918
- "<extra_id_27>",
919
- "<extra_id_26>",
920
- "<extra_id_25>",
921
- "<extra_id_24>",
922
- "<extra_id_23>",
923
- "<extra_id_22>",
924
- "<extra_id_21>",
925
- "<extra_id_20>",
926
- "<extra_id_19>",
927
- "<extra_id_18>",
928
- "<extra_id_17>",
929
- "<extra_id_16>",
930
- "<extra_id_15>",
931
- "<extra_id_14>",
932
- "<extra_id_13>",
933
- "<extra_id_12>",
934
- "<extra_id_11>",
935
- "<extra_id_10>",
936
- "<extra_id_9>",
937
- "<extra_id_8>",
938
- "<extra_id_7>",
939
- "<extra_id_6>",
940
- "<extra_id_5>",
941
- "<extra_id_4>",
942
- "<extra_id_3>",
943
- "<extra_id_2>",
944
- "<extra_id_1>",
945
- "<extra_id_0>"
946
  ],
 
947
  "bos_token": "<s>",
948
- "clean_up_tokenization_spaces": false,
949
  "cls_token": "<s>",
950
  "eos_token": "</s>",
951
  "errors": "replace",
952
- "extra_special_tokens": {},
 
953
  "mask_token": "<mask>",
954
  "model_max_length": 512,
955
  "pad_token": "<pad>",
 
1
  {
2
  "add_prefix_space": false,
3
+ "additional_special_tokens": [
4
+ {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "content": "<extra_id_99>",
6
  "lstrip": true,
7
  "normalized": true,
8
  "rstrip": false,
9
+ "single_word": false
 
10
  },
11
+ {
12
  "content": "<extra_id_98>",
13
  "lstrip": true,
14
  "normalized": true,
15
  "rstrip": false,
16
+ "single_word": false
 
17
  },
18
+ {
19
  "content": "<extra_id_97>",
20
  "lstrip": true,
21
  "normalized": true,
22
  "rstrip": false,
23
+ "single_word": false
 
24
  },
25
+ {
26
  "content": "<extra_id_96>",
27
  "lstrip": true,
28
  "normalized": true,
29
  "rstrip": false,
30
+ "single_word": false
 
31
  },
32
+ {
33
  "content": "<extra_id_95>",
34
  "lstrip": true,
35
  "normalized": true,
36
  "rstrip": false,
37
+ "single_word": false
 
38
  },
39
+ {
40
  "content": "<extra_id_94>",
41
  "lstrip": true,
42
  "normalized": true,
43
  "rstrip": false,
44
+ "single_word": false
 
45
  },
46
+ {
47
  "content": "<extra_id_93>",
48
  "lstrip": true,
49
  "normalized": true,
50
  "rstrip": false,
51
+ "single_word": false
 
52
  },
53
+ {
54
  "content": "<extra_id_92>",
55
  "lstrip": true,
56
  "normalized": true,
57
  "rstrip": false,
58
+ "single_word": false
 
59
  },
60
+ {
61
  "content": "<extra_id_91>",
62
  "lstrip": true,
63
  "normalized": true,
64
  "rstrip": false,
65
+ "single_word": false
 
66
  },
67
+ {
68
  "content": "<extra_id_90>",
69
  "lstrip": true,
70
  "normalized": true,
71
  "rstrip": false,
72
+ "single_word": false
 
73
  },
74
+ {
75
  "content": "<extra_id_89>",
76
  "lstrip": true,
77
  "normalized": true,
78
  "rstrip": false,
79
+ "single_word": false
 
80
  },
81
+ {
82
  "content": "<extra_id_88>",
83
  "lstrip": true,
84
  "normalized": true,
85
  "rstrip": false,
86
+ "single_word": false
 
87
  },
88
+ {
89
  "content": "<extra_id_87>",
90
  "lstrip": true,
91
  "normalized": true,
92
  "rstrip": false,
93
+ "single_word": false
 
94
  },
95
+ {
96
  "content": "<extra_id_86>",
97
  "lstrip": true,
98
  "normalized": true,
99
  "rstrip": false,
100
+ "single_word": false
 
101
  },
102
+ {
103
  "content": "<extra_id_85>",
104
  "lstrip": true,
105
  "normalized": true,
106
  "rstrip": false,
107
+ "single_word": false
 
108
  },
109
+ {
110
  "content": "<extra_id_84>",
111
  "lstrip": true,
112
  "normalized": true,
113
  "rstrip": false,
114
+ "single_word": false
 
115
  },
116
+ {
117
  "content": "<extra_id_83>",
118
  "lstrip": true,
119
  "normalized": true,
120
  "rstrip": false,
121
+ "single_word": false
 
122
  },
123
+ {
124
  "content": "<extra_id_82>",
125
  "lstrip": true,
126
  "normalized": true,
127
  "rstrip": false,
128
+ "single_word": false
 
129
  },
130
+ {
131
  "content": "<extra_id_81>",
132
  "lstrip": true,
133
  "normalized": true,
134
  "rstrip": false,
135
+ "single_word": false
 
136
  },
137
+ {
138
  "content": "<extra_id_80>",
139
  "lstrip": true,
140
  "normalized": true,
141
  "rstrip": false,
142
+ "single_word": false
 
143
  },
144
+ {
145
  "content": "<extra_id_79>",
146
  "lstrip": true,
147
  "normalized": true,
148
  "rstrip": false,
149
+ "single_word": false
 
150
  },
151
+ {
152
  "content": "<extra_id_78>",
153
  "lstrip": true,
154
  "normalized": true,
155
  "rstrip": false,
156
+ "single_word": false
 
157
  },
158
+ {
159
  "content": "<extra_id_77>",
160
  "lstrip": true,
161
  "normalized": true,
162
  "rstrip": false,
163
+ "single_word": false
 
164
  },
165
+ {
166
  "content": "<extra_id_76>",
167
  "lstrip": true,
168
  "normalized": true,
169
  "rstrip": false,
170
+ "single_word": false
 
171
  },
172
+ {
173
  "content": "<extra_id_75>",
174
  "lstrip": true,
175
  "normalized": true,
176
  "rstrip": false,
177
+ "single_word": false
 
178
  },
179
+ {
180
  "content": "<extra_id_74>",
181
  "lstrip": true,
182
  "normalized": true,
183
  "rstrip": false,
184
+ "single_word": false
 
185
  },
186
+ {
187
  "content": "<extra_id_73>",
188
  "lstrip": true,
189
  "normalized": true,
190
  "rstrip": false,
191
+ "single_word": false
 
192
  },
193
+ {
194
  "content": "<extra_id_72>",
195
  "lstrip": true,
196
  "normalized": true,
197
  "rstrip": false,
198
+ "single_word": false
 
199
  },
200
+ {
201
  "content": "<extra_id_71>",
202
  "lstrip": true,
203
  "normalized": true,
204
  "rstrip": false,
205
+ "single_word": false
 
206
  },
207
+ {
208
  "content": "<extra_id_70>",
209
  "lstrip": true,
210
  "normalized": true,
211
  "rstrip": false,
212
+ "single_word": false
 
213
  },
214
+ {
215
  "content": "<extra_id_69>",
216
  "lstrip": true,
217
  "normalized": true,
218
  "rstrip": false,
219
+ "single_word": false
 
220
  },
221
+ {
222
  "content": "<extra_id_68>",
223
  "lstrip": true,
224
  "normalized": true,
225
  "rstrip": false,
226
+ "single_word": false
 
227
  },
228
+ {
229
  "content": "<extra_id_67>",
230
  "lstrip": true,
231
  "normalized": true,
232
  "rstrip": false,
233
+ "single_word": false
 
234
  },
235
+ {
236
  "content": "<extra_id_66>",
237
  "lstrip": true,
238
  "normalized": true,
239
  "rstrip": false,
240
+ "single_word": false
 
241
  },
242
+ {
243
  "content": "<extra_id_65>",
244
  "lstrip": true,
245
  "normalized": true,
246
  "rstrip": false,
247
+ "single_word": false
 
248
  },
249
+ {
250
  "content": "<extra_id_64>",
251
  "lstrip": true,
252
  "normalized": true,
253
  "rstrip": false,
254
+ "single_word": false
 
255
  },
256
+ {
257
  "content": "<extra_id_63>",
258
  "lstrip": true,
259
  "normalized": true,
260
  "rstrip": false,
261
+ "single_word": false
 
262
  },
263
+ {
264
  "content": "<extra_id_62>",
265
  "lstrip": true,
266
  "normalized": true,
267
  "rstrip": false,
268
+ "single_word": false
 
269
  },
270
+ {
271
  "content": "<extra_id_61>",
272
  "lstrip": true,
273
  "normalized": true,
274
  "rstrip": false,
275
+ "single_word": false
 
276
  },
277
+ {
278
  "content": "<extra_id_60>",
279
  "lstrip": true,
280
  "normalized": true,
281
  "rstrip": false,
282
+ "single_word": false
 
283
  },
284
+ {
285
  "content": "<extra_id_59>",
286
  "lstrip": true,
287
  "normalized": true,
288
  "rstrip": false,
289
+ "single_word": false
 
290
  },
291
+ {
292
  "content": "<extra_id_58>",
293
  "lstrip": true,
294
  "normalized": true,
295
  "rstrip": false,
296
+ "single_word": false
 
297
  },
298
+ {
299
  "content": "<extra_id_57>",
300
  "lstrip": true,
301
  "normalized": true,
302
  "rstrip": false,
303
+ "single_word": false
 
304
  },
305
+ {
306
  "content": "<extra_id_56>",
307
  "lstrip": true,
308
  "normalized": true,
309
  "rstrip": false,
310
+ "single_word": false
 
311
  },
312
+ {
313
  "content": "<extra_id_55>",
314
  "lstrip": true,
315
  "normalized": true,
316
  "rstrip": false,
317
+ "single_word": false
 
318
  },
319
+ {
320
  "content": "<extra_id_54>",
321
  "lstrip": true,
322
  "normalized": true,
323
  "rstrip": false,
324
+ "single_word": false
 
325
  },
326
+ {
327
  "content": "<extra_id_53>",
328
  "lstrip": true,
329
  "normalized": true,
330
  "rstrip": false,
331
+ "single_word": false
 
332
  },
333
+ {
334
  "content": "<extra_id_52>",
335
  "lstrip": true,
336
  "normalized": true,
337
  "rstrip": false,
338
+ "single_word": false
 
339
  },
340
+ {
341
  "content": "<extra_id_51>",
342
  "lstrip": true,
343
  "normalized": true,
344
  "rstrip": false,
345
+ "single_word": false
 
346
  },
347
+ {
348
  "content": "<extra_id_50>",
349
  "lstrip": true,
350
  "normalized": true,
351
  "rstrip": false,
352
+ "single_word": false
 
353
  },
354
+ {
355
  "content": "<extra_id_49>",
356
  "lstrip": true,
357
  "normalized": true,
358
  "rstrip": false,
359
+ "single_word": false
 
360
  },
361
+ {
362
  "content": "<extra_id_48>",
363
  "lstrip": true,
364
  "normalized": true,
365
  "rstrip": false,
366
+ "single_word": false
 
367
  },
368
+ {
369
  "content": "<extra_id_47>",
370
  "lstrip": true,
371
  "normalized": true,
372
  "rstrip": false,
373
+ "single_word": false
 
374
  },
375
+ {
376
  "content": "<extra_id_46>",
377
  "lstrip": true,
378
  "normalized": true,
379
  "rstrip": false,
380
+ "single_word": false
 
381
  },
382
+ {
383
  "content": "<extra_id_45>",
384
  "lstrip": true,
385
  "normalized": true,
386
  "rstrip": false,
387
+ "single_word": false
 
388
  },
389
+ {
390
  "content": "<extra_id_44>",
391
  "lstrip": true,
392
  "normalized": true,
393
  "rstrip": false,
394
+ "single_word": false
 
395
  },
396
+ {
397
  "content": "<extra_id_43>",
398
  "lstrip": true,
399
  "normalized": true,
400
  "rstrip": false,
401
+ "single_word": false
 
402
  },
403
+ {
404
  "content": "<extra_id_42>",
405
  "lstrip": true,
406
  "normalized": true,
407
  "rstrip": false,
408
+ "single_word": false
 
409
  },
410
+ {
411
  "content": "<extra_id_41>",
412
  "lstrip": true,
413
  "normalized": true,
414
  "rstrip": false,
415
+ "single_word": false
 
416
  },
417
+ {
418
  "content": "<extra_id_40>",
419
  "lstrip": true,
420
  "normalized": true,
421
  "rstrip": false,
422
+ "single_word": false
 
423
  },
424
+ {
425
  "content": "<extra_id_39>",
426
  "lstrip": true,
427
  "normalized": true,
428
  "rstrip": false,
429
+ "single_word": false
 
430
  },
431
+ {
432
  "content": "<extra_id_38>",
433
  "lstrip": true,
434
  "normalized": true,
435
  "rstrip": false,
436
+ "single_word": false
 
437
  },
438
+ {
439
  "content": "<extra_id_37>",
440
  "lstrip": true,
441
  "normalized": true,
442
  "rstrip": false,
443
+ "single_word": false
 
444
  },
445
+ {
446
  "content": "<extra_id_36>",
447
  "lstrip": true,
448
  "normalized": true,
449
  "rstrip": false,
450
+ "single_word": false
 
451
  },
452
+ {
453
  "content": "<extra_id_35>",
454
  "lstrip": true,
455
  "normalized": true,
456
  "rstrip": false,
457
+ "single_word": false
 
458
  },
459
+ {
460
  "content": "<extra_id_34>",
461
  "lstrip": true,
462
  "normalized": true,
463
  "rstrip": false,
464
+ "single_word": false
 
465
  },
466
+ {
467
  "content": "<extra_id_33>",
468
  "lstrip": true,
469
  "normalized": true,
470
  "rstrip": false,
471
+ "single_word": false
 
472
  },
473
+ {
474
  "content": "<extra_id_32>",
475
  "lstrip": true,
476
  "normalized": true,
477
  "rstrip": false,
478
+ "single_word": false
 
479
  },
480
+ {
481
  "content": "<extra_id_31>",
482
  "lstrip": true,
483
  "normalized": true,
484
  "rstrip": false,
485
+ "single_word": false
 
486
  },
487
+ {
488
  "content": "<extra_id_30>",
489
  "lstrip": true,
490
  "normalized": true,
491
  "rstrip": false,
492
+ "single_word": false
 
493
  },
494
+ {
495
  "content": "<extra_id_29>",
496
  "lstrip": true,
497
  "normalized": true,
498
  "rstrip": false,
499
+ "single_word": false
 
500
  },
501
+ {
502
  "content": "<extra_id_28>",
503
  "lstrip": true,
504
  "normalized": true,
505
  "rstrip": false,
506
+ "single_word": false
 
507
  },
508
+ {
509
  "content": "<extra_id_27>",
510
  "lstrip": true,
511
  "normalized": true,
512
  "rstrip": false,
513
+ "single_word": false
 
514
  },
515
+ {
516
  "content": "<extra_id_26>",
517
  "lstrip": true,
518
  "normalized": true,
519
  "rstrip": false,
520
+ "single_word": false
 
521
  },
522
+ {
523
  "content": "<extra_id_25>",
524
  "lstrip": true,
525
  "normalized": true,
526
  "rstrip": false,
527
+ "single_word": false
 
528
  },
529
+ {
530
  "content": "<extra_id_24>",
531
  "lstrip": true,
532
  "normalized": true,
533
  "rstrip": false,
534
+ "single_word": false
 
535
  },
536
+ {
537
  "content": "<extra_id_23>",
538
  "lstrip": true,
539
  "normalized": true,
540
  "rstrip": false,
541
+ "single_word": false
 
542
  },
543
+ {
544
  "content": "<extra_id_22>",
545
  "lstrip": true,
546
  "normalized": true,
547
  "rstrip": false,
548
+ "single_word": false
 
549
  },
550
+ {
551
  "content": "<extra_id_21>",
552
  "lstrip": true,
553
  "normalized": true,
554
  "rstrip": false,
555
+ "single_word": false
 
556
  },
557
+ {
558
  "content": "<extra_id_20>",
559
  "lstrip": true,
560
  "normalized": true,
561
  "rstrip": false,
562
+ "single_word": false
 
563
  },
564
+ {
565
  "content": "<extra_id_19>",
566
  "lstrip": true,
567
  "normalized": true,
568
  "rstrip": false,
569
+ "single_word": false
 
570
  },
571
+ {
572
  "content": "<extra_id_18>",
573
  "lstrip": true,
574
  "normalized": true,
575
  "rstrip": false,
576
+ "single_word": false
 
577
  },
578
+ {
579
  "content": "<extra_id_17>",
580
  "lstrip": true,
581
  "normalized": true,
582
  "rstrip": false,
583
+ "single_word": false
 
584
  },
585
+ {
586
  "content": "<extra_id_16>",
587
  "lstrip": true,
588
  "normalized": true,
589
  "rstrip": false,
590
+ "single_word": false
 
591
  },
592
+ {
593
  "content": "<extra_id_15>",
594
  "lstrip": true,
595
  "normalized": true,
596
  "rstrip": false,
597
+ "single_word": false
 
598
  },
599
+ {
600
  "content": "<extra_id_14>",
601
  "lstrip": true,
602
  "normalized": true,
603
  "rstrip": false,
604
+ "single_word": false
 
605
  },
606
+ {
607
  "content": "<extra_id_13>",
608
  "lstrip": true,
609
  "normalized": true,
610
  "rstrip": false,
611
+ "single_word": false
 
612
  },
613
+ {
614
  "content": "<extra_id_12>",
615
  "lstrip": true,
616
  "normalized": true,
617
  "rstrip": false,
618
+ "single_word": false
 
619
  },
620
+ {
621
  "content": "<extra_id_11>",
622
  "lstrip": true,
623
  "normalized": true,
624
  "rstrip": false,
625
+ "single_word": false
 
626
  },
627
+ {
628
  "content": "<extra_id_10>",
629
  "lstrip": true,
630
  "normalized": true,
631
  "rstrip": false,
632
+ "single_word": false
 
633
  },
634
+ {
635
  "content": "<extra_id_9>",
636
  "lstrip": true,
637
  "normalized": true,
638
  "rstrip": false,
639
+ "single_word": false
 
640
  },
641
+ {
642
  "content": "<extra_id_8>",
643
  "lstrip": true,
644
  "normalized": true,
645
  "rstrip": false,
646
+ "single_word": false
 
647
  },
648
+ {
649
  "content": "<extra_id_7>",
650
  "lstrip": true,
651
  "normalized": true,
652
  "rstrip": false,
653
+ "single_word": false
 
654
  },
655
+ {
656
  "content": "<extra_id_6>",
657
  "lstrip": true,
658
  "normalized": true,
659
  "rstrip": false,
660
+ "single_word": false
 
661
  },
662
+ {
663
  "content": "<extra_id_5>",
664
  "lstrip": true,
665
  "normalized": true,
666
  "rstrip": false,
667
+ "single_word": false
 
668
  },
669
+ {
670
  "content": "<extra_id_4>",
671
  "lstrip": true,
672
  "normalized": true,
673
  "rstrip": false,
674
+ "single_word": false
 
675
  },
676
+ {
677
  "content": "<extra_id_3>",
678
  "lstrip": true,
679
  "normalized": true,
680
  "rstrip": false,
681
+ "single_word": false
 
682
  },
683
+ {
684
  "content": "<extra_id_2>",
685
  "lstrip": true,
686
  "normalized": true,
687
  "rstrip": false,
688
+ "single_word": false
 
689
  },
690
+ {
691
  "content": "<extra_id_1>",
692
  "lstrip": true,
693
  "normalized": true,
694
  "rstrip": false,
695
+ "single_word": false
 
696
  },
697
+ {
698
  "content": "<extra_id_0>",
699
  "lstrip": true,
700
  "normalized": true,
701
  "rstrip": false,
702
+ "single_word": false
 
703
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
704
  ],
705
+ "backend": "tokenizers",
706
  "bos_token": "<s>",
 
707
  "cls_token": "<s>",
708
  "eos_token": "</s>",
709
  "errors": "replace",
710
+ "extra_special_tokens": [],
711
+ "is_local": false,
712
  "mask_token": "<mask>",
713
  "model_max_length": 512,
714
  "pad_token": "<pad>",