harish commited on
Commit
34fdec9
·
1 Parent(s): 2c61011

added model

Browse files
checkpoint-500/config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "t5-base",
3
+ "architectures": [
4
+ "T5ForConditionalGeneration"
5
+ ],
6
+ "d_ff": 3072,
7
+ "d_kv": 64,
8
+ "d_model": 768,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "relu",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "relu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": false,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "t5",
19
+ "n_positions": 512,
20
+ "num_decoder_layers": 12,
21
+ "num_heads": 12,
22
+ "num_layers": 12,
23
+ "output_past": true,
24
+ "pad_token_id": 0,
25
+ "relative_attention_max_distance": 128,
26
+ "relative_attention_num_buckets": 32,
27
+ "task_specific_params": {
28
+ "summarization": {
29
+ "early_stopping": true,
30
+ "length_penalty": 2.0,
31
+ "max_length": 200,
32
+ "min_length": 30,
33
+ "no_repeat_ngram_size": 3,
34
+ "num_beams": 4,
35
+ "prefix": "summarize: "
36
+ },
37
+ "translation_en_to_de": {
38
+ "early_stopping": true,
39
+ "max_length": 300,
40
+ "num_beams": 4,
41
+ "prefix": "translate English to German: "
42
+ },
43
+ "translation_en_to_fr": {
44
+ "early_stopping": true,
45
+ "max_length": 300,
46
+ "num_beams": 4,
47
+ "prefix": "translate English to French: "
48
+ },
49
+ "translation_en_to_ro": {
50
+ "early_stopping": true,
51
+ "max_length": 300,
52
+ "num_beams": 4,
53
+ "prefix": "translate English to Romanian: "
54
+ }
55
+ },
56
+ "torch_dtype": "float32",
57
+ "transformers_version": "4.21.1",
58
+ "use_cache": true,
59
+ "vocab_size": 32128
60
+ }
checkpoint-500/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21ec6bb2cee16f38e6b71bd229f69991bbbf7e2a9bce8197a2d100acae96eacc
3
+ size 1783379133
checkpoint-500/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d22b6b35b95997fc1afdfeaf2e969f39d533b9b32d495314f1175fa2b0ca2a0c
3
+ size 891700799
checkpoint-500/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52a51a7ffa1c43d2e830f4e82d32a8b5f6583fdd62075dcd4b2da514e490fdf8
3
+ size 14503
checkpoint-500/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b33a6bb891189ab867f17fac974dbaad97ec1f3d6ca66dbc7c25be834f19cebf
3
+ size 623
checkpoint-500/special_tokens_map.json ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": "</s>",
105
+ "pad_token": "<pad>",
106
+ "unk_token": "<unk>"
107
+ }
checkpoint-500/spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
3
+ size 791656
checkpoint-500/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-500/tokenizer_config.json ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": "</s>",
105
+ "extra_ids": 100,
106
+ "model_max_length": 512,
107
+ "name_or_path": "t5-base",
108
+ "pad_token": "<pad>",
109
+ "special_tokens_map_file": null,
110
+ "tokenizer_class": "T5Tokenizer",
111
+ "unk_token": "<unk>"
112
+ }
checkpoint-500/trainer_state.json ADDED
@@ -0,0 +1,364 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 6.097560975609756,
5
+ "global_step": 500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.12,
12
+ "learning_rate": 1e-05,
13
+ "loss": 0.4133,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.24,
18
+ "learning_rate": 2e-05,
19
+ "loss": 0.2546,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.37,
24
+ "learning_rate": 3e-05,
25
+ "loss": 0.1767,
26
+ "step": 30
27
+ },
28
+ {
29
+ "epoch": 0.49,
30
+ "learning_rate": 4e-05,
31
+ "loss": 0.1409,
32
+ "step": 40
33
+ },
34
+ {
35
+ "epoch": 0.61,
36
+ "learning_rate": 5e-05,
37
+ "loss": 0.1687,
38
+ "step": 50
39
+ },
40
+ {
41
+ "epoch": 0.73,
42
+ "learning_rate": 6e-05,
43
+ "loss": 0.1161,
44
+ "step": 60
45
+ },
46
+ {
47
+ "epoch": 0.85,
48
+ "learning_rate": 7e-05,
49
+ "loss": 0.1192,
50
+ "step": 70
51
+ },
52
+ {
53
+ "epoch": 0.98,
54
+ "learning_rate": 8e-05,
55
+ "loss": 0.1233,
56
+ "step": 80
57
+ },
58
+ {
59
+ "epoch": 1.0,
60
+ "eval_loss": 0.13027246296405792,
61
+ "eval_runtime": 3.8565,
62
+ "eval_samples_per_second": 37.599,
63
+ "eval_steps_per_second": 2.593,
64
+ "step": 82
65
+ },
66
+ {
67
+ "epoch": 1.1,
68
+ "learning_rate": 9e-05,
69
+ "loss": 0.1006,
70
+ "step": 90
71
+ },
72
+ {
73
+ "epoch": 1.22,
74
+ "learning_rate": 0.0001,
75
+ "loss": 0.0578,
76
+ "step": 100
77
+ },
78
+ {
79
+ "epoch": 1.34,
80
+ "learning_rate": 9.861111111111112e-05,
81
+ "loss": 0.0835,
82
+ "step": 110
83
+ },
84
+ {
85
+ "epoch": 1.46,
86
+ "learning_rate": 9.722222222222223e-05,
87
+ "loss": 0.0605,
88
+ "step": 120
89
+ },
90
+ {
91
+ "epoch": 1.59,
92
+ "learning_rate": 9.583333333333334e-05,
93
+ "loss": 0.0665,
94
+ "step": 130
95
+ },
96
+ {
97
+ "epoch": 1.71,
98
+ "learning_rate": 9.444444444444444e-05,
99
+ "loss": 0.0513,
100
+ "step": 140
101
+ },
102
+ {
103
+ "epoch": 1.83,
104
+ "learning_rate": 9.305555555555556e-05,
105
+ "loss": 0.0638,
106
+ "step": 150
107
+ },
108
+ {
109
+ "epoch": 1.95,
110
+ "learning_rate": 9.166666666666667e-05,
111
+ "loss": 0.0585,
112
+ "step": 160
113
+ },
114
+ {
115
+ "epoch": 2.0,
116
+ "eval_loss": 0.08042938262224197,
117
+ "eval_runtime": 3.8773,
118
+ "eval_samples_per_second": 37.397,
119
+ "eval_steps_per_second": 2.579,
120
+ "step": 164
121
+ },
122
+ {
123
+ "epoch": 2.07,
124
+ "learning_rate": 9.027777777777779e-05,
125
+ "loss": 0.022,
126
+ "step": 170
127
+ },
128
+ {
129
+ "epoch": 2.2,
130
+ "learning_rate": 8.888888888888889e-05,
131
+ "loss": 0.0175,
132
+ "step": 180
133
+ },
134
+ {
135
+ "epoch": 2.32,
136
+ "learning_rate": 8.75e-05,
137
+ "loss": 0.015,
138
+ "step": 190
139
+ },
140
+ {
141
+ "epoch": 2.44,
142
+ "learning_rate": 8.611111111111112e-05,
143
+ "loss": 0.0186,
144
+ "step": 200
145
+ },
146
+ {
147
+ "epoch": 2.56,
148
+ "learning_rate": 8.472222222222222e-05,
149
+ "loss": 0.025,
150
+ "step": 210
151
+ },
152
+ {
153
+ "epoch": 2.68,
154
+ "learning_rate": 8.333333333333334e-05,
155
+ "loss": 0.0237,
156
+ "step": 220
157
+ },
158
+ {
159
+ "epoch": 2.8,
160
+ "learning_rate": 8.194444444444445e-05,
161
+ "loss": 0.0199,
162
+ "step": 230
163
+ },
164
+ {
165
+ "epoch": 2.93,
166
+ "learning_rate": 8.055555555555556e-05,
167
+ "loss": 0.0305,
168
+ "step": 240
169
+ },
170
+ {
171
+ "epoch": 3.0,
172
+ "eval_loss": 0.11400174349546432,
173
+ "eval_runtime": 3.8699,
174
+ "eval_samples_per_second": 37.469,
175
+ "eval_steps_per_second": 2.584,
176
+ "step": 246
177
+ },
178
+ {
179
+ "epoch": 3.05,
180
+ "learning_rate": 7.916666666666666e-05,
181
+ "loss": 0.0067,
182
+ "step": 250
183
+ },
184
+ {
185
+ "epoch": 3.17,
186
+ "learning_rate": 7.777777777777778e-05,
187
+ "loss": 0.0084,
188
+ "step": 260
189
+ },
190
+ {
191
+ "epoch": 3.29,
192
+ "learning_rate": 7.638888888888889e-05,
193
+ "loss": 0.0078,
194
+ "step": 270
195
+ },
196
+ {
197
+ "epoch": 3.41,
198
+ "learning_rate": 7.500000000000001e-05,
199
+ "loss": 0.0036,
200
+ "step": 280
201
+ },
202
+ {
203
+ "epoch": 3.54,
204
+ "learning_rate": 7.361111111111111e-05,
205
+ "loss": 0.0075,
206
+ "step": 290
207
+ },
208
+ {
209
+ "epoch": 3.66,
210
+ "learning_rate": 7.222222222222222e-05,
211
+ "loss": 0.0051,
212
+ "step": 300
213
+ },
214
+ {
215
+ "epoch": 3.78,
216
+ "learning_rate": 7.083333333333334e-05,
217
+ "loss": 0.0067,
218
+ "step": 310
219
+ },
220
+ {
221
+ "epoch": 3.9,
222
+ "learning_rate": 6.944444444444444e-05,
223
+ "loss": 0.0147,
224
+ "step": 320
225
+ },
226
+ {
227
+ "epoch": 4.0,
228
+ "eval_loss": 0.17557735741138458,
229
+ "eval_runtime": 3.8616,
230
+ "eval_samples_per_second": 37.549,
231
+ "eval_steps_per_second": 2.59,
232
+ "step": 328
233
+ },
234
+ {
235
+ "epoch": 4.02,
236
+ "learning_rate": 6.805555555555556e-05,
237
+ "loss": 0.0212,
238
+ "step": 330
239
+ },
240
+ {
241
+ "epoch": 4.15,
242
+ "learning_rate": 6.666666666666667e-05,
243
+ "loss": 0.0073,
244
+ "step": 340
245
+ },
246
+ {
247
+ "epoch": 4.27,
248
+ "learning_rate": 6.527777777777778e-05,
249
+ "loss": 0.004,
250
+ "step": 350
251
+ },
252
+ {
253
+ "epoch": 4.39,
254
+ "learning_rate": 6.388888888888888e-05,
255
+ "loss": 0.0049,
256
+ "step": 360
257
+ },
258
+ {
259
+ "epoch": 4.51,
260
+ "learning_rate": 6.25e-05,
261
+ "loss": 0.0086,
262
+ "step": 370
263
+ },
264
+ {
265
+ "epoch": 4.63,
266
+ "learning_rate": 6.111111111111112e-05,
267
+ "loss": 0.0051,
268
+ "step": 380
269
+ },
270
+ {
271
+ "epoch": 4.76,
272
+ "learning_rate": 5.972222222222223e-05,
273
+ "loss": 0.0009,
274
+ "step": 390
275
+ },
276
+ {
277
+ "epoch": 4.88,
278
+ "learning_rate": 5.833333333333334e-05,
279
+ "loss": 0.005,
280
+ "step": 400
281
+ },
282
+ {
283
+ "epoch": 5.0,
284
+ "learning_rate": 5.6944444444444445e-05,
285
+ "loss": 0.0025,
286
+ "step": 410
287
+ },
288
+ {
289
+ "epoch": 5.0,
290
+ "eval_loss": 0.19509804248809814,
291
+ "eval_runtime": 3.8565,
292
+ "eval_samples_per_second": 37.599,
293
+ "eval_steps_per_second": 2.593,
294
+ "step": 410
295
+ },
296
+ {
297
+ "epoch": 5.12,
298
+ "learning_rate": 5.555555555555556e-05,
299
+ "loss": 0.0039,
300
+ "step": 420
301
+ },
302
+ {
303
+ "epoch": 5.24,
304
+ "learning_rate": 5.4166666666666664e-05,
305
+ "loss": 0.0037,
306
+ "step": 430
307
+ },
308
+ {
309
+ "epoch": 5.37,
310
+ "learning_rate": 5.2777777777777784e-05,
311
+ "loss": 0.0032,
312
+ "step": 440
313
+ },
314
+ {
315
+ "epoch": 5.49,
316
+ "learning_rate": 5.138888888888889e-05,
317
+ "loss": 0.0002,
318
+ "step": 450
319
+ },
320
+ {
321
+ "epoch": 5.61,
322
+ "learning_rate": 5e-05,
323
+ "loss": 0.006,
324
+ "step": 460
325
+ },
326
+ {
327
+ "epoch": 5.73,
328
+ "learning_rate": 4.8611111111111115e-05,
329
+ "loss": 0.0067,
330
+ "step": 470
331
+ },
332
+ {
333
+ "epoch": 5.85,
334
+ "learning_rate": 4.722222222222222e-05,
335
+ "loss": 0.0046,
336
+ "step": 480
337
+ },
338
+ {
339
+ "epoch": 5.98,
340
+ "learning_rate": 4.5833333333333334e-05,
341
+ "loss": 0.0009,
342
+ "step": 490
343
+ },
344
+ {
345
+ "epoch": 6.0,
346
+ "eval_loss": 0.21209779381752014,
347
+ "eval_runtime": 3.8607,
348
+ "eval_samples_per_second": 37.558,
349
+ "eval_steps_per_second": 2.59,
350
+ "step": 492
351
+ },
352
+ {
353
+ "epoch": 6.1,
354
+ "learning_rate": 4.4444444444444447e-05,
355
+ "loss": 0.0017,
356
+ "step": 500
357
+ }
358
+ ],
359
+ "max_steps": 820,
360
+ "num_train_epochs": 10,
361
+ "total_flos": 0.0,
362
+ "trial_name": null,
363
+ "trial_params": null
364
+ }
checkpoint-500/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:059a30c261f3bd54fbfe2362d7894c790b619685a34fdc10f23e0cddffd8fcd8
3
+ size 3567
checkpoint-750/config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "t5-base",
3
+ "architectures": [
4
+ "T5ForConditionalGeneration"
5
+ ],
6
+ "d_ff": 3072,
7
+ "d_kv": 64,
8
+ "d_model": 768,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "relu",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "relu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": false,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "t5",
19
+ "n_positions": 512,
20
+ "num_decoder_layers": 12,
21
+ "num_heads": 12,
22
+ "num_layers": 12,
23
+ "output_past": true,
24
+ "pad_token_id": 0,
25
+ "relative_attention_max_distance": 128,
26
+ "relative_attention_num_buckets": 32,
27
+ "task_specific_params": {
28
+ "summarization": {
29
+ "early_stopping": true,
30
+ "length_penalty": 2.0,
31
+ "max_length": 200,
32
+ "min_length": 30,
33
+ "no_repeat_ngram_size": 3,
34
+ "num_beams": 4,
35
+ "prefix": "summarize: "
36
+ },
37
+ "translation_en_to_de": {
38
+ "early_stopping": true,
39
+ "max_length": 300,
40
+ "num_beams": 4,
41
+ "prefix": "translate English to German: "
42
+ },
43
+ "translation_en_to_fr": {
44
+ "early_stopping": true,
45
+ "max_length": 300,
46
+ "num_beams": 4,
47
+ "prefix": "translate English to French: "
48
+ },
49
+ "translation_en_to_ro": {
50
+ "early_stopping": true,
51
+ "max_length": 300,
52
+ "num_beams": 4,
53
+ "prefix": "translate English to Romanian: "
54
+ }
55
+ },
56
+ "torch_dtype": "float32",
57
+ "transformers_version": "4.21.1",
58
+ "use_cache": true,
59
+ "vocab_size": 32128
60
+ }
checkpoint-750/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b17b6cc752618c849c652ad06540b7e1bece7f0d1d1987c8871b06f588b407e
3
+ size 1783379133
checkpoint-750/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a280d42ed88b7ccd376dde2b2e2286b1b3bcd6713acebceba198942c27ebde8a
3
+ size 891700799
checkpoint-750/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9885b98c4ec2860b7f3ea8dae7a7ec0e71b3769e68ea2821165e5d2e5c4e057c
3
+ size 14503
checkpoint-750/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d57611f7ade3f6c0f631bd14c5185be0701a5d212d66b880906769dd1dde1e4d
3
+ size 623
checkpoint-750/special_tokens_map.json ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": "</s>",
105
+ "pad_token": "<pad>",
106
+ "unk_token": "<unk>"
107
+ }
checkpoint-750/spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
3
+ size 791656
checkpoint-750/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-750/tokenizer_config.json ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": "</s>",
105
+ "extra_ids": 100,
106
+ "model_max_length": 512,
107
+ "name_or_path": "t5-base",
108
+ "pad_token": "<pad>",
109
+ "special_tokens_map_file": null,
110
+ "tokenizer_class": "T5Tokenizer",
111
+ "unk_token": "<unk>"
112
+ }
checkpoint-750/trainer_state.json ADDED
@@ -0,0 +1,538 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 9.146341463414634,
5
+ "global_step": 750,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.12,
12
+ "learning_rate": 1e-05,
13
+ "loss": 0.4133,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.24,
18
+ "learning_rate": 2e-05,
19
+ "loss": 0.2546,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.37,
24
+ "learning_rate": 3e-05,
25
+ "loss": 0.1767,
26
+ "step": 30
27
+ },
28
+ {
29
+ "epoch": 0.49,
30
+ "learning_rate": 4e-05,
31
+ "loss": 0.1409,
32
+ "step": 40
33
+ },
34
+ {
35
+ "epoch": 0.61,
36
+ "learning_rate": 5e-05,
37
+ "loss": 0.1687,
38
+ "step": 50
39
+ },
40
+ {
41
+ "epoch": 0.73,
42
+ "learning_rate": 6e-05,
43
+ "loss": 0.1161,
44
+ "step": 60
45
+ },
46
+ {
47
+ "epoch": 0.85,
48
+ "learning_rate": 7e-05,
49
+ "loss": 0.1192,
50
+ "step": 70
51
+ },
52
+ {
53
+ "epoch": 0.98,
54
+ "learning_rate": 8e-05,
55
+ "loss": 0.1233,
56
+ "step": 80
57
+ },
58
+ {
59
+ "epoch": 1.0,
60
+ "eval_loss": 0.13027246296405792,
61
+ "eval_runtime": 3.8565,
62
+ "eval_samples_per_second": 37.599,
63
+ "eval_steps_per_second": 2.593,
64
+ "step": 82
65
+ },
66
+ {
67
+ "epoch": 1.1,
68
+ "learning_rate": 9e-05,
69
+ "loss": 0.1006,
70
+ "step": 90
71
+ },
72
+ {
73
+ "epoch": 1.22,
74
+ "learning_rate": 0.0001,
75
+ "loss": 0.0578,
76
+ "step": 100
77
+ },
78
+ {
79
+ "epoch": 1.34,
80
+ "learning_rate": 9.861111111111112e-05,
81
+ "loss": 0.0835,
82
+ "step": 110
83
+ },
84
+ {
85
+ "epoch": 1.46,
86
+ "learning_rate": 9.722222222222223e-05,
87
+ "loss": 0.0605,
88
+ "step": 120
89
+ },
90
+ {
91
+ "epoch": 1.59,
92
+ "learning_rate": 9.583333333333334e-05,
93
+ "loss": 0.0665,
94
+ "step": 130
95
+ },
96
+ {
97
+ "epoch": 1.71,
98
+ "learning_rate": 9.444444444444444e-05,
99
+ "loss": 0.0513,
100
+ "step": 140
101
+ },
102
+ {
103
+ "epoch": 1.83,
104
+ "learning_rate": 9.305555555555556e-05,
105
+ "loss": 0.0638,
106
+ "step": 150
107
+ },
108
+ {
109
+ "epoch": 1.95,
110
+ "learning_rate": 9.166666666666667e-05,
111
+ "loss": 0.0585,
112
+ "step": 160
113
+ },
114
+ {
115
+ "epoch": 2.0,
116
+ "eval_loss": 0.08042938262224197,
117
+ "eval_runtime": 3.8773,
118
+ "eval_samples_per_second": 37.397,
119
+ "eval_steps_per_second": 2.579,
120
+ "step": 164
121
+ },
122
+ {
123
+ "epoch": 2.07,
124
+ "learning_rate": 9.027777777777779e-05,
125
+ "loss": 0.022,
126
+ "step": 170
127
+ },
128
+ {
129
+ "epoch": 2.2,
130
+ "learning_rate": 8.888888888888889e-05,
131
+ "loss": 0.0175,
132
+ "step": 180
133
+ },
134
+ {
135
+ "epoch": 2.32,
136
+ "learning_rate": 8.75e-05,
137
+ "loss": 0.015,
138
+ "step": 190
139
+ },
140
+ {
141
+ "epoch": 2.44,
142
+ "learning_rate": 8.611111111111112e-05,
143
+ "loss": 0.0186,
144
+ "step": 200
145
+ },
146
+ {
147
+ "epoch": 2.56,
148
+ "learning_rate": 8.472222222222222e-05,
149
+ "loss": 0.025,
150
+ "step": 210
151
+ },
152
+ {
153
+ "epoch": 2.68,
154
+ "learning_rate": 8.333333333333334e-05,
155
+ "loss": 0.0237,
156
+ "step": 220
157
+ },
158
+ {
159
+ "epoch": 2.8,
160
+ "learning_rate": 8.194444444444445e-05,
161
+ "loss": 0.0199,
162
+ "step": 230
163
+ },
164
+ {
165
+ "epoch": 2.93,
166
+ "learning_rate": 8.055555555555556e-05,
167
+ "loss": 0.0305,
168
+ "step": 240
169
+ },
170
+ {
171
+ "epoch": 3.0,
172
+ "eval_loss": 0.11400174349546432,
173
+ "eval_runtime": 3.8699,
174
+ "eval_samples_per_second": 37.469,
175
+ "eval_steps_per_second": 2.584,
176
+ "step": 246
177
+ },
178
+ {
179
+ "epoch": 3.05,
180
+ "learning_rate": 7.916666666666666e-05,
181
+ "loss": 0.0067,
182
+ "step": 250
183
+ },
184
+ {
185
+ "epoch": 3.17,
186
+ "learning_rate": 7.777777777777778e-05,
187
+ "loss": 0.0084,
188
+ "step": 260
189
+ },
190
+ {
191
+ "epoch": 3.29,
192
+ "learning_rate": 7.638888888888889e-05,
193
+ "loss": 0.0078,
194
+ "step": 270
195
+ },
196
+ {
197
+ "epoch": 3.41,
198
+ "learning_rate": 7.500000000000001e-05,
199
+ "loss": 0.0036,
200
+ "step": 280
201
+ },
202
+ {
203
+ "epoch": 3.54,
204
+ "learning_rate": 7.361111111111111e-05,
205
+ "loss": 0.0075,
206
+ "step": 290
207
+ },
208
+ {
209
+ "epoch": 3.66,
210
+ "learning_rate": 7.222222222222222e-05,
211
+ "loss": 0.0051,
212
+ "step": 300
213
+ },
214
+ {
215
+ "epoch": 3.78,
216
+ "learning_rate": 7.083333333333334e-05,
217
+ "loss": 0.0067,
218
+ "step": 310
219
+ },
220
+ {
221
+ "epoch": 3.9,
222
+ "learning_rate": 6.944444444444444e-05,
223
+ "loss": 0.0147,
224
+ "step": 320
225
+ },
226
+ {
227
+ "epoch": 4.0,
228
+ "eval_loss": 0.17557735741138458,
229
+ "eval_runtime": 3.8616,
230
+ "eval_samples_per_second": 37.549,
231
+ "eval_steps_per_second": 2.59,
232
+ "step": 328
233
+ },
234
+ {
235
+ "epoch": 4.02,
236
+ "learning_rate": 6.805555555555556e-05,
237
+ "loss": 0.0212,
238
+ "step": 330
239
+ },
240
+ {
241
+ "epoch": 4.15,
242
+ "learning_rate": 6.666666666666667e-05,
243
+ "loss": 0.0073,
244
+ "step": 340
245
+ },
246
+ {
247
+ "epoch": 4.27,
248
+ "learning_rate": 6.527777777777778e-05,
249
+ "loss": 0.004,
250
+ "step": 350
251
+ },
252
+ {
253
+ "epoch": 4.39,
254
+ "learning_rate": 6.388888888888888e-05,
255
+ "loss": 0.0049,
256
+ "step": 360
257
+ },
258
+ {
259
+ "epoch": 4.51,
260
+ "learning_rate": 6.25e-05,
261
+ "loss": 0.0086,
262
+ "step": 370
263
+ },
264
+ {
265
+ "epoch": 4.63,
266
+ "learning_rate": 6.111111111111112e-05,
267
+ "loss": 0.0051,
268
+ "step": 380
269
+ },
270
+ {
271
+ "epoch": 4.76,
272
+ "learning_rate": 5.972222222222223e-05,
273
+ "loss": 0.0009,
274
+ "step": 390
275
+ },
276
+ {
277
+ "epoch": 4.88,
278
+ "learning_rate": 5.833333333333334e-05,
279
+ "loss": 0.005,
280
+ "step": 400
281
+ },
282
+ {
283
+ "epoch": 5.0,
284
+ "learning_rate": 5.6944444444444445e-05,
285
+ "loss": 0.0025,
286
+ "step": 410
287
+ },
288
+ {
289
+ "epoch": 5.0,
290
+ "eval_loss": 0.19509804248809814,
291
+ "eval_runtime": 3.8565,
292
+ "eval_samples_per_second": 37.599,
293
+ "eval_steps_per_second": 2.593,
294
+ "step": 410
295
+ },
296
+ {
297
+ "epoch": 5.12,
298
+ "learning_rate": 5.555555555555556e-05,
299
+ "loss": 0.0039,
300
+ "step": 420
301
+ },
302
+ {
303
+ "epoch": 5.24,
304
+ "learning_rate": 5.4166666666666664e-05,
305
+ "loss": 0.0037,
306
+ "step": 430
307
+ },
308
+ {
309
+ "epoch": 5.37,
310
+ "learning_rate": 5.2777777777777784e-05,
311
+ "loss": 0.0032,
312
+ "step": 440
313
+ },
314
+ {
315
+ "epoch": 5.49,
316
+ "learning_rate": 5.138888888888889e-05,
317
+ "loss": 0.0002,
318
+ "step": 450
319
+ },
320
+ {
321
+ "epoch": 5.61,
322
+ "learning_rate": 5e-05,
323
+ "loss": 0.006,
324
+ "step": 460
325
+ },
326
+ {
327
+ "epoch": 5.73,
328
+ "learning_rate": 4.8611111111111115e-05,
329
+ "loss": 0.0067,
330
+ "step": 470
331
+ },
332
+ {
333
+ "epoch": 5.85,
334
+ "learning_rate": 4.722222222222222e-05,
335
+ "loss": 0.0046,
336
+ "step": 480
337
+ },
338
+ {
339
+ "epoch": 5.98,
340
+ "learning_rate": 4.5833333333333334e-05,
341
+ "loss": 0.0009,
342
+ "step": 490
343
+ },
344
+ {
345
+ "epoch": 6.0,
346
+ "eval_loss": 0.21209779381752014,
347
+ "eval_runtime": 3.8607,
348
+ "eval_samples_per_second": 37.558,
349
+ "eval_steps_per_second": 2.59,
350
+ "step": 492
351
+ },
352
+ {
353
+ "epoch": 6.1,
354
+ "learning_rate": 4.4444444444444447e-05,
355
+ "loss": 0.0017,
356
+ "step": 500
357
+ },
358
+ {
359
+ "epoch": 6.22,
360
+ "learning_rate": 4.305555555555556e-05,
361
+ "loss": 0.0069,
362
+ "step": 510
363
+ },
364
+ {
365
+ "epoch": 6.34,
366
+ "learning_rate": 4.166666666666667e-05,
367
+ "loss": 0.001,
368
+ "step": 520
369
+ },
370
+ {
371
+ "epoch": 6.46,
372
+ "learning_rate": 4.027777777777778e-05,
373
+ "loss": 0.0053,
374
+ "step": 530
375
+ },
376
+ {
377
+ "epoch": 6.59,
378
+ "learning_rate": 3.888888888888889e-05,
379
+ "loss": 0.0,
380
+ "step": 540
381
+ },
382
+ {
383
+ "epoch": 6.71,
384
+ "learning_rate": 3.7500000000000003e-05,
385
+ "loss": 0.0001,
386
+ "step": 550
387
+ },
388
+ {
389
+ "epoch": 6.83,
390
+ "learning_rate": 3.611111111111111e-05,
391
+ "loss": 0.0019,
392
+ "step": 560
393
+ },
394
+ {
395
+ "epoch": 6.95,
396
+ "learning_rate": 3.472222222222222e-05,
397
+ "loss": 0.0038,
398
+ "step": 570
399
+ },
400
+ {
401
+ "epoch": 7.0,
402
+ "eval_loss": 0.21831980347633362,
403
+ "eval_runtime": 3.8578,
404
+ "eval_samples_per_second": 37.586,
405
+ "eval_steps_per_second": 2.592,
406
+ "step": 574
407
+ },
408
+ {
409
+ "epoch": 7.07,
410
+ "learning_rate": 3.3333333333333335e-05,
411
+ "loss": 0.005,
412
+ "step": 580
413
+ },
414
+ {
415
+ "epoch": 7.2,
416
+ "learning_rate": 3.194444444444444e-05,
417
+ "loss": 0.0001,
418
+ "step": 590
419
+ },
420
+ {
421
+ "epoch": 7.32,
422
+ "learning_rate": 3.055555555555556e-05,
423
+ "loss": 0.0066,
424
+ "step": 600
425
+ },
426
+ {
427
+ "epoch": 7.44,
428
+ "learning_rate": 2.916666666666667e-05,
429
+ "loss": 0.0027,
430
+ "step": 610
431
+ },
432
+ {
433
+ "epoch": 7.56,
434
+ "learning_rate": 2.777777777777778e-05,
435
+ "loss": 0.0009,
436
+ "step": 620
437
+ },
438
+ {
439
+ "epoch": 7.68,
440
+ "learning_rate": 2.6388888888888892e-05,
441
+ "loss": 0.0016,
442
+ "step": 630
443
+ },
444
+ {
445
+ "epoch": 7.8,
446
+ "learning_rate": 2.5e-05,
447
+ "loss": 0.0055,
448
+ "step": 640
449
+ },
450
+ {
451
+ "epoch": 7.93,
452
+ "learning_rate": 2.361111111111111e-05,
453
+ "loss": 0.0016,
454
+ "step": 650
455
+ },
456
+ {
457
+ "epoch": 8.0,
458
+ "eval_loss": 0.2091258317232132,
459
+ "eval_runtime": 3.9519,
460
+ "eval_samples_per_second": 36.691,
461
+ "eval_steps_per_second": 2.53,
462
+ "step": 656
463
+ },
464
+ {
465
+ "epoch": 8.05,
466
+ "learning_rate": 2.2222222222222223e-05,
467
+ "loss": 0.0013,
468
+ "step": 660
469
+ },
470
+ {
471
+ "epoch": 8.17,
472
+ "learning_rate": 2.0833333333333336e-05,
473
+ "loss": 0.0023,
474
+ "step": 670
475
+ },
476
+ {
477
+ "epoch": 8.29,
478
+ "learning_rate": 1.9444444444444445e-05,
479
+ "loss": 0.0001,
480
+ "step": 680
481
+ },
482
+ {
483
+ "epoch": 8.41,
484
+ "learning_rate": 1.8055555555555555e-05,
485
+ "loss": 0.0038,
486
+ "step": 690
487
+ },
488
+ {
489
+ "epoch": 8.54,
490
+ "learning_rate": 1.6666666666666667e-05,
491
+ "loss": 0.0036,
492
+ "step": 700
493
+ },
494
+ {
495
+ "epoch": 8.66,
496
+ "learning_rate": 1.527777777777778e-05,
497
+ "loss": 0.0026,
498
+ "step": 710
499
+ },
500
+ {
501
+ "epoch": 8.78,
502
+ "learning_rate": 1.388888888888889e-05,
503
+ "loss": 0.0016,
504
+ "step": 720
505
+ },
506
+ {
507
+ "epoch": 8.9,
508
+ "learning_rate": 1.25e-05,
509
+ "loss": 0.0025,
510
+ "step": 730
511
+ },
512
+ {
513
+ "epoch": 9.0,
514
+ "eval_loss": 0.22118298709392548,
515
+ "eval_runtime": 3.8379,
516
+ "eval_samples_per_second": 37.781,
517
+ "eval_steps_per_second": 2.606,
518
+ "step": 738
519
+ },
520
+ {
521
+ "epoch": 9.02,
522
+ "learning_rate": 1.1111111111111112e-05,
523
+ "loss": 0.0,
524
+ "step": 740
525
+ },
526
+ {
527
+ "epoch": 9.15,
528
+ "learning_rate": 9.722222222222223e-06,
529
+ "loss": 0.0001,
530
+ "step": 750
531
+ }
532
+ ],
533
+ "max_steps": 820,
534
+ "num_train_epochs": 10,
535
+ "total_flos": 0.0,
536
+ "trial_name": null,
537
+ "trial_params": null
538
+ }
checkpoint-750/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:059a30c261f3bd54fbfe2362d7894c790b619685a34fdc10f23e0cddffd8fcd8
3
+ size 3567
config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "t5-base",
3
+ "architectures": [
4
+ "T5ForConditionalGeneration"
5
+ ],
6
+ "d_ff": 3072,
7
+ "d_kv": 64,
8
+ "d_model": 768,
9
+ "decoder_start_token_id": 0,
10
+ "dense_act_fn": "relu",
11
+ "dropout_rate": 0.1,
12
+ "eos_token_id": 1,
13
+ "feed_forward_proj": "relu",
14
+ "initializer_factor": 1.0,
15
+ "is_encoder_decoder": true,
16
+ "is_gated_act": false,
17
+ "layer_norm_epsilon": 1e-06,
18
+ "model_type": "t5",
19
+ "n_positions": 512,
20
+ "num_decoder_layers": 12,
21
+ "num_heads": 12,
22
+ "num_layers": 12,
23
+ "output_past": true,
24
+ "pad_token_id": 0,
25
+ "relative_attention_max_distance": 128,
26
+ "relative_attention_num_buckets": 32,
27
+ "task_specific_params": {
28
+ "summarization": {
29
+ "early_stopping": true,
30
+ "length_penalty": 2.0,
31
+ "max_length": 200,
32
+ "min_length": 30,
33
+ "no_repeat_ngram_size": 3,
34
+ "num_beams": 4,
35
+ "prefix": "summarize: "
36
+ },
37
+ "translation_en_to_de": {
38
+ "early_stopping": true,
39
+ "max_length": 300,
40
+ "num_beams": 4,
41
+ "prefix": "translate English to German: "
42
+ },
43
+ "translation_en_to_fr": {
44
+ "early_stopping": true,
45
+ "max_length": 300,
46
+ "num_beams": 4,
47
+ "prefix": "translate English to French: "
48
+ },
49
+ "translation_en_to_ro": {
50
+ "early_stopping": true,
51
+ "max_length": 300,
52
+ "num_beams": 4,
53
+ "prefix": "translate English to Romanian: "
54
+ }
55
+ },
56
+ "torch_dtype": "float32",
57
+ "transformers_version": "4.21.1",
58
+ "use_cache": true,
59
+ "vocab_size": 32128
60
+ }
outputs.json ADDED
@@ -0,0 +1,1162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "premise": "i cannot digest all this information",
4
+ "hypothesis": "i cannot understand all this information",
5
+ "label": "entailment",
6
+ "explanation": "",
7
+ "predicted_label": "entailment",
8
+ "model_explanation": ""
9
+ },
10
+ {
11
+ "premise": "the market is being clogged by these operations",
12
+ "hypothesis": "the drain is being clogged by these operations",
13
+ "label": "contradiction",
14
+ "explanation": "",
15
+ "predicted_label": "contradiction",
16
+ "model_explanation": ""
17
+ },
18
+ {
19
+ "premise": "the gun kicked back into my shoulder.",
20
+ "hypothesis": "the mule kicked back into my shoulder.",
21
+ "label": "contradiction",
22
+ "explanation": "",
23
+ "predicted_label": "contradiction",
24
+ "model_explanation": ""
25
+ },
26
+ {
27
+ "premise": "it dawned on him that she had betrayed him",
28
+ "hypothesis": "the sun dawned on him",
29
+ "label": "contradiction",
30
+ "explanation": "",
31
+ "predicted_label": "contradiction",
32
+ "model_explanation": ""
33
+ },
34
+ {
35
+ "premise": "They are enemies on the field -- and on draft day -- but many are friends who love to talk shop and, sometimes, even trade information. ",
36
+ "hypothesis": "There is also a lot of cross-pollination among the front offices and coaching staffs of the 32 NFL teams. They are enemies on the field -- and on draft day -- but many are friends who love to talk shit and, sometimes, even trade information.",
37
+ "label": "contradiction",
38
+ "explanation": "",
39
+ "predicted_label": "entailment",
40
+ "model_explanation": ""
41
+ },
42
+ {
43
+ "premise": "And the song this shape suggested",
44
+ "hypothesis": "And the song this shape reminded one of",
45
+ "label": "entailment",
46
+ "explanation": "",
47
+ "predicted_label": "entailment",
48
+ "model_explanation": ""
49
+ },
50
+ {
51
+ "premise": "We could still be looking for it when they blow us out of the water . \u2019",
52
+ "hypothesis": "We could still be looking for it when they surpassed us . \u2019",
53
+ "label": "entailment",
54
+ "explanation": "",
55
+ "predicted_label": "entailment",
56
+ "model_explanation": ""
57
+ },
58
+ {
59
+ "premise": "\u2018 To a certain extent you 'll have free rein,\u2019 he 'd told her over the telephone .",
60
+ "hypothesis": "\u2018 To a certain extent you 'll have unrestricted liberty of decision ,\u2019 he 'd told her over the telephone .",
61
+ "label": "entailment",
62
+ "explanation": "",
63
+ "predicted_label": "entailment",
64
+ "model_explanation": ""
65
+ },
66
+ {
67
+ "premise": "Swindon are on a roll at the moment and when things are going right , you ca n't go wrong .",
68
+ "hypothesis": "Swindon are having great success at the moment and when things are going right , you ca n't go wrong .",
69
+ "label": "entailment",
70
+ "explanation": "",
71
+ "predicted_label": "entailment",
72
+ "model_explanation": ""
73
+ },
74
+ {
75
+ "premise": "Covered all the earth with silence ,",
76
+ "hypothesis": "Made everything on the earth silent",
77
+ "label": "entailment",
78
+ "explanation": "",
79
+ "predicted_label": "entailment",
80
+ "model_explanation": ""
81
+ },
82
+ {
83
+ "premise": "While you 've been living it up in the lap of luxury \u2014\u2019",
84
+ "hypothesis": "While you 've been spending your time living in an enjoyable way in the lap of luxury \u2014\u2019",
85
+ "label": "entailment",
86
+ "explanation": "",
87
+ "predicted_label": "entailment",
88
+ "model_explanation": ""
89
+ },
90
+ {
91
+ "premise": "Marilyn Monroe in the 1953 film \u2018 How to Marry a Millionaire\u2019 is seen in her cabin on board the Queen Mary trying to come to terms with her Travellers Letter of Credit .",
92
+ "hypothesis": "Marilyn Monroe in the 1953 film \u2018 How to Marry a Millionaire\u2019 is seen in her cabin on board the Queen Mary trying to accept her Travellers Letter of Credit .",
93
+ "label": "entailment",
94
+ "explanation": "",
95
+ "predicted_label": "entailment",
96
+ "model_explanation": ""
97
+ },
98
+ {
99
+ "premise": "Fell the sunshine on his features ,",
100
+ "hypothesis": "Shone the sunshine on his features",
101
+ "label": "entailment",
102
+ "explanation": "",
103
+ "predicted_label": "entailment",
104
+ "model_explanation": ""
105
+ },
106
+ {
107
+ "premise": "the heavy rain guttered the soil.",
108
+ "hypothesis": "the heavy rain made channels in the soil.",
109
+ "label": "entailment",
110
+ "explanation": "",
111
+ "predicted_label": "entailment",
112
+ "model_explanation": ""
113
+ },
114
+ {
115
+ "premise": "Sister will put a pad over your eye for the time being ; I 'll telephone the hospital and we 'll arrange for someone to drive you over there .\u2019",
116
+ "hypothesis": "Sister will put a pad over your eye for now ; I 'll telephone the hospital and we 'll arrange for someone to drive you over there .\u2019",
117
+ "label": "entailment",
118
+ "explanation": "",
119
+ "predicted_label": "entailment",
120
+ "model_explanation": ""
121
+ },
122
+ {
123
+ "premise": "He followed suit , and , leaning back against the pillows , put a comforting arm around her .",
124
+ "hypothesis": "He conformed to another's actions , and , leaning back against the pillows , put a comforting arm around her .",
125
+ "label": "entailment",
126
+ "explanation": "",
127
+ "predicted_label": "entailment",
128
+ "model_explanation": ""
129
+ },
130
+ {
131
+ "premise": "they clawed their way to the top of the mountain.",
132
+ "hypothesis": "they climbed their way to the top of the mountain.",
133
+ "label": "entailment",
134
+ "explanation": "",
135
+ "predicted_label": "entailment",
136
+ "model_explanation": ""
137
+ },
138
+ {
139
+ "premise": "Where a brooklet led them onward ,",
140
+ "hypothesis": "Where a women led them onward ,",
141
+ "label": "contradiction",
142
+ "explanation": "",
143
+ "predicted_label": "contradiction",
144
+ "model_explanation": ""
145
+ },
146
+ {
147
+ "premise": "I 'll catch a cold .",
148
+ "hypothesis": "I 'll catch a ball.",
149
+ "label": "contradiction",
150
+ "explanation": "",
151
+ "predicted_label": "contradiction",
152
+ "model_explanation": ""
153
+ },
154
+ {
155
+ "premise": "De Quincey was more or less in hiding from Edinburgh people to whom he owed large sums of money , so Glasgow , a thriving and blackening metropolis of 365 , 000 souls , was the ideal place in which to eat your opium and keep your head down .",
156
+ "hypothesis": "De Quincey was more or less in hiding from Edinburgh people to whom he owed large sums of money , so Glasgow , a thriving and blackening metropolis of 365 , 000 souls , was the ideal place in which to eat your opium and keep your head .",
157
+ "label": "contradiction",
158
+ "explanation": "",
159
+ "predicted_label": "entailment",
160
+ "model_explanation": ""
161
+ },
162
+ {
163
+ "premise": "Immediately there was a loud laugh of relief from the guests , who at once took it that the child had come to terms with her charges ' ultimate fate .",
164
+ "hypothesis": "Immediately there was a loud laugh of relief from the guests , who at once took it that the child had come to accept her charges ' ultimate fate .",
165
+ "label": "entailment",
166
+ "explanation": "",
167
+ "predicted_label": "entailment",
168
+ "model_explanation": ""
169
+ },
170
+ {
171
+ "premise": "I know that 's not your fault , but all the same , God damn you , I ca n't help hating your guts\u2014!\u2019",
172
+ "hypothesis": "I know that 's not your fault , but all the same , God damn you , I ca n't help hating you so much \u2014!\u2019",
173
+ "label": "entailment",
174
+ "explanation": "",
175
+ "predicted_label": "entailment",
176
+ "model_explanation": ""
177
+ },
178
+ {
179
+ "premise": "Sadly with my church and Pat Roberson you do not have accountability and people are fearful to stand up to take action when your leader says or acts out of order.",
180
+ "hypothesis": "Sadly with my church and Pat Roberson you do not have accountability and people are fearful to stand up to take action when your leader says or acts inappropriately.",
181
+ "label": "entailment",
182
+ "explanation": "",
183
+ "predicted_label": "entailment",
184
+ "model_explanation": ""
185
+ },
186
+ {
187
+ "premise": "Why t why c why do they not communicate upwards and I think essentially people it in subordinate positions are about managing the impressions others have of them and tend to believe the notion , no matter how true it is , that er that organisations may have a shoot the messenger philosophy , yes ?",
188
+ "hypothesis": "Why t why c why do they not communicate upwards and I think essentially people it in subordinate positions are about managing the impressions others have of them and tend to believe the notion , no matter how true it is , that er that organisations may have a blaming the bad news bearer philosophy , yes ?",
189
+ "label": "entailment",
190
+ "explanation": "",
191
+ "predicted_label": "entailment",
192
+ "model_explanation": ""
193
+ },
194
+ {
195
+ "premise": "Saw his youth rise up before him",
196
+ "hypothesis": "Saw the sea rise up before him",
197
+ "label": "contradiction",
198
+ "explanation": "",
199
+ "predicted_label": "contradiction",
200
+ "model_explanation": ""
201
+ },
202
+ {
203
+ "premise": "The stains on the carpet have survived every name change .",
204
+ "hypothesis": "The stains on the carpet have outlasted every name change .",
205
+ "label": "entailment",
206
+ "explanation": "",
207
+ "predicted_label": "entailment",
208
+ "model_explanation": ""
209
+ },
210
+ {
211
+ "premise": "Once again , however , he discovered he had struck a chord with ordinary people , people who had felt they were unfit to pass judgement on modern buildings because they lacked the qualifications .",
212
+ "hypothesis": "Once again , however , he discovered he had struck ordinary people , people who had felt they were unfit to pass judgement on modern buildings because they lacked the qualifications .",
213
+ "label": "contradiction",
214
+ "explanation": "",
215
+ "predicted_label": "entailment",
216
+ "model_explanation": ""
217
+ },
218
+ {
219
+ "premise": "Using cash and bank accounts to collect and disburse contributions for welfare , was easier than collecting animals on the hoof , grains or sugar in sacks , and it was much easier to transfer the payments .",
220
+ "hypothesis": "Using cash and bank accounts to collect and disburse contributions for welfare , was easier than collecting animals not yet killed for eating , grains or sugar in sacks , and it was much easier to transfer the payments .",
221
+ "label": "entailment",
222
+ "explanation": "",
223
+ "predicted_label": "contradiction",
224
+ "model_explanation": ""
225
+ },
226
+ {
227
+ "premise": "her face glowed when she came out of the sauna",
228
+ "hypothesis": "her face became shining when she came out of the sauna",
229
+ "label": "entailment",
230
+ "explanation": "",
231
+ "predicted_label": "entailment",
232
+ "model_explanation": ""
233
+ },
234
+ {
235
+ "premise": "It was not as if what he saw fell short of his expectations .",
236
+ "hypothesis": "It was not as if what he saw did not meet his expectations .",
237
+ "label": "entailment",
238
+ "explanation": "",
239
+ "predicted_label": "entailment",
240
+ "model_explanation": ""
241
+ },
242
+ {
243
+ "premise": "the crowd flowed out of the stadium",
244
+ "hypothesis": "the water flowed out of the stadium",
245
+ "label": "contradiction",
246
+ "explanation": "",
247
+ "predicted_label": "contradiction",
248
+ "model_explanation": ""
249
+ },
250
+ {
251
+ "premise": "every star seemed to flare with new intensity.",
252
+ "hypothesis": "every star seemed to shine with new intensity",
253
+ "label": "entailment",
254
+ "explanation": "",
255
+ "predicted_label": "entailment",
256
+ "model_explanation": ""
257
+ },
258
+ {
259
+ "premise": "Monetarists also recognize that the demand for money can shift unpredictably in the short run with changing expectations of prices , interest rates and exchange rates .",
260
+ "hypothesis": "Monetarists also recognize that the demand for money can shift unpredictably in the near future with changing expectations of prices , interest rates and exchange rates .",
261
+ "label": "entailment",
262
+ "explanation": "",
263
+ "predicted_label": "entailment",
264
+ "model_explanation": ""
265
+ },
266
+ {
267
+ "premise": "McQueen was accompanied on location by Ali MacGraw , whom he had met on The Getaway , and whose presence he admitted saved him from going round the bend .",
268
+ "hypothesis": "McQueen was accompanied on location by Ali MacGraw , whom he had met on The Getaway , and whose presence he admitted saved him from going crazy .",
269
+ "label": "entailment",
270
+ "explanation": "",
271
+ "predicted_label": "entailment",
272
+ "model_explanation": ""
273
+ },
274
+ {
275
+ "premise": "It was as if he was proposing a bargain to God : I'll come to church , if You \u2018 ll turn a blind eye later .",
276
+ "hypothesis": "It was as if he was proposing a bargain to God : I'll come to church , if You \u2018 ll overlook later .",
277
+ "label": "entailment",
278
+ "explanation": "",
279
+ "predicted_label": "entailment",
280
+ "model_explanation": ""
281
+ },
282
+ {
283
+ "premise": "my son drifted around for years in california before going to law school",
284
+ "hypothesis": "my son drifted holes as an engineer for years in california before going to law school",
285
+ "label": "contradiction",
286
+ "explanation": "",
287
+ "predicted_label": "contradiction",
288
+ "model_explanation": ""
289
+ },
290
+ {
291
+ "premise": "she drowned her trouble in alcohol",
292
+ "hypothesis": "she drowned her baby in the tub",
293
+ "label": "contradiction",
294
+ "explanation": "",
295
+ "predicted_label": "contradiction",
296
+ "model_explanation": ""
297
+ },
298
+ {
299
+ "premise": "The results of allowing boroughs to withdraw would , to say the least , be chaotic .",
300
+ "hypothesis": "The results of allowing boroughs to withdraw would , at least , be chaotic .",
301
+ "label": "entailment",
302
+ "explanation": "",
303
+ "predicted_label": "entailment",
304
+ "model_explanation": ""
305
+ },
306
+ {
307
+ "premise": "Whichever camp you are in , the same celestial advice will apply \u2014 hit below the belt .",
308
+ "hypothesis": "Whichever camp you are in , the same celestial advice will apply \u2014 hit their belt .",
309
+ "label": "contradiction",
310
+ "explanation": "",
311
+ "predicted_label": "contradiction",
312
+ "model_explanation": ""
313
+ },
314
+ {
315
+ "premise": "they clawed their way to the top of the mountain.",
316
+ "hypothesis": "the cats clawed their way to the top of the curtain",
317
+ "label": "contradiction",
318
+ "explanation": "",
319
+ "predicted_label": "contradiction",
320
+ "model_explanation": ""
321
+ },
322
+ {
323
+ "premise": "he injected new life into the performance",
324
+ "hypothesis": "he injected new drugs into the performer's system",
325
+ "label": "contradiction",
326
+ "explanation": "",
327
+ "predicted_label": "contradiction",
328
+ "model_explanation": ""
329
+ },
330
+ {
331
+ "premise": "my personal feelings color my judgment in this case",
332
+ "hypothesis": "my personal feelings affect my judgment in this case",
333
+ "label": "entailment",
334
+ "explanation": "",
335
+ "predicted_label": "entailment",
336
+ "model_explanation": ""
337
+ },
338
+ {
339
+ "premise": "The project has run to schedule throughout and we have maintained volumes , thanks to the co - operation of everyone in the mill who have accepted enormous changes in working practices and got to grips with the new system quickly and competently \u2014 its ultimate success will be a tribute to them all .",
340
+ "hypothesis": "The project has run to schedule throughout and we have maintained volumes , thanks to the co - operation of everyone in the mill who have accepted enormous changes in working practices and begun to use the new system quickly and competently \u2014 its ultimate success will be a tribute to them all .",
341
+ "label": "entailment",
342
+ "explanation": "",
343
+ "predicted_label": "entailment",
344
+ "model_explanation": ""
345
+ },
346
+ {
347
+ "premise": "But their hopes took a dive in the 62nd minute when Polish striker Marcel Witeczek went on a run to score a superb individual goal .",
348
+ "hypothesis": "But their hopes fell suddenly in the 62nd minute when Polish striker Marcel Witeczek went on a run to score a superb individual goal .",
349
+ "label": "entailment",
350
+ "explanation": "",
351
+ "predicted_label": "entailment",
352
+ "model_explanation": ""
353
+ },
354
+ {
355
+ "premise": "Some of Mr Mellor 's favourite orchestras will probably be among companies handed over , albeit kicking and screaming .",
356
+ "hypothesis": "Some of Mr Mellor 's favourite orchestras will probably be among companies handed over , albeit reluctantly .",
357
+ "label": "entailment",
358
+ "explanation": "",
359
+ "predicted_label": "entailment",
360
+ "model_explanation": ""
361
+ },
362
+ {
363
+ "premise": "Till the darkness falls around us ,",
364
+ "hypothesis": "Till we fall in the darkness ,",
365
+ "label": "contradiction",
366
+ "explanation": "",
367
+ "predicted_label": "contradiction",
368
+ "model_explanation": ""
369
+ },
370
+ {
371
+ "premise": "Covered all the earth with silence ,",
372
+ "hypothesis": "Covered all the earth with cement",
373
+ "label": "contradiction",
374
+ "explanation": "",
375
+ "predicted_label": "contradiction",
376
+ "model_explanation": ""
377
+ },
378
+ {
379
+ "premise": "he heaped him with work",
380
+ "hypothesis": "he burdened him with work",
381
+ "label": "entailment",
382
+ "explanation": "",
383
+ "predicted_label": "entailment",
384
+ "model_explanation": ""
385
+ },
386
+ {
387
+ "premise": "The result of the debates of the early 1990s was a set of rough and ready rules on deficits and debt levels that was never taken quite seriously .",
388
+ "hypothesis": "The result of the debates of the early 1990s was a set of crude and effective rules on deficits and debt levels that was never taken quite seriously .",
389
+ "label": "entailment",
390
+ "explanation": "",
391
+ "predicted_label": "entailment",
392
+ "model_explanation": ""
393
+ },
394
+ {
395
+ "premise": "However , as has already been mentioned , Germany quickly broke ranks with the rest of the EC and the world over Croatia , which led , in the words of our Foreign Secretary , to\u2019 an acceptable compromise\u2019 .",
396
+ "hypothesis": "However , as has already been mentioned , Germany quickly broke laws with the rest of the EC and the world over Croatia , which led , in the words of our Foreign Secretary , to\u2019 an acceptable compromise\u2019 .",
397
+ "label": "contradiction",
398
+ "explanation": "",
399
+ "predicted_label": "contradiction",
400
+ "model_explanation": ""
401
+ },
402
+ {
403
+ "premise": "Between 1690 and 1713 the weakness of the Europeans in India , and the power of the Moghul emperors , had kept the peace .",
404
+ "hypothesis": "Between 1690 and 1713 the weakness of the Europeans in India , and the power of the Moghul emperors , had made sure that people refrain from conflict .",
405
+ "label": "entailment",
406
+ "explanation": "",
407
+ "predicted_label": "entailment",
408
+ "model_explanation": ""
409
+ },
410
+ {
411
+ "premise": "It was felt at the time that the upward movement was out of line with the underlying trend and the latest figures analysed by Reward suggest it has in fact been short - lived .",
412
+ "hypothesis": "It was felt at the time that the upward movement was inappropriate with the underlying trend and the latest figures analysed by Reward suggest it has in fact been short - lived .",
413
+ "label": "entailment",
414
+ "explanation": "",
415
+ "predicted_label": "entailment",
416
+ "model_explanation": ""
417
+ },
418
+ {
419
+ "premise": "That approach would seek to knock out a keystone of Civil Service tradition .",
420
+ "hypothesis": "That approach would seek to knock out the basis of Civil Service tradition .",
421
+ "label": "entailment",
422
+ "explanation": "",
423
+ "predicted_label": "contradiction",
424
+ "model_explanation": ""
425
+ },
426
+ {
427
+ "premise": "For me it is quite out of the question that the Maastricht treaties should be changed again in one way or another .",
428
+ "hypothesis": "For me it is impossible that the Maastricht treaties should be changed again in one way or another .",
429
+ "label": "entailment",
430
+ "explanation": "",
431
+ "predicted_label": "entailment",
432
+ "model_explanation": ""
433
+ },
434
+ {
435
+ "premise": "she was besieged by so many problems that she got discouraged",
436
+ "hypothesis": "she was besieged by so many soldiers that she gave up",
437
+ "label": "contradiction",
438
+ "explanation": "",
439
+ "predicted_label": "contradiction",
440
+ "model_explanation": ""
441
+ },
442
+ {
443
+ "premise": "During the 1950s , both railways hoped that major investment plans ( BTC 1955 ; RENFE 1950 ; 1957 m : ix ) would allow them to modernize , reduce costs and attract sufficient traffic to break even .",
444
+ "hypothesis": "During the 1950s , both railways hoped that major investment plans ( BTC 1955 ; RENFE 1950 ; 1957 m : ix ) would allow them to modernize , reduce costs and attract sufficient traffic to break records .",
445
+ "label": "contradiction",
446
+ "explanation": "",
447
+ "predicted_label": "contradiction",
448
+ "model_explanation": ""
449
+ },
450
+ {
451
+ "premise": "Instead of his usual behind the scenes stage management of pawns and other pieces , he was confronted by an array of unpredictable variables .",
452
+ "hypothesis": "Instead of his usual secret stage management of pawns and other pieces , he was confronted by an array of unpredictable variables .",
453
+ "label": "entailment",
454
+ "explanation": "",
455
+ "predicted_label": "entailment",
456
+ "model_explanation": ""
457
+ },
458
+ {
459
+ "premise": "With their fiery breath made answer :",
460
+ "hypothesis": "With their fiery breath gave an answer :",
461
+ "label": "entailment",
462
+ "explanation": "",
463
+ "predicted_label": "entailment",
464
+ "model_explanation": ""
465
+ },
466
+ {
467
+ "premise": "While they spake , the night departed :",
468
+ "hypothesis": "While they spake , the bird departed",
469
+ "label": "contradiction",
470
+ "explanation": "",
471
+ "predicted_label": "contradiction",
472
+ "model_explanation": ""
473
+ },
474
+ {
475
+ "premise": "Watson , who turned to crime after moving to London , slumped in the dock of Inner London Crown Court as Judge Brian Pryor handed out the sentence on Monday .",
476
+ "hypothesis": "Watson , who turned to crime after moving to London , slumped in the trial of Inner London Crown Court as Judge Brian Pryor handed out the sentence on Monday .",
477
+ "label": "entailment",
478
+ "explanation": "",
479
+ "predicted_label": "entailment",
480
+ "model_explanation": ""
481
+ },
482
+ {
483
+ "premise": "she aired her opinions on welfare",
484
+ "hypothesis": "she openly discussed her opinions on welfare",
485
+ "label": "entailment",
486
+ "explanation": "",
487
+ "predicted_label": "entailment",
488
+ "model_explanation": ""
489
+ },
490
+ {
491
+ "premise": "And made known unto the people",
492
+ "hypothesis": "And made corn for the people",
493
+ "label": "contradiction",
494
+ "explanation": "",
495
+ "predicted_label": "contradiction",
496
+ "model_explanation": ""
497
+ },
498
+ {
499
+ "premise": "Filled with joy was Mudjekeewis",
500
+ "hypothesis": "Experiencing great joy was Mudjekeewis",
501
+ "label": "entailment",
502
+ "explanation": "",
503
+ "predicted_label": "entailment",
504
+ "model_explanation": ""
505
+ },
506
+ {
507
+ "premise": "I 've got more straps and bloody cordless watches , everything , all over the place .",
508
+ "hypothesis": "I 've got more straps and bloody cordless watches , everything , everywhere .",
509
+ "label": "entailment",
510
+ "explanation": "",
511
+ "predicted_label": "entailment",
512
+ "model_explanation": ""
513
+ },
514
+ {
515
+ "premise": "However , the debate and the reception accorded to Mr Lawson 's speech was a striking demonstration of the Conservatives ' capacity to close ranks : proof , if proof were needed , of their party 's most formidable political resource .",
516
+ "hypothesis": "However , the debate and the reception accorded to Mr Lawson 's speech was a striking demonstration of the Conservatives ' capacity to work together : proof , if proof were needed , of their party 's most formidable political resource .",
517
+ "label": "entailment",
518
+ "explanation": "",
519
+ "predicted_label": "entailment",
520
+ "model_explanation": ""
521
+ },
522
+ {
523
+ "premise": "the rooms communicated",
524
+ "hypothesis": "the rooms were interconnected ",
525
+ "label": "entailment",
526
+ "explanation": "",
527
+ "predicted_label": "entailment",
528
+ "model_explanation": ""
529
+ },
530
+ {
531
+ "premise": "the new measures deflated the economy",
532
+ "hypothesis": "the new measures deflated the balloons",
533
+ "label": "contradiction",
534
+ "explanation": "",
535
+ "predicted_label": "contradiction",
536
+ "model_explanation": ""
537
+ },
538
+ {
539
+ "premise": "It was always likely that this would happen again this year , given that the Walker Cup team were making history whereas Faldo , for all his brilliance , was the second Briton and the fourth European in the Eighties to win at Augusta .",
540
+ "hypothesis": "It was always likely that this would happen again this year , given that the Walker Cup team were living in history whereas Faldo , for all his brilliance , was the second Briton and the fourth European in the Eighties to win at Augusta .",
541
+ "label": "contradiction",
542
+ "explanation": "",
543
+ "predicted_label": "entailment",
544
+ "model_explanation": ""
545
+ },
546
+ {
547
+ "premise": "If one decides to give away \u00a3 5 m to encourage the arts , I do not think that it is a very sensible way to give it to my noble friend Lord Archer , who is a very rich man already , and who gets \u00a3 6,000 a year out of the pockets of taxpayers who are very much poorer than he is . '",
548
+ "hypothesis": "If one decides to give away \u00a3 5 m to encourage the arts , I do not think that it is a very sensible way to give it to my noble friend Lord Archer , who is a very rich man already , and who gets \u00a3 6,000 a year from taxpayers who are very much poorer than he is . '",
549
+ "label": "entailment",
550
+ "explanation": "",
551
+ "predicted_label": "entailment",
552
+ "model_explanation": ""
553
+ },
554
+ {
555
+ "premise": "And his heart outran his footsteps ;",
556
+ "hypothesis": "And he outran his opponents ;",
557
+ "label": "contradiction",
558
+ "explanation": "",
559
+ "predicted_label": "contradiction",
560
+ "model_explanation": ""
561
+ },
562
+ {
563
+ "premise": "Benjamin went down on one knee , tugging at my sleeve for me to follow suit .",
564
+ "hypothesis": "Benjamin went down on one knee , tugging at my sleeve for me to conform to his actions .",
565
+ "label": "entailment",
566
+ "explanation": "",
567
+ "predicted_label": "entailment",
568
+ "model_explanation": ""
569
+ },
570
+ {
571
+ "premise": "At his touch he felt new courage",
572
+ "hypothesis": "At his touch he experienced new courage",
573
+ "label": "entailment",
574
+ "explanation": "",
575
+ "predicted_label": "entailment",
576
+ "model_explanation": ""
577
+ },
578
+ {
579
+ "premise": "\u2018 Of course he 's entitled to his opinion , but I do n't share it and it 's too premature to talk about anyone being certainties , or anyone being out of the running.\u2019",
580
+ "hypothesis": "\u2018 Of course he 's entitled to his opinion , but I do n't share it and it 's too premature to talk about anyone being certainties , or anyone running out.'",
581
+ "label": "contradiction",
582
+ "explanation": "",
583
+ "predicted_label": "contradiction",
584
+ "model_explanation": ""
585
+ },
586
+ {
587
+ "premise": "Some would have us believe that getting China and India on board will be easy .",
588
+ "hypothesis": "Some would have us believe that getting China and India boarded up will be easy .",
589
+ "label": "contradiction",
590
+ "explanation": "",
591
+ "predicted_label": "contradiction",
592
+ "model_explanation": ""
593
+ },
594
+ {
595
+ "premise": "Better to lose face and be open about not understanding the cryptic message , than to lose sleep at night over it .",
596
+ "hypothesis": "Better to lose money and be open about not understanding the cryptic message , than to lose sleep at night over it .",
597
+ "label": "contradiction",
598
+ "explanation": "",
599
+ "predicted_label": "contradiction",
600
+ "model_explanation": ""
601
+ },
602
+ {
603
+ "premise": "Belfast Telegraph Plan 82 could fit the bill because it covers 20 selections with a fine guarantee of at least seven 1 - 1 draws together if eight of your 20 selections end as 1 - 1 draws .",
604
+ "hypothesis": "Belfast Telegraph Plan 82 could be suitable because it covers 20 selections with a fine guarantee of at least seven 1 - 1 draws together if eight of your 20 selections end as 1 - 1 draws .",
605
+ "label": "entailment",
606
+ "explanation": "",
607
+ "predicted_label": "entailment",
608
+ "model_explanation": ""
609
+ },
610
+ {
611
+ "premise": "fill the child with pride",
612
+ "hypothesis": "make the child proud",
613
+ "label": "entailment",
614
+ "explanation": "",
615
+ "predicted_label": "entailment",
616
+ "model_explanation": ""
617
+ },
618
+ {
619
+ "premise": "\u2018 Westerns have a gladiatorial , timeless quality .",
620
+ "hypothesis": "Westerns have a violent-like-gladiator-combat , timeless quality .",
621
+ "label": "entailment",
622
+ "explanation": "",
623
+ "predicted_label": "entailment",
624
+ "model_explanation": ""
625
+ },
626
+ {
627
+ "premise": "I mean she 'll be out two days on the trot .",
628
+ "hypothesis": "I mean she 'll be out two days in a row .",
629
+ "label": "entailment",
630
+ "explanation": "",
631
+ "predicted_label": "entailment",
632
+ "model_explanation": ""
633
+ },
634
+ {
635
+ "premise": "In what she acknowledged was a difficult year for the Scottish party , Mrs McGuire admitted the party had yet to fully come to terms with the election defeat last April .",
636
+ "hypothesis": "In what she acknowledged was a difficult year for the Scottish party , Mrs McGuire admitted the party had yet to fully announce the terms of their election defeat last April .",
637
+ "label": "contradiction",
638
+ "explanation": "",
639
+ "predicted_label": "entailment",
640
+ "model_explanation": ""
641
+ },
642
+ {
643
+ "premise": "Why should you go clucking around them like a mother hen , just because they both hit the ceiling?\u2019",
644
+ "hypothesis": "Why should you go clucking around them like a mother hen , just because they both punched the ceiling?\u2019",
645
+ "label": "contradiction",
646
+ "explanation": "",
647
+ "predicted_label": "entailment",
648
+ "model_explanation": ""
649
+ },
650
+ {
651
+ "premise": "Fell the sunshine on his features ,",
652
+ "hypothesis": "Fell the moonlight on his features",
653
+ "label": "contradiction",
654
+ "explanation": "",
655
+ "predicted_label": "contradiction",
656
+ "model_explanation": ""
657
+ },
658
+ {
659
+ "premise": "The imagination trembles at some of these ideas \u2014 will a profession 's ruling body really come clean about its members ' income?\u2014 but no suggestion , on this subject , should be dismissed out of hand .",
660
+ "hypothesis": "The imagination trembles at some of these ideas \u2014 will a profession 's ruling body really be totally honest about its members ' income?\u2014 but no suggestion , on this subject , should be dismissed out of hand .",
661
+ "label": "entailment",
662
+ "explanation": "",
663
+ "predicted_label": "entailment",
664
+ "model_explanation": ""
665
+ },
666
+ {
667
+ "premise": "he heaped him with work",
668
+ "hypothesis": "he gave him a lot of work",
669
+ "label": "entailment",
670
+ "explanation": "",
671
+ "predicted_label": "entailment",
672
+ "model_explanation": ""
673
+ },
674
+ {
675
+ "premise": "Leonora doubted that biscuits were much of a cure for what ailed her , but she bit into one meekly , deciding that the best policy was to fall in with Penry Vaughan 's wishes whenever possible , to keep the peace .",
676
+ "hypothesis": "Leonora doubted that biscuits were much of a cure for what ailed her , but she bit into one meekly , deciding that the best policy was to fall in with Penry Vaughan 's wishes whenever possible , to prevent others from disturbing civil order .",
677
+ "label": "entailment",
678
+ "explanation": "",
679
+ "predicted_label": "entailment",
680
+ "model_explanation": ""
681
+ },
682
+ {
683
+ "premise": "He turned to stare at Tallis , who pulled a face .",
684
+ "hypothesis": "He turned to stare at Tallis , who expressed dislike .",
685
+ "label": "entailment",
686
+ "explanation": "",
687
+ "predicted_label": "entailment",
688
+ "model_explanation": ""
689
+ },
690
+ {
691
+ "premise": "As a housewife and knitting club member , she \u2018 took the plunge\u2019 and opened Woolwork nearly ten years ago and Meryl reckons the success of the shop is due to Lena 's attitude of giving the same smiling service whether the customer wants a cone of yarn or the latest machine .",
692
+ "hypothesis": "As a housewife and knitting club member , she bought a plunger and opened Woolwork nearly ten years ago and Meryl reckons the success of the shop is due to Lena 's attitude of giving the same smiling service whether the customer wants a cone of yarn or the latest machine .",
693
+ "label": "contradiction",
694
+ "explanation": "",
695
+ "predicted_label": "entailment",
696
+ "model_explanation": ""
697
+ },
698
+ {
699
+ "premise": "We rattled them from the first minute and did n't give them any breathing space .",
700
+ "hypothesis": "We worried them from the first minute and did n't give them any breathing space .",
701
+ "label": "entailment",
702
+ "explanation": "",
703
+ "predicted_label": "entailment",
704
+ "model_explanation": ""
705
+ },
706
+ {
707
+ "premise": "the father flicked him with his hand.",
708
+ "hypothesis": "the father flicked his hair with his hand.",
709
+ "label": "contradiction",
710
+ "explanation": "",
711
+ "predicted_label": "contradiction",
712
+ "model_explanation": ""
713
+ },
714
+ {
715
+ "premise": "the old cheese was crawling with maggots",
716
+ "hypothesis": "the old cheese was covered by maggots",
717
+ "label": "entailment",
718
+ "explanation": "",
719
+ "predicted_label": "entailment",
720
+ "model_explanation": ""
721
+ },
722
+ {
723
+ "premise": " I mean, we have to draw a line between just the abuse of free speech and hate in the raw .",
724
+ "hypothesis": "I mean, we have to draw a line between just the abuse of free speech and hate in its true state .",
725
+ "label": "entailment",
726
+ "explanation": "",
727
+ "predicted_label": "entailment",
728
+ "model_explanation": ""
729
+ },
730
+ {
731
+ "premise": "these rivers head from a mountain range in the himalayas",
732
+ "hypothesis": "these rivers come from a mountain range in the himalayas",
733
+ "label": "entailment",
734
+ "explanation": "",
735
+ "predicted_label": "entailment",
736
+ "model_explanation": ""
737
+ },
738
+ {
739
+ "premise": "Disputes about who 's going to stop drinking and drive home do n't help us go with the flow .",
740
+ "hypothesis": "Disputes about who 's going to stop drinking and drive home do n't help us continue drinking .",
741
+ "label": "contradiction",
742
+ "explanation": "",
743
+ "predicted_label": "contradiction",
744
+ "model_explanation": ""
745
+ },
746
+ {
747
+ "premise": "Once again , however , he discovered he had struck a chord with ordinary people , people who had felt they were unfit to pass judgement on modern buildings because they lacked the qualifications .",
748
+ "hypothesis": "Once again , however , he discovered he had stirred emotions of ordinary people , people who had felt they were unfit to pass judgement on modern buildings because they lacked the qualifications .",
749
+ "label": "entailment",
750
+ "explanation": "",
751
+ "predicted_label": "entailment",
752
+ "model_explanation": ""
753
+ },
754
+ {
755
+ "premise": "For they kept each other 's counsel ,",
756
+ "hypothesis": "For they listened to each other 's advice ,",
757
+ "label": "entailment",
758
+ "explanation": "",
759
+ "predicted_label": "entailment",
760
+ "model_explanation": ""
761
+ },
762
+ {
763
+ "premise": "It 's , it 's the same difference is n't it ?",
764
+ "hypothesis": "It 's , it 's essentially the same is n't it ?",
765
+ "label": "entailment",
766
+ "explanation": "",
767
+ "predicted_label": "entailment",
768
+ "model_explanation": ""
769
+ },
770
+ {
771
+ "premise": "All her insecurities surged painfully as , throwing caution to the winds , she confronted him furiously , demanding imperiously , \u2018 Why exactly have you brought me here , Rune ?",
772
+ "hypothesis": "All her insecurities surged painfully as , throwing her hat to the wind, she confronted him furiously , demanding imperiously , \u2018 Why exactly have you brought me here , Rune ?",
773
+ "label": "contradiction",
774
+ "explanation": "",
775
+ "predicted_label": "contradiction",
776
+ "model_explanation": ""
777
+ },
778
+ {
779
+ "premise": "JUNIOR and senior teams from Grangefield School , Stockton , have swept the board with their energy plans .",
780
+ "hypothesis": "JUNIOR and senior teams from Grangefield School , Stockton , have jumped on board with their energy plans .",
781
+ "label": "contradiction",
782
+ "explanation": "",
783
+ "predicted_label": "entailment",
784
+ "model_explanation": ""
785
+ },
786
+ {
787
+ "premise": "However , Richard Amos , the youth worker , continues to put considerable effort into the work of the youth club and would welcome with open arms any volunteers to join those already helping .",
788
+ "hypothesis": "However , Richard Amos , the youth worker , continues to put considerable effort into the work of the youth club and would welcome with great affection any volunteers to join those already helping .",
789
+ "label": "entailment",
790
+ "explanation": "",
791
+ "predicted_label": "entailment",
792
+ "model_explanation": ""
793
+ },
794
+ {
795
+ "premise": "it dawned on him that she had betrayed him",
796
+ "hypothesis": "it became apparent to him that she had betrayed him",
797
+ "label": "entailment",
798
+ "explanation": "",
799
+ "predicted_label": "entailment",
800
+ "model_explanation": ""
801
+ },
802
+ {
803
+ "premise": "\u2018 All day , on and off.\u2019",
804
+ "hypothesis": "\u2018 All day , intermittently.\u2019",
805
+ "label": "entailment",
806
+ "explanation": "",
807
+ "predicted_label": "entailment",
808
+ "model_explanation": ""
809
+ },
810
+ {
811
+ "premise": "prices climbed steeply",
812
+ "hypothesis": "prices went up steeply",
813
+ "label": "entailment",
814
+ "explanation": "",
815
+ "predicted_label": "entailment",
816
+ "model_explanation": ""
817
+ },
818
+ {
819
+ "premise": "she drowned her trouble in alcohol",
820
+ "hypothesis": "she got rid of her trouble with alcohol",
821
+ "label": "entailment",
822
+ "explanation": "",
823
+ "predicted_label": "entailment",
824
+ "model_explanation": ""
825
+ },
826
+ {
827
+ "premise": "The troubled conscience , the tortured mind , compelling one to come to terms with life , made one impatient of the mere accumulation of facts .",
828
+ "hypothesis": "The troubled conscience , the tortured mind , compelling one to come to accept life , made one impatient of the mere accumulation of facts .",
829
+ "label": "entailment",
830
+ "explanation": "",
831
+ "predicted_label": "entailment",
832
+ "model_explanation": ""
833
+ },
834
+ {
835
+ "premise": "i cannot digest all this information",
836
+ "hypothesis": "i cannot comprehend all this information",
837
+ "label": "entailment",
838
+ "explanation": "",
839
+ "predicted_label": "entailment",
840
+ "model_explanation": ""
841
+ },
842
+ {
843
+ "premise": "Fill the fiery brains of young men ?",
844
+ "hypothesis": "Occupy the fiery brains of young men ?",
845
+ "label": "entailment",
846
+ "explanation": "",
847
+ "predicted_label": "entailment",
848
+ "model_explanation": ""
849
+ },
850
+ {
851
+ "premise": "Kathleen flushed and was angry with herself for it and for allowing her sister to get the better of her again .",
852
+ "hypothesis": "Kathleen flushed and was angry with herself for it and for allowing her sister to be better than her again .",
853
+ "label": "contradiction",
854
+ "explanation": "",
855
+ "predicted_label": "entailment",
856
+ "model_explanation": ""
857
+ },
858
+ {
859
+ "premise": "the immigrants were quickly absorbed into society.",
860
+ "hypothesis": "the immigrants were quickly assimilated into society.",
861
+ "label": "entailment",
862
+ "explanation": "",
863
+ "predicted_label": "entailment",
864
+ "model_explanation": ""
865
+ },
866
+ {
867
+ "premise": "\u00a345,000 was the asking price and I was not surprised that the sale , so to speak , hung fire .",
868
+ "hypothesis": "\u00a345,000 was the asking price and I was not surprised that the sale , so to speak , was delayed .",
869
+ "label": "entailment",
870
+ "explanation": "",
871
+ "predicted_label": "entailment",
872
+ "model_explanation": ""
873
+ },
874
+ {
875
+ "premise": "harmonize one's goals with one's abilities",
876
+ "hypothesis": "make one's goals compatible with one's abilities",
877
+ "label": "entailment",
878
+ "explanation": "",
879
+ "predicted_label": "entailment",
880
+ "model_explanation": ""
881
+ },
882
+ {
883
+ "premise": "the government floated the ruble for a few months",
884
+ "hypothesis": "the government caused the ruble to fluctuate for a few months",
885
+ "label": "entailment",
886
+ "explanation": "",
887
+ "predicted_label": "entailment",
888
+ "model_explanation": ""
889
+ },
890
+ {
891
+ "premise": "And his wishes served to guide him ;",
892
+ "hypothesis": "And his waiters guided him ;",
893
+ "label": "contradiction",
894
+ "explanation": "",
895
+ "predicted_label": "contradiction",
896
+ "model_explanation": ""
897
+ },
898
+ {
899
+ "premise": "i cannot digest all this information",
900
+ "hypothesis": "i cannot digest all this food",
901
+ "label": "contradiction",
902
+ "explanation": "",
903
+ "predicted_label": "contradiction",
904
+ "model_explanation": ""
905
+ },
906
+ {
907
+ "premise": "London is like \u2018 iced water , it 's crystal clear and safe\u2019",
908
+ "hypothesis": "London is like \u2018 iced water , it 's completely transparent and safe\u2019",
909
+ "label": "entailment",
910
+ "explanation": "",
911
+ "predicted_label": "entailment",
912
+ "model_explanation": ""
913
+ },
914
+ {
915
+ "premise": "If such a proposal was adopted by the GMC Kay and his committee might find themselves in the dock .",
916
+ "hypothesis": "If such a proposal was adopted by the GMC Kay and his committee might find themselves under close scrutiny .",
917
+ "label": "entailment",
918
+ "explanation": "",
919
+ "predicted_label": "entailment",
920
+ "model_explanation": ""
921
+ },
922
+ {
923
+ "premise": "Would you accept as a Euro enthusiast , that the opinion poll published by the commission three weeks ago , showed that the Labour party in their tepid support for Maastricht , were wholly out of line with the average Labour voter and in fact it shows quite clearly the majority of people in Britain , not only were opposed to Maastricht , they were also opposed to the idea that the E C was a good idea at all .",
924
+ "hypothesis": "Would you accept as a Euro enthusiast , that the opinion poll published by the commission three weeks ago , showed that the Labour party in their tepid support for Maastricht , were wholly inappropriate with the average Labour voter and in fact it shows quite clearly the majority of people in Britain , not only were opposed to Maastricht , they were also opposed to the idea that the E C was a good idea at all .",
925
+ "label": "entailment",
926
+ "explanation": "",
927
+ "predicted_label": "entailment",
928
+ "model_explanation": ""
929
+ },
930
+ {
931
+ "premise": "And his wishes served to guide him ;",
932
+ "hypothesis": "And his wishes were useful for guiding him ;",
933
+ "label": "entailment",
934
+ "explanation": "",
935
+ "predicted_label": "entailment",
936
+ "model_explanation": ""
937
+ },
938
+ {
939
+ "premise": " I was on the rebound when I met Jack ",
940
+ "hypothesis": " I rebounded from the system when I met Jack ",
941
+ "label": "contradiction",
942
+ "explanation": "",
943
+ "predicted_label": "contradiction",
944
+ "model_explanation": ""
945
+ },
946
+ {
947
+ "premise": "Over her supine body Andrew and Horatia 's eyes met and she took the initiative , knowing she had to get the better of the marquis straight away .",
948
+ "hypothesis": "Over her supine body Andrew and Horatia 's eyes met and she took the initiative , knowing she had to secure an advantage over the marquis straight away .",
949
+ "label": "entailment",
950
+ "explanation": "",
951
+ "predicted_label": "entailment",
952
+ "model_explanation": ""
953
+ },
954
+ {
955
+ "premise": "They win their parents over with a rose-tinted vision of the world which is decidedly reassuring .",
956
+ "hypothesis": "They win their parents over with an optimistic vision of the world which is decidedly reassuring .",
957
+ "label": "entailment",
958
+ "explanation": "",
959
+ "predicted_label": "entailment",
960
+ "model_explanation": ""
961
+ },
962
+ {
963
+ "premise": "she drowned her trouble in alcohol",
964
+ "hypothesis": "she was drowned because of her trouble in alcohol",
965
+ "label": "contradiction",
966
+ "explanation": "",
967
+ "predicted_label": "contradiction",
968
+ "model_explanation": ""
969
+ },
970
+ {
971
+ "premise": "Last season 's Scottish National winner Captain Dibble staked his claim for another of jump racing 's most important handicaps when defeating Boraceva by one and half lengths in the Badger Beer Handicap Chase .",
972
+ "hypothesis": "Last season 's Scottish National winner Captain Dibble claimed his right for another of jump racing 's most important handicaps when defeating Boraceva by one and half lengths in the Badger Beer Handicap Chase .",
973
+ "label": "entailment",
974
+ "explanation": "",
975
+ "predicted_label": "entailment",
976
+ "model_explanation": ""
977
+ },
978
+ {
979
+ "premise": "That the time may pass more gayly ,",
980
+ "hypothesis": "That the time may advance more gayly ,",
981
+ "label": "entailment",
982
+ "explanation": "",
983
+ "predicted_label": "entailment",
984
+ "model_explanation": ""
985
+ },
986
+ {
987
+ "premise": "And they felt it rising , rising ,",
988
+ "hypothesis": "And they felt the carpet rising , rising",
989
+ "label": "contradiction",
990
+ "explanation": "",
991
+ "predicted_label": "contradiction",
992
+ "model_explanation": ""
993
+ },
994
+ {
995
+ "premise": "Then , out of the blue , a letter arrived in his cell .",
996
+ "hypothesis": "Then , abruptly , a letter arrived in his cell .",
997
+ "label": "entailment",
998
+ "explanation": "",
999
+ "predicted_label": "entailment",
1000
+ "model_explanation": ""
1001
+ },
1002
+ {
1003
+ "premise": "Sadly with my church and Pat Roberson you do not have accountability and people are fearful to stand up to take action when your leader says or acts out of order.",
1004
+ "hypothesis": "Sadly with my church and Pat Roberson you do not have accountability and people are fearful to stand up to take action when your leader says or acts orderly.",
1005
+ "label": "contradiction",
1006
+ "explanation": "",
1007
+ "predicted_label": "contradiction",
1008
+ "model_explanation": ""
1009
+ },
1010
+ {
1011
+ "premise": "Till the tree-tops shook with laughter ,",
1012
+ "hypothesis": "Till the tree-tops shook from the laughter of creatures on them",
1013
+ "label": "entailment",
1014
+ "explanation": "",
1015
+ "predicted_label": "contradiction",
1016
+ "model_explanation": ""
1017
+ },
1018
+ {
1019
+ "premise": "Parents have been selected to become erm , relatively insensitive to signs of distress in the offspring , because erm , as where they cry wolf all the time , and as a result , erm , parents do n't take crying as seriously in children as they do in adults .",
1020
+ "hypothesis": "Parents have been selected to become erm , relatively insensitive to signs of distress in the offspring , because erm , as where they cry about wolves all the time , and as a result , erm , parents do n't take crying as seriously in children as they do in adults .",
1021
+ "label": "contradiction",
1022
+ "explanation": "",
1023
+ "predicted_label": "contradiction",
1024
+ "model_explanation": ""
1025
+ },
1026
+ {
1027
+ "premise": "the government digested the entire law into a code",
1028
+ "hypothesis": "the government arranged the entire law into a code",
1029
+ "label": "entailment",
1030
+ "explanation": "",
1031
+ "predicted_label": "entailment",
1032
+ "model_explanation": ""
1033
+ },
1034
+ {
1035
+ "premise": "he 's been able to get round it really , it might well be above board , but the police have been looking into it",
1036
+ "hypothesis": "he 's been able to get round it really , it might well be above standards , but the police have been looking into it",
1037
+ "label": "contradiction",
1038
+ "explanation": "",
1039
+ "predicted_label": "entailment",
1040
+ "model_explanation": ""
1041
+ },
1042
+ {
1043
+ "premise": "The company highlights the fact that the Scale 3 systems use all three major mass - market off the shelf components \u2014 Sparc microprocessors , 3.5\u2019 disk drives and merchant memory chips .",
1044
+ "hypothesis": "The company highlights the fact that the Scale 3 systems use all three major mass - market shelved components \u2014 Sparc microprocessors , 3.5\u2019 disk drives and merchant memory chips .",
1045
+ "label": "contradiction",
1046
+ "explanation": "",
1047
+ "predicted_label": "entailment",
1048
+ "model_explanation": ""
1049
+ },
1050
+ {
1051
+ "premise": "After avoiding a swarm of awaiting reporters and photographers, former CIA director David Petraeus testified behind closed doors Friday that he believes the Sept. 11 attacks on a U.S. diplomatic outpost in Benghazi, Libya was an act of terrorism that did not arise out of a spontaneous demonstration, according to a lawmaker who heard the testimony.",
1052
+ "hypothesis": "After avoiding a swarm of awaiting reporters and photographers, former CIA director David Petraeus testified secretly Friday that he believes the Sept. 11 attacks on a U.S. diplomatic outpost in Benghazi, Libya was an act of terrorism that did not arise out of a spontaneous demonstration, according to a lawmaker who heard the testimony.",
1053
+ "label": "entailment",
1054
+ "explanation": "",
1055
+ "predicted_label": "entailment",
1056
+ "model_explanation": ""
1057
+ },
1058
+ {
1059
+ "premise": "The struggle to explore the inner space of their materials has driven sculptors to dig deep .",
1060
+ "hypothesis": "The struggle to explore the inner space of their materials has driven sculptors to make an effort with every resource .",
1061
+ "label": "entailment",
1062
+ "explanation": "",
1063
+ "predicted_label": "entailment",
1064
+ "model_explanation": ""
1065
+ },
1066
+ {
1067
+ "premise": "You could tell that she was looking forward to doing her number on the wart .",
1068
+ "hypothesis": "You could tell that she was looking forward to counting her number of warts .",
1069
+ "label": "contradiction",
1070
+ "explanation": "",
1071
+ "predicted_label": "contradiction",
1072
+ "model_explanation": ""
1073
+ },
1074
+ {
1075
+ "premise": "The appointment last week of company doctoring group Postern to work on an MTM recovery should help in buying time with the banks .",
1076
+ "hypothesis": "The appointment last week of company doctoring group Postern to work on an MTM recovery should help in delaying the banks .",
1077
+ "label": "entailment",
1078
+ "explanation": "",
1079
+ "predicted_label": "entailment",
1080
+ "model_explanation": ""
1081
+ },
1082
+ {
1083
+ "premise": "And Giggs is , of course , often out and about with pal Darren , the gaffer 's son",
1084
+ "hypothesis": "And Giggs is , of course , often engaging in normal activity with pal Darren , the gaffer 's son",
1085
+ "label": "entailment",
1086
+ "explanation": "",
1087
+ "predicted_label": "entailment",
1088
+ "model_explanation": ""
1089
+ },
1090
+ {
1091
+ "premise": "this story will grab you",
1092
+ "hypothesis": "this story will interest you",
1093
+ "label": "entailment",
1094
+ "explanation": "",
1095
+ "predicted_label": "entailment",
1096
+ "model_explanation": ""
1097
+ },
1098
+ {
1099
+ "premise": "our new synthetic fabric breathes and is perfect for summer wear",
1100
+ "hypothesis": "our new synthetic animal breathes and is perfect for a household pet",
1101
+ "label": "contradiction",
1102
+ "explanation": "",
1103
+ "predicted_label": "contradiction",
1104
+ "model_explanation": ""
1105
+ },
1106
+ {
1107
+ "premise": "So so there I will always remind you Peter says , I will always remind you of this things that if you buy up the time",
1108
+ "hypothesis": "So so there I will always remind you Peter says , I will always remind you of this things that if you delay it",
1109
+ "label": "entailment",
1110
+ "explanation": "",
1111
+ "predicted_label": "entailment",
1112
+ "model_explanation": ""
1113
+ },
1114
+ {
1115
+ "premise": "So take heart, friends, the next time your interaction with a liberal devolves into them accusing you of racism or stupidity, followed by a swift exit from the conversation. ",
1116
+ "hypothesis": "So take revenge, friends, the next time your interaction with a liberal devolves into them accusing you of racism or stupidity, followed by a swift exit from the conversation.",
1117
+ "label": "contradiction",
1118
+ "explanation": "",
1119
+ "predicted_label": "contradiction",
1120
+ "model_explanation": ""
1121
+ },
1122
+ {
1123
+ "premise": "The stains on the carpet have survived every name change .",
1124
+ "hypothesis": "The bugs on the carpet have survived every name change .",
1125
+ "label": "contradiction",
1126
+ "explanation": "",
1127
+ "predicted_label": "contradiction",
1128
+ "model_explanation": ""
1129
+ },
1130
+ {
1131
+ "premise": "my son drifted around for years in california before going to law school",
1132
+ "hypothesis": "my son drifted around the lakes in california for years before going to law school",
1133
+ "label": "contradiction",
1134
+ "explanation": "",
1135
+ "predicted_label": "contradiction",
1136
+ "model_explanation": ""
1137
+ },
1138
+ {
1139
+ "premise": "i was drowned in work",
1140
+ "hypothesis": "i almost drowned in the lake",
1141
+ "label": "contradiction",
1142
+ "explanation": "",
1143
+ "predicted_label": "contradiction",
1144
+ "model_explanation": ""
1145
+ },
1146
+ {
1147
+ "premise": "Came the Spring , and all the forest",
1148
+ "hypothesis": "Came the sheep , and all the forest",
1149
+ "label": "contradiction",
1150
+ "explanation": "",
1151
+ "predicted_label": "contradiction",
1152
+ "model_explanation": ""
1153
+ },
1154
+ {
1155
+ "premise": "Though his pace he checked and slackened",
1156
+ "hypothesis": "Though his pace he limited and slackened",
1157
+ "label": "entailment",
1158
+ "explanation": "",
1159
+ "predicted_label": "entailment",
1160
+ "model_explanation": ""
1161
+ }
1162
+ ]
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12c2edda9e1b88ffd5dc4c915d2a366db78b207dd43d68778be0f01c9c81be59
3
+ size 891700799
special_tokens_map.json ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": "</s>",
105
+ "pad_token": "<pad>",
106
+ "unk_token": "<unk>"
107
+ }
spiece.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
3
+ size 791656
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<extra_id_0>",
4
+ "<extra_id_1>",
5
+ "<extra_id_2>",
6
+ "<extra_id_3>",
7
+ "<extra_id_4>",
8
+ "<extra_id_5>",
9
+ "<extra_id_6>",
10
+ "<extra_id_7>",
11
+ "<extra_id_8>",
12
+ "<extra_id_9>",
13
+ "<extra_id_10>",
14
+ "<extra_id_11>",
15
+ "<extra_id_12>",
16
+ "<extra_id_13>",
17
+ "<extra_id_14>",
18
+ "<extra_id_15>",
19
+ "<extra_id_16>",
20
+ "<extra_id_17>",
21
+ "<extra_id_18>",
22
+ "<extra_id_19>",
23
+ "<extra_id_20>",
24
+ "<extra_id_21>",
25
+ "<extra_id_22>",
26
+ "<extra_id_23>",
27
+ "<extra_id_24>",
28
+ "<extra_id_25>",
29
+ "<extra_id_26>",
30
+ "<extra_id_27>",
31
+ "<extra_id_28>",
32
+ "<extra_id_29>",
33
+ "<extra_id_30>",
34
+ "<extra_id_31>",
35
+ "<extra_id_32>",
36
+ "<extra_id_33>",
37
+ "<extra_id_34>",
38
+ "<extra_id_35>",
39
+ "<extra_id_36>",
40
+ "<extra_id_37>",
41
+ "<extra_id_38>",
42
+ "<extra_id_39>",
43
+ "<extra_id_40>",
44
+ "<extra_id_41>",
45
+ "<extra_id_42>",
46
+ "<extra_id_43>",
47
+ "<extra_id_44>",
48
+ "<extra_id_45>",
49
+ "<extra_id_46>",
50
+ "<extra_id_47>",
51
+ "<extra_id_48>",
52
+ "<extra_id_49>",
53
+ "<extra_id_50>",
54
+ "<extra_id_51>",
55
+ "<extra_id_52>",
56
+ "<extra_id_53>",
57
+ "<extra_id_54>",
58
+ "<extra_id_55>",
59
+ "<extra_id_56>",
60
+ "<extra_id_57>",
61
+ "<extra_id_58>",
62
+ "<extra_id_59>",
63
+ "<extra_id_60>",
64
+ "<extra_id_61>",
65
+ "<extra_id_62>",
66
+ "<extra_id_63>",
67
+ "<extra_id_64>",
68
+ "<extra_id_65>",
69
+ "<extra_id_66>",
70
+ "<extra_id_67>",
71
+ "<extra_id_68>",
72
+ "<extra_id_69>",
73
+ "<extra_id_70>",
74
+ "<extra_id_71>",
75
+ "<extra_id_72>",
76
+ "<extra_id_73>",
77
+ "<extra_id_74>",
78
+ "<extra_id_75>",
79
+ "<extra_id_76>",
80
+ "<extra_id_77>",
81
+ "<extra_id_78>",
82
+ "<extra_id_79>",
83
+ "<extra_id_80>",
84
+ "<extra_id_81>",
85
+ "<extra_id_82>",
86
+ "<extra_id_83>",
87
+ "<extra_id_84>",
88
+ "<extra_id_85>",
89
+ "<extra_id_86>",
90
+ "<extra_id_87>",
91
+ "<extra_id_88>",
92
+ "<extra_id_89>",
93
+ "<extra_id_90>",
94
+ "<extra_id_91>",
95
+ "<extra_id_92>",
96
+ "<extra_id_93>",
97
+ "<extra_id_94>",
98
+ "<extra_id_95>",
99
+ "<extra_id_96>",
100
+ "<extra_id_97>",
101
+ "<extra_id_98>",
102
+ "<extra_id_99>"
103
+ ],
104
+ "eos_token": "</s>",
105
+ "extra_ids": 100,
106
+ "model_max_length": 512,
107
+ "name_or_path": "t5-base",
108
+ "pad_token": "<pad>",
109
+ "special_tokens_map_file": null,
110
+ "tokenizer_class": "T5Tokenizer",
111
+ "unk_token": "<unk>"
112
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:059a30c261f3bd54fbfe2362d7894c790b619685a34fdc10f23e0cddffd8fcd8
3
+ size 3567