ciebson committed on
Commit
8e027ea
·
verified ·
1 Parent(s): 9e9cff4

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -78,7 +78,7 @@
78
  "typical_p": 1.0,
79
  "use_bfloat16": false,
80
  "use_cache": true,
81
- "vocab_size": 100
82
  },
83
  "decoder_start_token_id": 2,
84
  "encoder": {
@@ -157,7 +157,7 @@
157
  "typical_p": 1.0,
158
  "use_bfloat16": false,
159
  "use_cache": true,
160
- "vocab_size": 100
161
  },
162
  "eos_token_id": 0,
163
  "is_encoder_decoder": true,
 
78
  "typical_p": 1.0,
79
  "use_bfloat16": false,
80
  "use_cache": true,
81
+ "vocab_size": 107
82
  },
83
  "decoder_start_token_id": 2,
84
  "encoder": {
 
157
  "typical_p": 1.0,
158
  "use_bfloat16": false,
159
  "use_cache": true,
160
+ "vocab_size": 107
161
  },
162
  "eos_token_id": 0,
163
  "is_encoder_decoder": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b9f26789173ceaca3ccf6b1d58248b4890416476ef12e7057c07234a721ac85f
3
- size 31304048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7cee1f5677eceeba6fd6f9331d034970e487b01cfb41026cd3086dc58d9b5e9
3
+ size 31318412
runs/Mar04_14-22-27_d8c8da50ec4e/events.out.tfevents.1709562148.d8c8da50ec4e.409.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98a5c5bc7e2b0f4287502bd87bd3462e44a9f8daf3534ae8ce350858ac1c9a73
3
+ size 28107
runs/Mar04_14-24-04_d8c8da50ec4e/events.out.tfevents.1709562245.d8c8da50ec4e.409.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82e0284da9eb8273238fb07fde8b6ff33a22fe3eea5026ed0ca858a79b166258
3
+ size 10527
runs/Mar04_14-24-27_d8c8da50ec4e/events.out.tfevents.1709562267.d8c8da50ec4e.409.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73441e8c176e7fe631fcfb218b083cc9b0afcbfdc2deccbc291487a321952723
3
+ size 28108
runs/Mar04_14-25-36_d8c8da50ec4e/events.out.tfevents.1709562336.d8c8da50ec4e.409.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4093f20ec1a69fa4169c9107b47d3460ae31c7ec629b82bbb69e44e22e5e5902
3
+ size 47468
runs/Mar04_14-28-25_d8c8da50ec4e/events.out.tfevents.1709562506.d8c8da50ec4e.409.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca7e7e75003992f4a43edb140cd2c5d8cdb87d3b00b7e740869ec1b299b4360e
3
+ size 42774
tokenizer.json CHANGED
@@ -113,174 +113,188 @@
113
  "8": 14,
114
  "9": 15,
115
  "=": 16,
116
- "14": 17,
117
- "12": 18,
118
- "15": 19,
119
- "17": 20,
120
- "16": 21,
121
- "19": 22,
122
- "11": 23,
123
- "10": 24,
124
- "13": 25,
125
- "18": 26,
126
- "20": 27,
127
- "21": 28,
128
- "98": 29,
129
- "22": 30,
130
- "23": 31,
131
- "99": 32,
132
- "97": 33,
133
- "96": 34,
134
- "24": 35,
135
- "95": 36,
136
- "93": 37,
137
- "94": 38,
138
- "25": 39,
139
- "26": 40,
140
- "92": 41,
141
- "28": 42,
142
- "27": 43,
143
- "90": 44,
144
- "30": 45,
145
- "29": 46,
146
- "91": 47,
147
- "89": 48,
148
- "88": 49,
149
- "31": 50,
150
- "87": 51,
151
- "33": 52,
152
- "32": 53,
153
- "86": 54,
154
- "85": 55,
155
- "35": 56,
156
- "34": 57,
157
- "84": 58,
158
- "83": 59,
159
- "36": 60,
160
- "37": 61,
161
- "82": 62,
162
- "38": 63,
163
- "81": 64,
164
- "80": 65,
165
- "41": 66,
166
- "40": 67,
167
- "39": 68,
168
- "79": 69,
169
- "77": 70,
170
- "42": 71,
171
  "78": 72,
172
- "75": 73,
173
- "43": 74,
174
- "76": 75,
175
- "44": 76,
176
- "74": 77,
177
- "72": 78,
178
- "47": 79,
179
- "73": 80,
180
- "46": 81,
181
- "45": 82,
182
- "49": 83,
183
- "70": 84,
184
- "71": 85,
185
- "48": 86,
186
- "69": 87,
187
- "68": 88,
188
- "50": 89,
189
- "51": 90,
190
- "52": 91,
191
- "53": 92,
192
- "54": 93,
193
- "67": 94,
194
- "66": 95,
195
- "55": 96,
196
- "64": 97,
197
- "65": 98,
198
- "63": 99
 
 
 
 
 
 
 
199
  },
200
  "merges": [
201
- "1 4",
202
- "1 2",
203
- "1 5",
204
- "1 7",
205
  "1 6",
206
- "1 9",
207
- "1 1",
208
- "1 0",
209
- "1 3",
210
- "1 8",
211
- "2 0",
212
- "2 1",
213
- "9 8",
214
- "2 2",
215
- "2 3",
216
- "9 9",
217
- "9 7",
218
- "9 6",
219
- "2 4",
220
- "9 5",
221
- "9 3",
222
- "9 4",
223
- "2 5",
224
- "2 6",
225
- "9 2",
226
  "2 8",
227
- "2 7",
228
- "9 0",
229
- "3 0",
230
- "2 9",
231
- "9 1",
232
- "8 9",
233
- "8 8",
234
  "3 1",
235
- "8 7",
236
- "3 3",
 
 
 
 
 
237
  "3 2",
238
- "8 6",
 
 
 
 
 
239
  "8 5",
240
- "3 5",
241
- "3 4",
242
- "8 4",
243
- "8 3",
 
 
 
 
244
  "3 6",
245
- "3 7",
246
- "8 2",
247
- "3 8",
248
  "8 1",
249
- "8 0",
 
 
 
 
 
 
 
 
250
  "4 1",
 
 
 
 
 
 
251
  "4 0",
252
- "3 9",
253
- "7 9",
254
- "7 7",
255
- "4 2",
256
  "7 8",
257
- "7 5",
 
258
  "4 3",
259
- "7 6",
260
- "4 4",
261
  "7 4",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
262
  "7 2",
263
- "4 7",
264
- "7 3",
265
- "4 6",
 
 
 
 
266
  "4 5",
267
- "4 9",
268
- "7 0",
269
- "7 1",
270
- "4 8",
271
  "6 9",
272
- "6 8",
273
- "5 0",
274
- "5 1",
275
- "5 2",
276
- "5 3",
277
- "5 4",
278
- "6 7",
279
- "6 6",
280
- "5 5",
281
- "6 4",
282
- "6 5",
283
- "6 3"
284
  ]
285
  }
286
  }
 
113
  "8": 14,
114
  "9": 15,
115
  "=": 16,
116
+ "51": 17,
117
+ "16": 18,
118
+ "35": 19,
119
+ "28": 20,
120
+ "25": 21,
121
+ "12": 22,
122
+ "58": 23,
123
+ "22": 24,
124
+ "14": 25,
125
+ "20": 26,
126
+ "86": 27,
127
+ "31": 28,
128
+ "57": 29,
129
+ "53": 30,
130
+ "60": 31,
131
+ "65": 32,
132
+ "54": 33,
133
+ "70": 34,
134
+ "62": 35,
135
+ "32": 36,
136
+ "76": 37,
137
+ "24": 38,
138
+ "18": 39,
139
+ "46": 40,
140
+ "87": 41,
141
+ "73": 42,
142
+ "85": 43,
143
+ "50": 44,
144
+ "23": 45,
145
+ "15": 46,
146
+ "94": 47,
147
+ "68": 48,
148
+ "61": 49,
149
+ "49": 50,
150
+ "92": 51,
151
+ "36": 52,
152
+ "44": 53,
153
+ "81": 54,
154
+ "37": 55,
155
+ "39": 56,
156
+ "47": 57,
157
+ "71": 58,
158
+ "59": 59,
159
+ "66": 60,
160
+ "93": 61,
161
+ "11": 62,
162
+ "13": 63,
163
+ "41": 64,
164
+ "99": 65,
165
+ "75": 66,
166
+ "83": 67,
167
+ "27": 68,
168
+ "52": 69,
169
+ "84": 70,
170
+ "40": 71,
171
  "78": 72,
172
+ "80": 73,
173
+ "10": 74,
174
+ "43": 75,
175
+ "95": 76,
176
+ "64": 77,
177
+ "74": 78,
178
+ "88": 79,
179
+ "21": 80,
180
+ "48": 81,
181
+ "55": 82,
182
+ "77": 83,
183
+ "89": 84,
184
+ "26": 85,
185
+ "42": 86,
186
+ "91": 87,
187
+ "79": 88,
188
+ "29": 89,
189
+ "19": 90,
190
+ "38": 91,
191
+ "67": 92,
192
+ "17": 93,
193
+ "30": 94,
194
+ "72": 95,
195
+ "96": 96,
196
+ "33": 97,
197
+ "97": 98,
198
+ "56": 99,
199
+ "82": 100,
200
+ "34": 101,
201
+ "63": 102,
202
+ "45": 103,
203
+ "69": 104,
204
+ "90": 105,
205
+ "98": 106
206
  },
207
  "merges": [
208
+ "5 1",
 
 
 
209
  "1 6",
210
+ "3 5",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
211
  "2 8",
212
+ "2 5",
213
+ "1 2",
214
+ "5 8",
215
+ "2 2",
216
+ "1 4",
217
+ "2 0",
218
+ "8 6",
219
  "3 1",
220
+ "5 7",
221
+ "5 3",
222
+ "6 0",
223
+ "6 5",
224
+ "5 4",
225
+ "7 0",
226
+ "6 2",
227
  "3 2",
228
+ "7 6",
229
+ "2 4",
230
+ "1 8",
231
+ "4 6",
232
+ "8 7",
233
+ "7 3",
234
  "8 5",
235
+ "5 0",
236
+ "2 3",
237
+ "1 5",
238
+ "9 4",
239
+ "6 8",
240
+ "6 1",
241
+ "4 9",
242
+ "9 2",
243
  "3 6",
244
+ "4 4",
 
 
245
  "8 1",
246
+ "3 7",
247
+ "3 9",
248
+ "4 7",
249
+ "7 1",
250
+ "5 9",
251
+ "6 6",
252
+ "9 3",
253
+ "1 1",
254
+ "1 3",
255
  "4 1",
256
+ "9 9",
257
+ "7 5",
258
+ "8 3",
259
+ "2 7",
260
+ "5 2",
261
+ "8 4",
262
  "4 0",
 
 
 
 
263
  "7 8",
264
+ "8 0",
265
+ "1 0",
266
  "4 3",
267
+ "9 5",
268
+ "6 4",
269
  "7 4",
270
+ "8 8",
271
+ "2 1",
272
+ "4 8",
273
+ "5 5",
274
+ "7 7",
275
+ "8 9",
276
+ "2 6",
277
+ "4 2",
278
+ "9 1",
279
+ "7 9",
280
+ "2 9",
281
+ "1 9",
282
+ "3 8",
283
+ "6 7",
284
+ "1 7",
285
+ "3 0",
286
  "7 2",
287
+ "9 6",
288
+ "3 3",
289
+ "9 7",
290
+ "5 6",
291
+ "8 2",
292
+ "3 4",
293
+ "6 3",
294
  "4 5",
 
 
 
 
295
  "6 9",
296
+ "9 0",
297
+ "9 8"
 
 
 
 
 
 
 
 
 
 
298
  ]
299
  }
300
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4791ceb8a8ace3a61b3381b0bdbcce405ba9afaa35906974a6b6830820af5acf
3
  size 5112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfd086a533a0d81d3b20fc7c5a598f39d1b5dee511e0b79e644f93e1d77b7cee
3
  size 5112