willtensora
committed on
Training in progress, step 4000, checkpoint
Browse files
- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/rng_state_4.pth +1 -1
- last-checkpoint/rng_state_5.pth +1 -1
- last-checkpoint/rng_state_6.pth +1 -1
- last-checkpoint/rng_state_7.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +26 -4
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 281587880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9286827e09996aa12033872735e0de092fd721c4fe1f91e63b8050c811435776
|
3 |
size 281587880
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 143366164
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:353f67a4c0bb212617e4e1eb2fea3e745777ba393205008d24b356bb498ecc67
|
3 |
size 143366164
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea009eea43ba9165a25447a2ebeb5b3ce293fc229f86ecc8e82133799a169966
|
3 |
size 15984
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dfb77a49f10367faf585826f2baa575617770456a06df6deae0b699b8cbfe55
|
3 |
size 15984
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:556f588ce3e53b2cd23465a5fe33a0f16e45fcf93add9e1c51ddd54944327598
|
3 |
size 15984
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8445b826fcbaedb310f62e7bc99ed78babefe67e99b18bb93ecdf39f948cb8d3
|
3 |
size 15984
|
last-checkpoint/rng_state_4.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca8ec1dff7e8c1bbfb8a0a9f36b118f79da805799d7feb6fd3b3b5df69889adf
|
3 |
size 15984
|
last-checkpoint/rng_state_5.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:038432af1ae4b33111e160b3375c93d2ca42e7f72b9e44ece5c683ff70210b50
|
3 |
size 15984
|
last-checkpoint/rng_state_6.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d9b46724719c2f5295bd4180c934cad4763102ab04394464305bff7116c4581
|
3 |
size 15984
|
last-checkpoint/rng_state_7.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b97c73dff8b858f452882698214d6c496e79029e7e4e7768425eabf4cf62410b
|
3 |
size 15984
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94a718f147a195eb428ec1cc98c1dc66af23c9088cc3fbd17bc99e8886d33266
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
"eval_steps": 40,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -3593,6 +3593,28 @@
|
|
3593 |
"learning_rate": 1.2486132855826781e-08,
|
3594 |
"loss": 0.0,
|
3595 |
"step": 3980
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3596 |
}
|
3597 |
],
|
3598 |
"logging_steps": 10,
|
@@ -3607,12 +3629,12 @@
|
|
3607 |
"should_evaluate": false,
|
3608 |
"should_log": false,
|
3609 |
"should_save": true,
|
3610 |
-
"should_training_stop":
|
3611 |
},
|
3612 |
"attributes": {}
|
3613 |
}
|
3614 |
},
|
3615 |
-
"total_flos": 1.
|
3616 |
"train_batch_size": 1,
|
3617 |
"trial_name": null,
|
3618 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 100.0,
|
5 |
"eval_steps": 40,
|
6 |
+
"global_step": 4000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
3593 |
"learning_rate": 1.2486132855826781e-08,
|
3594 |
"loss": 0.0,
|
3595 |
"step": 3980
|
3596 |
+
},
|
3597 |
+
{
|
3598 |
+
"epoch": 99.75,
|
3599 |
+
"grad_norm": 9.601525562175084e-06,
|
3600 |
+
"learning_rate": 3.121581935328077e-09,
|
3601 |
+
"loss": 0.0,
|
3602 |
+
"step": 3990
|
3603 |
+
},
|
3604 |
+
{
|
3605 |
+
"epoch": 100.0,
|
3606 |
+
"grad_norm": 2.9180186174926348e-05,
|
3607 |
+
"learning_rate": 0.0,
|
3608 |
+
"loss": 0.0,
|
3609 |
+
"step": 4000
|
3610 |
+
},
|
3611 |
+
{
|
3612 |
+
"epoch": 100.0,
|
3613 |
+
"eval_loss": 6.550197895194287e-07,
|
3614 |
+
"eval_runtime": 0.3302,
|
3615 |
+
"eval_samples_per_second": 109.012,
|
3616 |
+
"eval_steps_per_second": 15.141,
|
3617 |
+
"step": 4000
|
3618 |
}
|
3619 |
],
|
3620 |
"logging_steps": 10,
|
|
|
3629 |
"should_evaluate": false,
|
3630 |
"should_log": false,
|
3631 |
"should_save": true,
|
3632 |
+
"should_training_stop": true
|
3633 |
},
|
3634 |
"attributes": {}
|
3635 |
}
|
3636 |
},
|
3637 |
+
"total_flos": 1.684080299081728e+17,
|
3638 |
"train_batch_size": 1,
|
3639 |
"trial_name": null,
|
3640 |
"trial_params": null
|