Training in progress, step 1000, checkpoint
Browse files- last-checkpoint/adapter_model.bin +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_0_mp_rank_00_model_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_0_mp_rank_00_optim_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_1_mp_rank_00_model_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_1_mp_rank_00_optim_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_2_mp_rank_00_model_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_2_mp_rank_00_optim_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_3_mp_rank_00_model_states.pt +1 -1
- last-checkpoint/global_step1000/zero_pp_rank_3_mp_rank_00_optim_states.pt +1 -1
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/trainer_state.json +7 -13
- last-checkpoint/training_args.bin +1 -1
last-checkpoint/adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2141578
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c64223b9e83dbe7f06b4c1de844227a7fcd2febfa65be961dbbcd89abb05f31
|
3 |
size 2141578
|
last-checkpoint/global_step1000/zero_pp_rank_0_mp_rank_00_model_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3369573916
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11440061d19e9b689490b5ff06d30a5122f73cff374fbea6a5ee2f8520ab1964
|
3 |
size 3369573916
|
last-checkpoint/global_step1000/zero_pp_rank_0_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3149677
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d546fa0fe3d113ad206a2c086525dcacecb3533e20c0924482798280dbe55d5
|
3 |
size 3149677
|
last-checkpoint/global_step1000/zero_pp_rank_1_mp_rank_00_model_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3369573916
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:554f3da99c50c56d4f7880fc8f9758608a450153144eedb59c974e8e516f7ad4
|
3 |
size 3369573916
|
last-checkpoint/global_step1000/zero_pp_rank_1_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3149677
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e790e2bf1acd32b0f95a5788a2c91206e415a05128054438b446fa961fec961d
|
3 |
size 3149677
|
last-checkpoint/global_step1000/zero_pp_rank_2_mp_rank_00_model_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3369573916
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f951d97c21f33bd47f64d86de8c76d040713afec628d5f2683b61060f934ff4c
|
3 |
size 3369573916
|
last-checkpoint/global_step1000/zero_pp_rank_2_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3149677
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4850db2edb00b793213fffefa366620054d81977f1ff1780e4299ea470bf814
|
3 |
size 3149677
|
last-checkpoint/global_step1000/zero_pp_rank_3_mp_rank_00_model_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3369573916
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:034940c7e4526c1699089c785cd01421bdf5cf490b2f8c5920d6378fca4e3ed3
|
3 |
size 3369573916
|
last-checkpoint/global_step1000/zero_pp_rank_3_mp_rank_00_optim_states.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3149677
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70bdaec85d6cc09d7f2aee260d65fcae56231c2fddbb402df221b0f1dc79910a
|
3 |
size 3149677
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step1000
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8691df6f79e0b8b1eab2b8e5959f7d89b6550695ddcdaae4614805d51f39962a
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70cfb2c761a4a9b974e67a46881fd972571be73fe5353febf18edebeda2d1ab3
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed9e94b74c267e4ac6d4421c1598212ddae043208343290f7d0d6d3090de590a
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fa9db8e168da3307c95b5ad756cdc3091a44ff15b3ce1ad0eeb8a91bd5615c6
|
3 |
size 15024
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,31 +1,25 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.39,
|
13 |
-
"learning_rate":
|
14 |
-
"loss": 0.
|
15 |
"step": 1000
|
16 |
-
},
|
17 |
-
{
|
18 |
-
"epoch": 0.78,
|
19 |
-
"learning_rate": 1e-05,
|
20 |
-
"loss": 0.3855,
|
21 |
-
"step": 2000
|
22 |
}
|
23 |
],
|
24 |
"logging_steps": 1000,
|
25 |
-
"max_steps":
|
26 |
-
"num_train_epochs":
|
27 |
"save_steps": 1000,
|
28 |
-
"total_flos":
|
29 |
"trial_name": null,
|
30 |
"trial_params": null
|
31 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.39093041438623927,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 1000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.39,
|
13 |
+
"learning_rate": 0.0001,
|
14 |
+
"loss": 0.3412,
|
15 |
"step": 1000
|
|
|
|
|
|
|
|
|
|
|
|
|
16 |
}
|
17 |
],
|
18 |
"logging_steps": 1000,
|
19 |
+
"max_steps": 12790,
|
20 |
+
"num_train_epochs": 5,
|
21 |
"save_steps": 1000,
|
22 |
+
"total_flos": 13021766221824.0,
|
23 |
"trial_name": null,
|
24 |
"trial_params": null
|
25 |
}
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e88bb83dac898ccb88b94e8a2bbce48f354e3d93653571d7cd72c8fe00fe3205
|
3 |
size 6840
|