naman1011 committed on
Commit
3562956
·
1 Parent(s): fd0363a

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c64223b9e83dbe7f06b4c1de844227a7fcd2febfa65be961dbbcd89abb05f31
3
  size 2141578
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7328d3c4c1f327c39e82a120e4c4a584216b22fac4f3446fd72c1dcb57e70f32
3
  size 2141578
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dca7f64207daeb0f5818f0bae3022ccea04994e358ed59c76880f398012ab283
3
  size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c631555bb216228fd776c70fdb0e256ee4e31d790108950abfa77b028c501d3
3
  size 3369573916
last-checkpoint/global_step2000/zero_pp_rank_0_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d8dab4b596aaf5c388a04e2c4b22c2af1c8aebf082ebb076b832fb651278a7
3
  size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3080ba6a4f448c0f1f9e781443c976f2fd5a79ea723a6a49542f4c026632d021
3
  size 3149677
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b65c99a66c8ddb1ca7d6a10f980fea331c2a73a4e3d712a15ae8456eebfad054
3
  size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be005c1c969525d4152a78bec86f4a9dbe8b58678eb89bb1bffa0b9953b40ba3
3
  size 3369573916
last-checkpoint/global_step2000/zero_pp_rank_1_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99251421a3d82f8aa04fef0bb5a40ac31b91fece6412bf5461459ab48af331fc
3
  size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc4c18a4ef0f9857edeb68da455dc4e7080151c87a75e93f7b1ce4cbf4ab2461
3
  size 3149677
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de61df69015d85a38c460f5ce2d7f89707b53547211524c02c95de843f22e77e
3
  size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7169575885257a5886f2a16d9e9ac0ec0650b4840c49e3cf46173bb490042a1f
3
  size 3369573916
last-checkpoint/global_step2000/zero_pp_rank_2_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4434b3d3f4781df27851f5ae5b2156489413af687b69dd9661fc4ae0284d4911
3
  size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a397d278e62116e1535866690747e07fcc337e68d0d6a1bc83659b5bce2d0fc8
3
  size 3149677
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_model_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0bb2c03acff0c9f6df4bb65de65ca67958ea37048ae34027d11a6c2220006a1a
3
  size 3369573916
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93bf1650107328c65c26fa2f710cf3bf59bb92597b39fbc8120f97a1c8179044
3
  size 3369573916
last-checkpoint/global_step2000/zero_pp_rank_3_mp_rank_00_optim_states.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f3ef9cf375927ce659882b5180d7af88f640c6c51f492ce69b797e2c85889de
3
  size 3149677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a216e45206c382e0569c4be9c261a3ff128aafd1935e65cab66c418f586fd578
3
  size 3149677
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step1000
 
1
+ global_step2000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8691df6f79e0b8b1eab2b8e5959f7d89b6550695ddcdaae4614805d51f39962a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50c45dee7a55d713aa15eaefbdbd4b45df9e67d02bb6ccefa86e1468c6ea416f
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70cfb2c761a4a9b974e67a46881fd972571be73fe5353febf18edebeda2d1ab3
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abb041f181920f1b36237d3ff78db879a26def694eccb0894945dbd4a97cc65a
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed9e94b74c267e4ac6d4421c1598212ddae043208343290f7d0d6d3090de590a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3399d3d8d8d656a349c7e785e13454283813d091435a0af845c955519e7653c
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fa9db8e168da3307c95b5ad756cdc3091a44ff15b3ce1ad0eeb8a91bd5615c6
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1eea31e444764e3e1f1ec7465ddb8eefb5bbbefde013a11a62c8a1b296356b1
3
  size 15024
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.39093041438623927,
5
  "eval_steps": 500,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -13,13 +13,19 @@
13
  "learning_rate": 0.0001,
14
  "loss": 0.3412,
15
  "step": 1000
 
 
 
 
 
 
16
  }
17
  ],
18
  "logging_steps": 1000,
19
  "max_steps": 12790,
20
  "num_train_epochs": 5,
21
  "save_steps": 1000,
22
- "total_flos": 13021766221824.0,
23
  "trial_name": null,
24
  "trial_params": null
25
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.7818608287724785,
5
  "eval_steps": 500,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
13
  "learning_rate": 0.0001,
14
  "loss": 0.3412,
15
  "step": 1000
16
+ },
17
+ {
18
+ "epoch": 0.78,
19
+ "learning_rate": 0.0001,
20
+ "loss": 0.1473,
21
+ "step": 2000
22
  }
23
  ],
24
  "logging_steps": 1000,
25
  "max_steps": 12790,
26
  "num_train_epochs": 5,
27
  "save_steps": 1000,
28
+ "total_flos": 26238293901312.0,
29
  "trial_name": null,
30
  "trial_params": null
31
  }