ihanif committed on
Commit
bc3f1c0
·
1 Parent(s): ed79ec3

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 30.0,
3
- "eval_loss": 0.8710034489631653,
4
- "eval_runtime": 279.4192,
5
- "eval_samples_per_second": 1.832,
6
- "eval_steps_per_second": 0.057,
7
  "eval_wer": 60.05599273607748,
8
- "train_loss": 0.0,
9
- "train_runtime": 0.8373,
10
- "train_samples_per_second": 91726.968,
11
- "train_steps_per_second": 1433.234
12
  }
 
1
  {
2
+ "epoch": 33.33,
3
+ "eval_loss": 0.8714202046394348,
4
+ "eval_runtime": 282.6755,
5
+ "eval_samples_per_second": 1.811,
6
+ "eval_steps_per_second": 0.113,
7
  "eval_wer": 60.05599273607748,
8
+ "train_loss": 0.018539312619429368,
9
+ "train_runtime": 504.1118,
10
+ "train_samples_per_second": 165.043,
11
+ "train_steps_per_second": 2.579
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 30.0,
3
- "eval_loss": 0.8710034489631653,
4
- "eval_runtime": 279.4192,
5
- "eval_samples_per_second": 1.832,
6
- "eval_steps_per_second": 0.057,
7
  "eval_wer": 60.05599273607748
8
  }
 
1
  {
2
+ "epoch": 33.33,
3
+ "eval_loss": 0.8714202046394348,
4
+ "eval_runtime": 282.6755,
5
+ "eval_samples_per_second": 1.811,
6
+ "eval_steps_per_second": 0.113,
7
  "eval_wer": 60.05599273607748
8
  }
runs/Dec20_20-11-43_129-146-32-172/events.out.tfevents.1671567996.129-146-32-172.149339.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f35cb80a34e81a96e6ecea4220ba82e98f79d0b2759d0d7d032926a35627a522
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 30.0,
3
- "train_loss": 0.0,
4
- "train_runtime": 0.8373,
5
- "train_samples_per_second": 91726.968,
6
- "train_steps_per_second": 1433.234
7
  }
 
1
  {
2
+ "epoch": 33.33,
3
+ "train_loss": 0.018539312619429368,
4
+ "train_runtime": 504.1118,
5
+ "train_samples_per_second": 165.043,
6
+ "train_steps_per_second": 2.579
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.8710034489631653,
3
  "best_model_checkpoint": "./checkpoint-400",
4
- "epoch": 30.0,
5
- "global_step": 1200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -836,18 +836,87 @@
836
  "step": 1200
837
  },
838
  {
839
- "epoch": 30.0,
840
- "step": 1200,
841
- "total_flos": 4.8586623123456e+18,
842
- "train_loss": 0.0,
843
- "train_runtime": 0.8373,
844
- "train_samples_per_second": 91726.968,
845
- "train_steps_per_second": 1433.234
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
846
  }
847
  ],
848
- "max_steps": 1200,
849
- "num_train_epochs": 30,
850
- "total_flos": 4.8586623123456e+18,
851
  "trial_name": null,
852
  "trial_params": null
853
  }
 
1
  {
2
  "best_metric": 0.8710034489631653,
3
  "best_model_checkpoint": "./checkpoint-400",
4
+ "epoch": 33.32911392405063,
5
+ "global_step": 1300,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
836
  "step": 1200
837
  },
838
  {
839
+ "epoch": 31.03,
840
+ "learning_rate": 7.833333333333335e-07,
841
+ "loss": 0.2489,
842
+ "step": 1210
843
+ },
844
+ {
845
+ "epoch": 31.28,
846
+ "learning_rate": 7.000000000000001e-07,
847
+ "loss": 0.2397,
848
+ "step": 1220
849
+ },
850
+ {
851
+ "epoch": 31.53,
852
+ "learning_rate": 6.166666666666668e-07,
853
+ "loss": 0.2362,
854
+ "step": 1230
855
+ },
856
+ {
857
+ "epoch": 31.78,
858
+ "learning_rate": 5.333333333333335e-07,
859
+ "loss": 0.2419,
860
+ "step": 1240
861
+ },
862
+ {
863
+ "epoch": 32.05,
864
+ "learning_rate": 4.5000000000000003e-07,
865
+ "loss": 0.2533,
866
+ "step": 1250
867
+ },
868
+ {
869
+ "epoch": 32.3,
870
+ "learning_rate": 3.666666666666667e-07,
871
+ "loss": 0.2321,
872
+ "step": 1260
873
+ },
874
+ {
875
+ "epoch": 32.56,
876
+ "learning_rate": 2.8333333333333336e-07,
877
+ "loss": 0.232,
878
+ "step": 1270
879
+ },
880
+ {
881
+ "epoch": 32.81,
882
+ "learning_rate": 2.0000000000000002e-07,
883
+ "loss": 0.2421,
884
+ "step": 1280
885
+ },
886
+ {
887
+ "epoch": 33.08,
888
+ "learning_rate": 1.1666666666666668e-07,
889
+ "loss": 0.2457,
890
+ "step": 1290
891
+ },
892
+ {
893
+ "epoch": 33.33,
894
+ "learning_rate": 3.333333333333334e-08,
895
+ "loss": 0.2383,
896
+ "step": 1300
897
+ },
898
+ {
899
+ "epoch": 33.33,
900
+ "eval_loss": 0.9528815746307373,
901
+ "eval_runtime": 176.305,
902
+ "eval_samples_per_second": 2.904,
903
+ "eval_steps_per_second": 0.182,
904
+ "eval_wer": 59.07990314769975,
905
+ "step": 1300
906
+ },
907
+ {
908
+ "epoch": 33.33,
909
+ "step": 1300,
910
+ "total_flos": 5.27396086775808e+18,
911
+ "train_loss": 0.018539312619429368,
912
+ "train_runtime": 504.1118,
913
+ "train_samples_per_second": 165.043,
914
+ "train_steps_per_second": 2.579
915
  }
916
  ],
917
+ "max_steps": 1300,
918
+ "num_train_epochs": 34,
919
+ "total_flos": 5.27396086775808e+18,
920
  "trial_name": null,
921
  "trial_params": null
922
  }