jnmrr committed on
Commit
0e7ad46
·
verified ·
1 Parent(s): 66d10c1

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +4 -4
  2. train_results.json +4 -4
  3. trainer_state.json +23 -23
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.9855072463768116,
3
  "total_flos": 1.686437022030889e+17,
4
- "train_loss": 1.1870845416012932,
5
- "train_runtime": 162.1308,
6
- "train_samples_per_second": 13.538,
7
- "train_steps_per_second": 0.105
8
  }
 
1
  {
2
  "epoch": 0.9855072463768116,
3
  "total_flos": 1.686437022030889e+17,
4
+ "train_loss": 1.5057464066673727,
5
+ "train_runtime": 321.636,
6
+ "train_samples_per_second": 6.824,
7
+ "train_steps_per_second": 0.053
8
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.9855072463768116,
3
  "total_flos": 1.686437022030889e+17,
4
- "train_loss": 1.1870845416012932,
5
- "train_runtime": 162.1308,
6
- "train_samples_per_second": 13.538,
7
- "train_steps_per_second": 0.105
8
  }
 
1
  {
2
  "epoch": 0.9855072463768116,
3
  "total_flos": 1.686437022030889e+17,
4
+ "train_loss": 1.5057464066673727,
5
+ "train_runtime": 321.636,
6
+ "train_samples_per_second": 6.824,
7
+ "train_steps_per_second": 0.053
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.3155737704918033,
3
  "best_model_checkpoint": "doc-img-classification/checkpoint-17",
4
  "epoch": 0.9855072463768116,
5
  "eval_steps": 500,
@@ -10,44 +10,44 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.057971014492753624,
13
- "grad_norm": 3.7626097202301025,
14
  "learning_rate": 0.0005,
15
- "loss": 1.1898,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.6956521739130435,
20
- "grad_norm": 2.0672760009765625,
21
  "learning_rate": 0.0003333333333333333,
22
- "loss": 1.2333,
23
  "step": 12
24
  },
25
  {
26
  "epoch": 0.9855072463768116,
27
- "eval_Macro F1": 0.2258236627984527,
28
- "eval_Macro Precision": 0.24799453831711893,
29
- "eval_Macro Recall": 0.3347186147186147,
30
- "eval_Micro F1": 0.3155737704918033,
31
- "eval_Micro Precision": 0.3155737704918033,
32
- "eval_Micro Recall": 0.3155737704918033,
33
- "eval_Weighted F1": 0.2118634338981494,
34
- "eval_Weighted Precision": 0.231138727304777,
35
- "eval_Weighted Recall": 0.3155737704918033,
36
- "eval_accuracy": 0.3155737704918033,
37
- "eval_loss": 1.099541425704956,
38
- "eval_runtime": 14.6506,
39
- "eval_samples_per_second": 16.655,
40
- "eval_steps_per_second": 0.546,
41
  "step": 17
42
  },
43
  {
44
  "epoch": 0.9855072463768116,
45
  "step": 17,
46
  "total_flos": 1.686437022030889e+17,
47
- "train_loss": 1.1870845416012932,
48
- "train_runtime": 162.1308,
49
- "train_samples_per_second": 13.538,
50
- "train_steps_per_second": 0.105
51
  }
52
  ],
53
  "logging_steps": 12,
 
1
  {
2
+ "best_metric": 0.3483606557377049,
3
  "best_model_checkpoint": "doc-img-classification/checkpoint-17",
4
  "epoch": 0.9855072463768116,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.057971014492753624,
13
+ "grad_norm": 7.618393898010254,
14
  "learning_rate": 0.0005,
15
+ "loss": 1.2624,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.6956521739130435,
20
+ "grad_norm": 7.588911056518555,
21
  "learning_rate": 0.0003333333333333333,
22
+ "loss": 1.7064,
23
  "step": 12
24
  },
25
  {
26
  "epoch": 0.9855072463768116,
27
+ "eval_Macro F1": 0.21733759318423854,
28
+ "eval_Macro Precision": 0.37635327635327637,
29
+ "eval_Macro Recall": 0.35452414439756214,
30
+ "eval_Micro F1": 0.3483606557377049,
31
+ "eval_Micro Precision": 0.3483606557377049,
32
+ "eval_Micro Recall": 0.3483606557377049,
33
+ "eval_Weighted F1": 0.21831561305190383,
34
+ "eval_Weighted Precision": 0.4016218299005184,
35
+ "eval_Weighted Recall": 0.3483606557377049,
36
+ "eval_accuracy": 0.3483606557377049,
37
+ "eval_loss": 1.0820339918136597,
38
+ "eval_runtime": 13.7157,
39
+ "eval_samples_per_second": 17.79,
40
+ "eval_steps_per_second": 0.583,
41
  "step": 17
42
  },
43
  {
44
  "epoch": 0.9855072463768116,
45
  "step": 17,
46
  "total_flos": 1.686437022030889e+17,
47
+ "train_loss": 1.5057464066673727,
48
+ "train_runtime": 321.636,
49
+ "train_samples_per_second": 6.824,
50
+ "train_steps_per_second": 0.053
51
  }
52
  ],
53
  "logging_steps": 12,