wgcv committed on
Commit
53d13b8
·
verified ·
1 Parent(s): c7beab0

Nuevo reto, nuevo tema en Platzi! 🤗

Browse files
README.md CHANGED
@@ -2,6 +2,7 @@
2
  license: apache-2.0
3
  base_model: distilroberta-base
4
  tags:
 
5
  - generated_from_trainer
6
  metrics:
7
  - accuracy
@@ -16,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # platzi-distilroberta-base-mrpc-wgcv
18
 
19
- This model is a fine-tuned version of [distilroberta-base](https://huggingface.co/distilroberta-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.4002
22
  - Accuracy: 0.8456
 
2
  license: apache-2.0
3
  base_model: distilroberta-base
4
  tags:
5
+ - text-classification
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
 
17
 
18
  # platzi-distilroberta-base-mrpc-wgcv
19
 
20
+ This model is a fine-tuned version of [distilroberta-base](https://huggingface.co/distilroberta-base) on the MRPC (Microsoft Research Paraphrase Corpus) task of the GLUE benchmark.
21
  It achieves the following results on the evaluation set:
22
  - Loss: 0.4002
23
  - Accuracy: 0.8456
all_results.json CHANGED
@@ -1,8 +1,14 @@
1
  {
2
- "eval_accuracy": 0.3161764705882353,
3
- "eval_f1": 0.0,
4
- "eval_loss": 0.7639762163162231,
5
- "eval_runtime": 69.0364,
6
- "eval_samples_per_second": 5.91,
7
- "eval_steps_per_second": 0.377
 
 
 
 
 
 
8
  }
 
1
  {
2
+ "epoch": 3.0,
3
+ "eval_accuracy": 0.8455882352941176,
4
+ "eval_f1": 0.8835489833641405,
5
+ "eval_loss": 0.4001782238483429,
6
+ "eval_runtime": 83.5212,
7
+ "eval_samples_per_second": 4.885,
8
+ "eval_steps_per_second": 0.311,
9
+ "total_flos": 216973319786112.0,
10
+ "train_loss": 0.34854334955630095,
11
+ "train_runtime": 5190.8247,
12
+ "train_samples_per_second": 2.12,
13
+ "train_steps_per_second": 0.133
14
  }
eval_results.json CHANGED
@@ -1,8 +1,9 @@
1
  {
2
- "eval_accuracy": 0.3161764705882353,
3
- "eval_f1": 0.0,
4
- "eval_loss": 0.7639762163162231,
5
- "eval_runtime": 69.0364,
6
- "eval_samples_per_second": 5.91,
7
- "eval_steps_per_second": 0.377
 
8
  }
 
1
  {
2
+ "epoch": 3.0,
3
+ "eval_accuracy": 0.8455882352941176,
4
+ "eval_f1": 0.8835489833641405,
5
+ "eval_loss": 0.4001782238483429,
6
+ "eval_runtime": 83.5212,
7
+ "eval_samples_per_second": 4.885,
8
+ "eval_steps_per_second": 0.311
9
  }
runs/Jun23_22-38-15_c261aaf0d6a8/events.out.tfevents.1719187624.c261aaf0d6a8.177.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72a3216782c95b805b76506ed252749154943dfe21863255a553bd331ed1aaa9
3
+ size 457
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "total_flos": 251639417073456.0,
4
- "train_loss": 0.4489142757722701,
5
- "train_runtime": 3364.9714,
6
- "train_samples_per_second": 3.27,
7
- "train_steps_per_second": 0.026
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "total_flos": 216973319786112.0,
4
+ "train_loss": 0.34854334955630095,
5
+ "train_runtime": 5190.8247,
6
+ "train_samples_per_second": 2.12,
7
+ "train_steps_per_second": 0.133
8
  }
trainer_state.json CHANGED
@@ -1,25 +1,42 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 87,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 3.0,
13
- "step": 87,
14
- "total_flos": 251639417073456.0,
15
- "train_loss": 0.4489142757722701,
16
- "train_runtime": 3364.9714,
17
- "train_samples_per_second": 3.27,
18
- "train_steps_per_second": 0.026
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 87,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 3,
25
  "save_steps": 500,
@@ -29,14 +46,14 @@
29
  "should_epoch_stop": false,
30
  "should_evaluate": false,
31
  "should_log": false,
32
- "should_save": false,
33
  "should_training_stop": false
34
  },
35
  "attributes": {}
36
  }
37
  },
38
- "total_flos": 251639417073456.0,
39
- "train_batch_size": 128,
40
  "trial_name": null,
41
  "trial_params": null
42
  }
 
1
  {
2
+ "best_metric": 0.4001782238483429,
3
+ "best_model_checkpoint": "./platzi-distilroberta-base-mrpc-glue-wgcv/checkpoint-500",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 690,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
+ {
12
+ "epoch": 2.1739130434782608,
13
+ "grad_norm": 3.1889848709106445,
14
+ "learning_rate": 1.3768115942028985e-05,
15
+ "loss": 0.409,
16
+ "step": 500
17
+ },
18
+ {
19
+ "epoch": 2.1739130434782608,
20
+ "eval_accuracy": 0.8455882352941176,
21
+ "eval_f1": 0.8835489833641405,
22
+ "eval_loss": 0.4001782238483429,
23
+ "eval_runtime": 54.0627,
24
+ "eval_samples_per_second": 7.547,
25
+ "eval_steps_per_second": 0.481,
26
+ "step": 500
27
+ },
28
  {
29
  "epoch": 3.0,
30
+ "step": 690,
31
+ "total_flos": 216973319786112.0,
32
+ "train_loss": 0.34854334955630095,
33
+ "train_runtime": 5190.8247,
34
+ "train_samples_per_second": 2.12,
35
+ "train_steps_per_second": 0.133
36
  }
37
  ],
38
  "logging_steps": 500,
39
+ "max_steps": 690,
40
  "num_input_tokens_seen": 0,
41
  "num_train_epochs": 3,
42
  "save_steps": 500,
 
46
  "should_epoch_stop": false,
47
  "should_evaluate": false,
48
  "should_log": false,
49
+ "should_save": true,
50
  "should_training_stop": false
51
  },
52
  "attributes": {}
53
  }
54
  },
55
+ "total_flos": 216973319786112.0,
56
+ "train_batch_size": 16,
57
  "trial_name": null,
58
  "trial_params": null
59
  }