taufiqsyed committed on
Commit
3d74d8b
·
verified ·
1 Parent(s): d054974

End of training

Browse files
Files changed (5) hide show
  1. README.md +6 -1
  2. all_results.json +12 -12
  3. eval_results.json +6 -6
  4. train_results.json +7 -7
  5. trainer_state.json +14 -98
README.md CHANGED
@@ -3,6 +3,8 @@ library_name: peft
3
  license: cc-by-nc-4.0
4
  base_model: facebook/musicgen-small
5
  tags:
 
 
6
  - generated_from_trainer
7
  model-index:
8
  - name: salami_truncsplit_model_trial2
@@ -14,7 +16,10 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # salami_truncsplit_model_trial2
16
 
17
- This model is a fine-tuned version of [facebook/musicgen-small](https://huggingface.co/facebook/musicgen-small) on an unknown dataset.
 
 
 
18
 
19
  ## Model description
20
 
 
3
  license: cc-by-nc-4.0
4
  base_model: facebook/musicgen-small
5
  tags:
6
+ - text-to-audio
7
+ - taufiqsyed/salami_cleaned_sampled
8
  - generated_from_trainer
9
  model-index:
10
  - name: salami_truncsplit_model_trial2
 
16
 
17
  # salami_truncsplit_model_trial2
18
 
19
+ This model is a fine-tuned version of [facebook/musicgen-small](https://huggingface.co/facebook/musicgen-small) on the TAUFIQSYED/SALAMI_CLEANED_SAMPLED - DEFAULT dataset.
20
+ It achieves the following results on the evaluation set:
21
+ - Loss: 3.6772
22
+ - Clap: 0.2625
23
 
24
  ## Model description
25
 
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 0.96,
3
- "eval_clap": 0.04283957555890083,
4
- "eval_loss": 5.623888969421387,
5
- "eval_runtime": 202.5479,
6
  "eval_samples": 32,
7
- "eval_samples_per_second": 0.158,
8
- "eval_steps_per_second": 0.158,
9
- "total_flos": 39958787199960.0,
10
- "train_loss": 7.737621545791626,
11
- "train_runtime": 78.8623,
12
- "train_samples": 200,
13
- "train_samples_per_second": 2.536,
14
- "train_steps_per_second": 0.152
15
  }
 
1
  {
2
+ "epoch": 0,
3
+ "eval_clap": 0.2624700963497162,
4
+ "eval_loss": 3.677215814590454,
5
+ "eval_runtime": 198.4313,
6
  "eval_samples": 32,
7
+ "eval_samples_per_second": 0.161,
8
+ "eval_steps_per_second": 0.161,
9
+ "total_flos": 0,
10
+ "train_loss": 0.0,
11
+ "train_runtime": 1.7065,
12
+ "train_samples": 10,
13
+ "train_samples_per_second": 0.0,
14
+ "train_steps_per_second": 0.0
15
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 0.96,
3
- "eval_clap": 0.04283957555890083,
4
- "eval_loss": 5.623888969421387,
5
- "eval_runtime": 202.5479,
6
  "eval_samples": 32,
7
- "eval_samples_per_second": 0.158,
8
- "eval_steps_per_second": 0.158
9
  }
 
1
  {
2
+ "epoch": 0,
3
+ "eval_clap": 0.2624700963497162,
4
+ "eval_loss": 3.677215814590454,
5
+ "eval_runtime": 198.4313,
6
  "eval_samples": 32,
7
+ "eval_samples_per_second": 0.161,
8
+ "eval_steps_per_second": 0.161
9
  }
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 0.96,
3
- "total_flos": 39958787199960.0,
4
- "train_loss": 7.737621545791626,
5
- "train_runtime": 78.8623,
6
- "train_samples": 200,
7
- "train_samples_per_second": 2.536,
8
- "train_steps_per_second": 0.152
9
  }
 
1
  {
2
+ "epoch": 0,
3
+ "total_flos": 0,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 1.7065,
6
+ "train_samples": 10,
7
+ "train_samples_per_second": 0.0,
8
+ "train_steps_per_second": 0.0
9
  }
trainer_state.json CHANGED
@@ -1,111 +1,27 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.96,
5
  "eval_steps": 25,
6
- "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.08,
13
- "grad_norm": 65.75566101074219,
14
- "learning_rate": 0.0002,
15
- "loss": 9.9453,
16
- "step": 1
17
- },
18
- {
19
- "epoch": 0.16,
20
- "grad_norm": 49.121734619140625,
21
- "learning_rate": 0.0002,
22
- "loss": 9.5694,
23
- "step": 2
24
- },
25
- {
26
- "epoch": 0.24,
27
- "grad_norm": 63.262027740478516,
28
- "learning_rate": 0.0002,
29
- "loss": 8.9499,
30
- "step": 3
31
- },
32
- {
33
- "epoch": 0.32,
34
- "grad_norm": 54.31144332885742,
35
- "learning_rate": 0.0002,
36
- "loss": 8.2463,
37
- "step": 4
38
- },
39
- {
40
- "epoch": 0.4,
41
- "grad_norm": 35.41240310668945,
42
- "learning_rate": 0.0002,
43
- "loss": 7.7117,
44
- "step": 5
45
- },
46
- {
47
- "epoch": 0.48,
48
- "grad_norm": 47.44524383544922,
49
- "learning_rate": 0.0002,
50
- "loss": 7.3188,
51
- "step": 6
52
- },
53
- {
54
- "epoch": 0.56,
55
- "grad_norm": 63.63182067871094,
56
- "learning_rate": 0.0002,
57
- "loss": 7.3082,
58
- "step": 7
59
- },
60
- {
61
- "epoch": 0.64,
62
- "grad_norm": 63.364933013916016,
63
- "learning_rate": 0.0002,
64
- "loss": 7.2847,
65
- "step": 8
66
- },
67
- {
68
- "epoch": 0.72,
69
- "grad_norm": 47.89399337768555,
70
- "learning_rate": 0.0002,
71
- "loss": 7.0953,
72
- "step": 9
73
- },
74
- {
75
- "epoch": 0.8,
76
- "grad_norm": 22.77845573425293,
77
- "learning_rate": 0.0002,
78
- "loss": 6.6363,
79
- "step": 10
80
- },
81
- {
82
- "epoch": 0.88,
83
- "grad_norm": 22.07503318786621,
84
- "learning_rate": 0.0002,
85
- "loss": 6.2242,
86
- "step": 11
87
- },
88
- {
89
- "epoch": 0.96,
90
- "grad_norm": 14.495305061340332,
91
- "learning_rate": 0.0002,
92
- "loss": 6.5613,
93
- "step": 12
94
- },
95
- {
96
- "epoch": 0.96,
97
- "step": 12,
98
- "total_flos": 39958787199960.0,
99
- "train_loss": 7.737621545791626,
100
- "train_runtime": 78.8623,
101
- "train_samples_per_second": 2.536,
102
- "train_steps_per_second": 0.152
103
  }
104
  ],
105
  "logging_steps": 1.0,
106
- "max_steps": 12,
107
  "num_input_tokens_seen": 0,
108
- "num_train_epochs": 1,
109
  "save_steps": 500,
110
  "stateful_callbacks": {
111
  "TrainerControl": {
@@ -113,13 +29,13 @@
113
  "should_epoch_stop": false,
114
  "should_evaluate": false,
115
  "should_log": false,
116
- "should_save": true,
117
- "should_training_stop": true
118
  },
119
  "attributes": {}
120
  }
121
  },
122
- "total_flos": 39958787199960.0,
123
  "train_batch_size": 1,
124
  "trial_name": null,
125
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0,
5
  "eval_steps": 25,
6
+ "global_step": 0,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0,
13
+ "step": 0,
14
+ "total_flos": 0,
15
+ "train_loss": 0.0,
16
+ "train_runtime": 1.7065,
17
+ "train_samples_per_second": 0.0,
18
+ "train_steps_per_second": 0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  }
20
  ],
21
  "logging_steps": 1.0,
22
+ "max_steps": 0,
23
  "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 0,
25
  "save_steps": 500,
26
  "stateful_callbacks": {
27
  "TrainerControl": {
 
29
  "should_epoch_stop": false,
30
  "should_evaluate": false,
31
  "should_log": false,
32
+ "should_save": false,
33
+ "should_training_stop": false
34
  },
35
  "attributes": {}
36
  }
37
  },
38
+ "total_flos": 0,
39
  "train_batch_size": 1,
40
  "trial_name": null,
41
  "trial_params": null