bhargob11 committed on
Commit
c258693
·
verified ·
1 Parent(s): c5e43b5

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -14,14 +14,14 @@
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
  "lora_alpha": 16,
17
- "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": [
21
  "classifier"
22
  ],
23
  "peft_type": "LORA",
24
- "r": 16,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
  "lora_alpha": 16,
17
+ "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
  "modules_to_save": [
21
  "classifier"
22
  ],
23
  "peft_type": "LORA",
24
+ "r": 32,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:888b7a246087863947dece026546b16c5b9874999347eae36c3a549fefac1b99
3
- size 2372592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14ac509eaf5eacf8c37f09b45fb8556c83de0808c2fd9221ac37913a45e2ef87
3
+ size 4731912
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 3.405838778276659e+17,
4
+ "train_loss": 0.6811685698372977,
5
+ "train_runtime": 162.9509,
6
+ "train_samples_per_second": 26.787,
7
+ "train_steps_per_second": 0.215
8
+ }
runs/Aug15_13-57-16_c03d0dbfda2e/events.out.tfevents.1723730439.c03d0dbfda2e.1885.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e482f34e703102e60b97dbb9bb277609325bfe8c34633f35b8843dfbc51a766
3
+ size 405
runs/Aug15_14-03-02_c03d0dbfda2e/events.out.tfevents.1723730583.c03d0dbfda2e.1885.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:563b06d2895a4058a43bcaa21b13664e9aa225f6015de0687fc169a331d0e9a5
3
+ size 5879
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 3.405838778276659e+17,
4
+ "train_loss": 0.6811685698372977,
5
+ "train_runtime": 162.9509,
6
+ "train_samples_per_second": 26.787,
7
+ "train_steps_per_second": 0.215
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,108 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5714285714285714,
3
+ "best_model_checkpoint": "vit-base-patch16-224-in21k-finetuned-qlora-houseplant/checkpoint-35",
4
+ "epoch": 5.0,
5
+ "eval_steps": 500,
6
+ "global_step": 35,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.5204081632653061,
14
+ "eval_loss": 0.6893933415412903,
15
+ "eval_runtime": 2.0373,
16
+ "eval_samples_per_second": 48.103,
17
+ "eval_steps_per_second": 1.963,
18
+ "step": 7
19
+ },
20
+ {
21
+ "epoch": 1.4285714285714286,
22
+ "grad_norm": 0.5420740246772766,
23
+ "learning_rate": 4.032258064516129e-05,
24
+ "loss": 0.6869,
25
+ "step": 10
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_accuracy": 0.5306122448979592,
30
+ "eval_loss": 0.6856390237808228,
31
+ "eval_runtime": 2.0142,
32
+ "eval_samples_per_second": 48.654,
33
+ "eval_steps_per_second": 1.986,
34
+ "step": 14
35
+ },
36
+ {
37
+ "epoch": 2.857142857142857,
38
+ "grad_norm": 0.44206592440605164,
39
+ "learning_rate": 2.4193548387096777e-05,
40
+ "loss": 0.6797,
41
+ "step": 20
42
+ },
43
+ {
44
+ "epoch": 3.0,
45
+ "eval_accuracy": 0.5612244897959183,
46
+ "eval_loss": 0.6827691793441772,
47
+ "eval_runtime": 2.3921,
48
+ "eval_samples_per_second": 40.969,
49
+ "eval_steps_per_second": 1.672,
50
+ "step": 21
51
+ },
52
+ {
53
+ "epoch": 4.0,
54
+ "eval_accuracy": 0.5612244897959183,
55
+ "eval_loss": 0.6809878945350647,
56
+ "eval_runtime": 2.0128,
57
+ "eval_samples_per_second": 48.688,
58
+ "eval_steps_per_second": 1.987,
59
+ "step": 28
60
+ },
61
+ {
62
+ "epoch": 4.285714285714286,
63
+ "grad_norm": 0.47674253582954407,
64
+ "learning_rate": 8.064516129032258e-06,
65
+ "loss": 0.6808,
66
+ "step": 30
67
+ },
68
+ {
69
+ "epoch": 5.0,
70
+ "eval_accuracy": 0.5714285714285714,
71
+ "eval_loss": 0.6803476810455322,
72
+ "eval_runtime": 1.9919,
73
+ "eval_samples_per_second": 49.198,
74
+ "eval_steps_per_second": 2.008,
75
+ "step": 35
76
+ },
77
+ {
78
+ "epoch": 5.0,
79
+ "step": 35,
80
+ "total_flos": 3.405838778276659e+17,
81
+ "train_loss": 0.6811685698372977,
82
+ "train_runtime": 162.9509,
83
+ "train_samples_per_second": 26.787,
84
+ "train_steps_per_second": 0.215
85
+ }
86
+ ],
87
+ "logging_steps": 10,
88
+ "max_steps": 35,
89
+ "num_input_tokens_seen": 0,
90
+ "num_train_epochs": 5,
91
+ "save_steps": 500,
92
+ "stateful_callbacks": {
93
+ "TrainerControl": {
94
+ "args": {
95
+ "should_epoch_stop": false,
96
+ "should_evaluate": false,
97
+ "should_log": false,
98
+ "should_save": true,
99
+ "should_training_stop": true
100
+ },
101
+ "attributes": {}
102
+ }
103
+ },
104
+ "total_flos": 3.405838778276659e+17,
105
+ "train_batch_size": 32,
106
+ "trial_name": null,
107
+ "trial_params": null
108
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b7f8a025fdf080b905c81a3c18cb532bb04175d55bf1dfe38dd734373dcb71e
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a2816daebe68496c7c177291686be8bff9b425ea88a7c6c51e2422304bdb6f5
3
  size 5304