griffio committed on
Commit
38628db
·
verified ·
1 Parent(s): 15123ab

rotated_maps

Browse files
README.md ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: peft
3
+ license: apache-2.0
4
+ base_model: google/vit-large-patch16-224-in21k
5
+ tags:
6
+ - image-classification
7
+ - generated_from_trainer
8
+ datasets:
9
+ - imagefolder
10
+ metrics:
11
+ - accuracy
12
+ model-index:
13
+ - name: vit-large-patch16-224-in21k-testing-dungeons-lora-27Dec24-0001
14
+ results:
15
+ - task:
16
+ type: image-classification
17
+ name: Image Classification
18
+ dataset:
19
+ name: rotated_maps
20
+ type: imagefolder
21
+ config: default
22
+ split: validation
23
+ args: default
24
+ metrics:
25
+ - type: accuracy
26
+ value: 0.9607142857142857
27
+ name: Accuracy
28
+ ---
29
+
30
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
31
+ should probably proofread and complete it, then remove this comment. -->
32
+
33
+ # vit-large-patch16-224-in21k-testing-dungeons-lora-27Dec24-0001
34
+
35
+ This model is a LoRA adapter (trained with PEFT) for [google/vit-large-patch16-224-in21k](https://huggingface.co/google/vit-large-patch16-224-in21k), fine-tuned on the rotated_maps dataset.
36
+ It achieves the following results on the evaluation set:
37
+ - Loss: 0.1076
38
+ - Accuracy: 0.9607
39
+
40
+ ## Model description
41
+
42
+ More information needed
43
+
44
+ ## Intended uses & limitations
45
+
46
+ More information needed
47
+
48
+ ## Training and evaluation data
49
+
50
+ More information needed
51
+
52
+ ## Training procedure
53
+
54
+ ### Training hyperparameters
55
+
56
+ The following hyperparameters were used during training:
57
+ - learning_rate: 0.005
58
+ - train_batch_size: 8
59
+ - eval_batch_size: 8
60
+ - seed: 42
61
+ - gradient_accumulation_steps: 4
62
+ - total_train_batch_size: 32
63
+ - optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
64
+ - lr_scheduler_type: linear
65
+ - lr_scheduler_warmup_ratio: 0.1
66
+ - num_epochs: 12
67
+ - mixed_precision_training: Native AMP
68
+
69
+ ### Training results
70
+
71
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
72
+ |:-------------:|:-------:|:----:|:---------------:|:--------:|
73
+ | No log | 0.7273 | 2 | 1.5502 | 0.2946 |
74
+ | No log | 1.7273 | 4 | 1.1408 | 0.6696 |
75
+ | No log | 2.7273 | 6 | 1.0113 | 0.6036 |
76
+ | No log | 3.7273 | 8 | 0.6030 | 0.8411 |
77
+ | 5.1081 | 4.7273 | 10 | 0.4665 | 0.8625 |
78
+ | 5.1081 | 5.7273 | 12 | 0.4145 | 0.8643 |
79
+ | 5.1081 | 6.7273 | 14 | 0.2846 | 0.9107 |
80
+ | 5.1081 | 7.7273 | 16 | 0.2386 | 0.9125 |
81
+ | 5.1081 | 8.7273 | 18 | 0.1564 | 0.9554 |
82
+ | 0.7653 | 9.7273 | 20 | 0.1178 | 0.9679 |
83
+ | 0.7653 | 10.7273 | 22 | 0.1241 | 0.9536 |
84
+ | 0.7653 | 11.7273 | 24 | 0.1076 | 0.9607 |
85
+
86
+
87
+ ### Framework versions
88
+
89
+ - PEFT 0.14.0
90
+ - Transformers 4.47.1
91
+ - Pytorch 2.5.1+cu121
92
+ - Datasets 3.2.0
93
+ - Tokenizers 0.21.0
adapter_config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "ViTForImageClassification",
5
+ "parent_library": "transformers.models.vit.modeling_vit"
6
+ },
7
+ "base_model_name_or_path": "google/vit-large-patch16-224-in21k",
8
+ "bias": "none",
9
+ "eva_config": null,
10
+ "exclude_modules": null,
11
+ "fan_in_fan_out": false,
12
+ "inference_mode": true,
13
+ "init_lora_weights": true,
14
+ "layer_replication": null,
15
+ "layers_pattern": null,
16
+ "layers_to_transform": null,
17
+ "loftq_config": {},
18
+ "lora_alpha": 16,
19
+ "lora_bias": false,
20
+ "lora_dropout": 0.1,
21
+ "megatron_config": null,
22
+ "megatron_core": "megatron.core",
23
+ "modules_to_save": [
24
+ "classifier"
25
+ ],
26
+ "peft_type": "LORA",
27
+ "r": 16,
28
+ "rank_pattern": {},
29
+ "revision": null,
30
+ "target_modules": [
31
+ "value",
32
+ "query"
33
+ ],
34
+ "task_type": null,
35
+ "use_dora": false,
36
+ "use_rslora": false
37
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:901edc81fd85a609484b8ddbe12ee75c4d9782adeaecba825dba77ae0b537d8d
3
+ size 6326220
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 11.727272727272727,
3
+ "eval_accuracy": 0.9607142857142857,
4
+ "eval_loss": 0.10761233419179916,
5
+ "eval_runtime": 8.7931,
6
+ "eval_samples_per_second": 63.686,
7
+ "eval_steps_per_second": 7.961
8
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 11.727272727272727,
3
+ "eval_accuracy": 0.9607142857142857,
4
+ "eval_loss": 0.10761233419179916,
5
+ "eval_runtime": 8.7931,
6
+ "eval_samples_per_second": 63.686,
7
+ "eval_steps_per_second": 7.961
8
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_rescale": false,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.5,
8
+ 0.5,
9
+ 0.5
10
+ ],
11
+ "image_processor_type": "ViTImageProcessor",
12
+ "image_std": [
13
+ 0.5,
14
+ 0.5,
15
+ 0.5
16
+ ],
17
+ "resample": 2,
18
+ "rescale_factor": 0.00392156862745098,
19
+ "size": {
20
+ "height": 224,
21
+ "width": 224
22
+ }
23
+ }
runs/Dec27_18-35-49_021be320e763/events.out.tfevents.1735324617.021be320e763.1098.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa99ddc202b6d361b09fa3e9b921e5cb16c15e014f3581c93a7d6531375722ea
3
+ size 9859
runs/Dec27_18-35-49_021be320e763/events.out.tfevents.1735325083.021be320e763.1098.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbfe6771970bc15a9900be9112a68905354818f289b96cfcafa82c0b29f40da3
3
+ size 405
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9472f943b340e52190dd6cd91679b4ac57d120cfe37ceee6b662d4d2a78e10ef
3
+ size 5432