armanibadboy committed on
Commit
45a2f8a
·
verified ·
1 Parent(s): 25a89f5

armanibadboy/llama3.1-kazllm-8b-by-arman-ver3

Browse files
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- base_model: unsloth/meta-llama-3.1-8b-instruct-bnb-4bit
3
  library_name: transformers
4
  model_name: outputs
5
  tags:
@@ -12,7 +12,7 @@ licence: license
12
 
13
  # Model Card for outputs
14
 
15
- This model is a fine-tuned version of [unsloth/meta-llama-3.1-8b-instruct-bnb-4bit](https://huggingface.co/unsloth/meta-llama-3.1-8b-instruct-bnb-4bit).
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
 
1
  ---
2
+ base_model: unsloth/Meta-Llama-3.1-8B-Instruct
3
  library_name: transformers
4
  model_name: outputs
5
  tags:
 
12
 
13
  # Model Card for outputs
14
 
15
+ This model is a fine-tuned version of [unsloth/Meta-Llama-3.1-8B-Instruct](https://huggingface.co/unsloth/Meta-Llama-3.1-8B-Instruct).
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "unsloth/meta-llama-3.1-8b-instruct-bnb-4bit",
5
  "bias": "none",
6
  "eva_config": null,
7
  "exclude_modules": null,
@@ -17,22 +17,19 @@
17
  "lora_dropout": 0,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
- "modules_to_save": [
21
- "embed_tokens",
22
- "lm_head"
23
- ],
24
  "peft_type": "LORA",
25
  "r": 32,
26
  "rank_pattern": {},
27
  "revision": null,
28
  "target_modules": [
29
- "gate_proj",
30
- "q_proj",
31
- "k_proj",
32
  "up_proj",
33
  "v_proj",
 
 
34
  "o_proj",
35
- "down_proj"
 
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "unsloth/Meta-Llama-3.1-8B-Instruct",
5
  "bias": "none",
6
  "eva_config": null,
7
  "exclude_modules": null,
 
17
  "lora_dropout": 0,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
20
+ "modules_to_save": null,
 
 
 
21
  "peft_type": "LORA",
22
  "r": 32,
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
 
26
  "up_proj",
27
  "v_proj",
28
+ "q_proj",
29
+ "down_proj",
30
  "o_proj",
31
+ "k_proj",
32
+ "gate_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
35
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ab18236dd4b5c647caccf4ea8bc2ec9bc209111a2d736657c3655101ab4e278
3
- size 2436951232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb5e7e7bc21a0f026bb256e385559ffb782183c7489f14d67d0fff098560a3df
3
+ size 335604696
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ff8c9eb231f7cc1f2d0cde7fb3e634ba8566ba1ea82c012025f11b3cbbea67d
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:969b4e450867fd29aefe7cae901621bd298c839b278137531f31d92a91a19102
3
  size 5560