Ro-xe committed on
Commit
c17ec47
·
verified ·
1 Parent(s): b5ac1b2

Upload merged model: FMixIA-FrankenMerge-9.5B-PT-9

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +45 -0
  3. added_tokens.json +24 -0
  4. config.json +29 -0
  5. mergekit_config.yml +9 -0
  6. merges.txt +0 -0
  7. model-00001-of-00015.safetensors +3 -0
  8. model-00001-of-00030.safetensors +3 -0
  9. model-00002-of-00015.safetensors +3 -0
  10. model-00002-of-00030.safetensors +3 -0
  11. model-00003-of-00015.safetensors +3 -0
  12. model-00003-of-00030.safetensors +3 -0
  13. model-00004-of-00015.safetensors +3 -0
  14. model-00004-of-00030.safetensors +3 -0
  15. model-00005-of-00015.safetensors +3 -0
  16. model-00005-of-00030.safetensors +3 -0
  17. model-00006-of-00015.safetensors +3 -0
  18. model-00006-of-00030.safetensors +3 -0
  19. model-00007-of-00015.safetensors +3 -0
  20. model-00007-of-00030.safetensors +3 -0
  21. model-00008-of-00015.safetensors +3 -0
  22. model-00008-of-00030.safetensors +3 -0
  23. model-00009-of-00015.safetensors +3 -0
  24. model-00009-of-00030.safetensors +3 -0
  25. model-00010-of-00015.safetensors +3 -0
  26. model-00010-of-00030.safetensors +3 -0
  27. model-00011-of-00015.safetensors +3 -0
  28. model-00011-of-00030.safetensors +3 -0
  29. model-00012-of-00015.safetensors +3 -0
  30. model-00012-of-00030.safetensors +3 -0
  31. model-00013-of-00015.safetensors +3 -0
  32. model-00013-of-00030.safetensors +3 -0
  33. model-00014-of-00015.safetensors +3 -0
  34. model-00014-of-00030.safetensors +3 -0
  35. model-00015-of-00015.safetensors +3 -0
  36. model-00015-of-00030.safetensors +3 -0
  37. model-00016-of-00030.safetensors +3 -0
  38. model-00017-of-00030.safetensors +3 -0
  39. model-00018-of-00030.safetensors +3 -0
  40. model-00019-of-00030.safetensors +3 -0
  41. model-00020-of-00030.safetensors +3 -0
  42. model-00021-of-00030.safetensors +3 -0
  43. model-00022-of-00030.safetensors +3 -0
  44. model-00023-of-00030.safetensors +3 -0
  45. model-00024-of-00030.safetensors +3 -0
  46. model-00025-of-00030.safetensors +3 -0
  47. model-00026-of-00030.safetensors +3 -0
  48. model-00027-of-00030.safetensors +3 -0
  49. model-00028-of-00030.safetensors +3 -0
  50. model-00029-of-00030.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - passthrough
7
+ - "frankenmerge"
8
+ - "7B"
9
+ - "ZeroXClem/Qwen2.5-7B-HomerCreative-Mix"
10
+ - "ZeroXClem/Qwen2.5-7B-HomerAnvita-NerdMix"
11
+ ---
12
+
13
+ # FMixIA-FrankenMerge-9.5B-PT-9
14
+
15
+ A frankenmerge model created with [mergekit](https://github.com/cg123/mergekit) by concatenating layers from two base models using the passthrough merge method.
16
+
17
+ ## Model Details
18
+ - **Base Models**:
19
+ * [ZeroXClem/Qwen2.5-7B-HomerCreative-Mix](https://huggingface.co/ZeroXClem/Qwen2.5-7B-HomerCreative-Mix)
20
+ * [ZeroXClem/Qwen2.5-7B-HomerAnvita-NerdMix](https://huggingface.co/ZeroXClem/Qwen2.5-7B-HomerAnvita-NerdMix)
21
+ - **Merge Method**: passthrough
22
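+ - **Note**: This is a frankenmerge model with a modified architecture: the 28-layer slices taken from each base model are stacked, so the merged model has 56 hidden layers (see `config.json`).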
23
+
24
+ ## Configuration
25
+ ```yaml
26
+ slices:
27
+   - sources:
28
+       - model: ZeroXClem/Qwen2.5-7B-HomerCreative-Mix
29
+         layer_range: [0, 28]
30
+   - sources:
31
+       - model: ZeroXClem/Qwen2.5-7B-HomerAnvita-NerdMix
32
+         layer_range: [0, 28]
33
+ merge_method: passthrough
34
+ dtype: bfloat16
35
+ ```
36
+
37
+ ## Usage
38
+ This model can be used with the standard transformers library:
39
+
40
+ ```python
41
+ from transformers import AutoModelForCausalLM, AutoTokenizer
42
+
43
+ model = AutoModelForCausalLM.from_pretrained("Ro-xe/FMixIA-FrankenMerge-9.5B-PT-9")
44
+ tokenizer = AutoTokenizer.from_pretrained("Ro-xe/FMixIA-FrankenMerge-9.5B-PT-9")
45
+ ```
added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "ZeroXClem/Qwen2.5-7B-HomerCreative-Mix",
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 3584,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 18944,
13
+ "max_position_embeddings": 32768,
14
+ "max_window_layers": 28,
15
+ "model_type": "qwen2",
16
+ "num_attention_heads": 28,
17
+ "num_hidden_layers": 56,
18
+ "num_key_value_heads": 4,
19
+ "rms_norm_eps": 1e-06,
20
+ "rope_scaling": null,
21
+ "rope_theta": 1000000.0,
22
+ "sliding_window": null,
23
+ "tie_word_embeddings": false,
24
+ "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.47.0",
26
+ "use_cache": true,
27
+ "use_sliding_window": false,
28
+ "vocab_size": 152064
29
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ slices:
2
+   - sources:
3
+       - model: ZeroXClem/Qwen2.5-7B-HomerCreative-Mix
4
+         layer_range: [0, 28]
5
+   - sources:
6
+       - model: ZeroXClem/Qwen2.5-7B-HomerAnvita-NerdMix
7
+         layer_range: [0, 28]
8
+ merge_method: passthrough
9
+ dtype: bfloat16
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e3179168d48da50b3aea6648f2ebaa5981948f898028d790e3a634cd0d258dc
3
+ size 960521544
model-00001-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e51fe7ca2ea39232b4bdc1831f088cf8772cbcfdfde1d74c43b918de24aa808
3
+ size 1089994880
model-00002-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:608bcaae953fe20abb77081886266d4853c3fff0615eab45ed8a0af5880b0429
3
+ size 989890704
model-00002-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27d2ab2a01a6c4bbd8d3130f4c7f272a3890efb33ef095804c391ccc676d6cbb
3
+ size 1089994896
model-00003-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e003c37da7e872c42d91b0cdb7b490b69445154c2785b846de38c353caedb32
3
+ size 989890712
model-00003-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67cd1803f5c0a5cac73236502b6b96ed87ca7b1be94ddeb06bf83516cd1262bd
3
+ size 932248448
model-00004-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d957312f3c875ee76a226bc9a5fd0ab301b27d32b1de9610fcb36d9c85b15f7
3
+ size 998287736
model-00004-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34a7f6a23104f1d3d6990d5e3723199a462075480f539e69aa2f2ad8bc3faba8
3
+ size 932233904
model-00005-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e82147b657c9015cd555d4f34efd5e566c177b7660f91bbda43913f8c373303
3
+ size 947956192
model-00005-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:312828ffdb5e483f0cb405b47373810faa3ea57c43f6cd4366d2226ede7ae82b
3
+ size 932233912
model-00006-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a2359c4374de0f3f0f474a2b8d294b4fa4ae82111fab896175bbdb05d485d2c
3
+ size 989890704
model-00006-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7d0886459e0ecf2993ee94a4b33b3a22e410eca4ba9e835d9bd97dab0ce2ff0
3
+ size 932233912
model-00007-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efc9f282eeb8741878481eba11cfd6916ce324b2651afc46ad6b7302f067f292
3
+ size 989890704
model-00007-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e12ff41eb53368f3d882dc3c305a33991f7d0627c4b0826046802329fcd98fa
3
+ size 932233912
model-00008-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817e88d5b5c49421aa50006bfd8be023a5f6d4840a2d5d131dd36f1d5a68b1b4
3
+ size 998287736
model-00008-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da71aacd6c80e5c94b58420453b8b5f8b4cf1df48be5baf30642f31ae9a7e4ac
3
+ size 932233912
model-00009-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5c55d4836f65ec38599dcdab1c2b62d782214582132d7c47ad8ebd6af540e99
3
+ size 947956192
model-00009-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7efbc673f9a4f6f116e12b166d38c3a1ab925c84ea785db7d01c2e1278ade9a2
3
+ size 932233912
model-00010-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2fe506514a207cc33a2daaae0e7e451eaad1c518d72b97072fb2c8edce78a72
3
+ size 989890712
model-00010-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:793849c5236a3af8e7db8a31467da3238720a1b000985fb182499987c850bea5
3
+ size 932233912
model-00011-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:746e90454abf25b89de0a1630b6deb42de45eb6b740ef12210900d26cd587e1e
3
+ size 989890704
model-00011-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f517728dc5b6f711878010b22f1d386ae5b101acb8340dee53c5b7b81c7b2715
3
+ size 932233912
model-00012-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c4425d84d5f7c1c9a59448ae4ac3f91cd964f0bab9beeaaedf8cea8eb66e87
3
+ size 998287736
model-00012-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9139b706a7e1c70197961a2fe667ee0a4ef65424bb21b270bad06b764650982
3
+ size 932233912
model-00013-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a275019bf5fb7cb519d439351bc21606b424735b92a9321127d912f7298e930
3
+ size 947956176
model-00013-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b2f0a2ac6f9b4f7311a23c19972936f3858d23a02257f3bf4b64f950b95e30d
3
+ size 932233912
model-00014-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57bec613dba0618d86c51df927ba5273a7ec48775ba396d78dfd404aa67467e9
3
+ size 989890688
model-00014-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f4f663183319d208b5bc681923cc225b12c029e833768809c703729ae82d0a3
3
+ size 932233912
model-00015-of-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88562da74888bcc892aa1d34579e5a4642ae41e42c1c03182e3151e9a839b1b0
3
+ size 755009424
model-00015-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d28f68b4bf99b4193a71aa9ee01a83b8b982fa541cc92a374ddcf4462d279fe
3
+ size 932233904
model-00016-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc08eba74e3e0c969a849a1f39d2172bf450e4317be70290a1c06b63256513bd
3
+ size 932233912
model-00017-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89ccc6e0131baaa2b58c9a73587ee0f386e5b91db029747e0036bcd1e67d0b73
3
+ size 932233912
model-00018-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab6cf7b53349e9f53433801ee078669011455c65e71efe6cc3737e94bd28943e
3
+ size 932233912
model-00019-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2586d358a0866ed7294b80bdef311c654f2881ec6c62f84dea120b55191f563f
3
+ size 932233912
model-00020-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00496af46a97cf7d6df56ef61f0732e9c84886def72754b7380fd370ab699fdf
3
+ size 932233912
model-00021-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb65590a5d7788924a9cd0cd293e11d86b5203da3deb0cfa59c689ea0a6dff8a
3
+ size 932233912
model-00022-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b31b26b2d02088fb8db55e78f1380b1a9e7c978a7508495126d3380536483638
3
+ size 932233912
model-00023-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0fa191172d0a04aa18d30787ed2701314f6cbb840a238ce2e9c965a02e7f85a
3
+ size 932233912
model-00024-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e5a49e71ef73248fc010722fad336d09cfd92abd7e0745f46c050fdf73eb5e9
3
+ size 932233904
model-00025-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0efe41650313b80e624c3c09af3773abebaa7be70ccd5d2c94e9333495b0a789
3
+ size 932233904
model-00026-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c1574b5a7ddbf748abf9e50d05058f89244c65144e9c16d53b27c1b9302e488
3
+ size 932233904
model-00027-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e157b8832b4aeaccf2e46e7b5f7d56af856bd28594610cafb9d68f8fed09856
3
+ size 932233904
model-00028-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4488cabc6fb74058bb835329b57799b0e6e0a54b24ff3fa6579b20b6159ef240
3
+ size 932233904
model-00029-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e7e980b6291f180db5c55687b30fd8fcc19387025df7a121b62800e68ec16af
3
+ size 932233904