dacorvo HF staff committed on
Commit
4ea2c74
·
verified ·
1 Parent(s): 1002f15

Synchronizing local compiler cache.

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +34 -0
  2. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/gpt2/gpt2/a98695ecf15fb450e7fb.json +1 -0
  3. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-2b-instruct/1cb3e61df94568db875d.json +1 -0
  4. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-8b-instruct/a77e916953a3fe0abad7.json +1 -0
  5. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-8b-instruct/d2c65782eb016a7c7d3d.json +1 -0
  6. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-8b-instruct/d7f7ad625f88a41acce9.json +1 -0
  7. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/llama/meta-llama/Llama-3.2-1B/a08b562da91aa93cecef.json +1 -0
  8. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/qwen2/Qwen/Qwen2.5-0.5B/7f457366ad13eafe6b8a.json +1 -0
  9. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/training/llama/michaelbenayoun/llama-2-tiny-4kv-heads-4layers-random/0eb20cc95fb402dd41b5.json +1 -0
  10. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/training/llama/michaelbenayoun/llama-2-tiny-4kv-heads-4layers-random/64dfccc36a935e758422.json +1 -0
  11. neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev1/inference/llama/NousResearch/Hermes-2-Theta-Llama-3-8B/af163c75a04bbd5785ad.json +1 -0
  12. neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/compile_flags.json +1 -0
  13. neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.done +0 -0
  14. neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.hlo_module.pb +3 -0
  15. neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.neff +3 -0
  16. neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/compile_flags.json +1 -0
  17. neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.done +0 -0
  18. neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.hlo_module.pb +3 -0
  19. neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.neff +3 -0
  20. neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/compile_flags.json +1 -0
  21. neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/model.done +0 -0
  22. neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/model.hlo_module.pb +3 -0
  23. neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/model.neff +0 -0
  24. neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/compile_flags.json +1 -0
  25. neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.done +0 -0
  26. neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.hlo_module.pb +3 -0
  27. neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.neff +3 -0
  28. neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/compile_flags.json +1 -0
  29. neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/model.done +0 -0
  30. neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/model.hlo_module.pb +3 -0
  31. neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/model.neff +0 -0
  32. neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/compile_flags.json +1 -0
  33. neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/model.done +0 -0
  34. neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/model.hlo_module.pb +3 -0
  35. neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/model.neff +0 -0
  36. neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/compile_flags.json +1 -0
  37. neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/model.done +0 -0
  38. neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/model.hlo_module.pb +3 -0
  39. neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/model.neff +0 -0
  40. neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/compile_flags.json +1 -0
  41. neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/model.done +0 -0
  42. neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/model.hlo_module.pb +3 -0
  43. neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/model.neff +0 -0
  44. neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/compile_flags.json +1 -0
  45. neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/model.done +0 -0
  46. neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/model.hlo_module.pb +3 -0
  47. neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/model.neff +0 -0
  48. neuronxcc-2.15.143.0+e39249ad/MODULE_12007993937039433331+cc298dfa/compile_flags.json +1 -0
  49. neuronxcc-2.15.143.0+e39249ad/MODULE_12007993937039433331+cc298dfa/model.done +0 -0
  50. neuronxcc-2.15.143.0+e39249ad/MODULE_12007993937039433331+cc298dfa/model.hlo_module.pb +3 -0
.gitattributes CHANGED
@@ -1506,3 +1506,37 @@ neuronxcc-2.16.345.0+69131dd3/MODULE_58100a7445826a304805+613edded/model.neff fi
1506
  neuronxcc-2.16.345.0+69131dd3/MODULE_a4bb4e6e225de0782e33+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
1507
  neuronxcc-2.16.345.0+69131dd3/MODULE_45342279990edbf2b5cf+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
1508
  neuronxcc-2.16.345.0+69131dd3/MODULE_7a9ad5ca2b9a4c61ce61+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1506
  neuronxcc-2.16.345.0+69131dd3/MODULE_a4bb4e6e225de0782e33+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
1507
  neuronxcc-2.16.345.0+69131dd3/MODULE_45342279990edbf2b5cf+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
1508
  neuronxcc-2.16.345.0+69131dd3/MODULE_7a9ad5ca2b9a4c61ce61+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
1509
+ neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1510
+ neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1511
+ neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1512
+ neuronxcc-2.15.143.0+e39249ad/MODULE_12a0552d04c7615b5f0d+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1513
+ neuronxcc-2.15.143.0+e39249ad/MODULE_20e558f7c64e10492a47+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1514
+ neuronxcc-2.15.143.0+e39249ad/MODULE_24fb07bef8bec6b8c55d+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1515
+ neuronxcc-2.15.143.0+e39249ad/MODULE_3107289755dc274c6618+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1516
+ neuronxcc-2.15.143.0+e39249ad/MODULE_45342279990edbf2b5cf+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1517
+ neuronxcc-2.15.143.0+e39249ad/MODULE_475f6a6337c3368d1634+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1518
+ neuronxcc-2.15.143.0+e39249ad/MODULE_5893dc47cb102343059e+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1519
+ neuronxcc-2.15.143.0+e39249ad/MODULE_5e114d6e37dbc83fd0d5+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1520
+ neuronxcc-2.15.143.0+e39249ad/MODULE_615e9729fc34f530d320+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1521
+ neuronxcc-2.15.143.0+e39249ad/MODULE_624bf4f0068a36d25cc2+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1522
+ neuronxcc-2.15.143.0+e39249ad/MODULE_6262eabbb464a129229d+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1523
+ neuronxcc-2.15.143.0+e39249ad/MODULE_6655ab3947956517350a+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1524
+ neuronxcc-2.15.143.0+e39249ad/MODULE_73bb972def7a8f46337f+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1525
+ neuronxcc-2.15.143.0+e39249ad/MODULE_7505bc281307b5e037a1+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1526
+ neuronxcc-2.15.143.0+e39249ad/MODULE_866f556d5bda514c53b5+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1527
+ neuronxcc-2.15.143.0+e39249ad/MODULE_95f0ce72279e469fa4dc+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1528
+ neuronxcc-2.15.143.0+e39249ad/MODULE_9b250895e3e1222009a6+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1529
+ neuronxcc-2.15.143.0+e39249ad/MODULE_9d845d35a80526bffb75+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1530
+ neuronxcc-2.15.143.0+e39249ad/MODULE_9e2cc8d23b5dc1d7bbcd+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1531
+ neuronxcc-2.15.143.0+e39249ad/MODULE_a42027513ff1c4e1a28b+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1532
+ neuronxcc-2.15.143.0+e39249ad/MODULE_ae142d763c7fe49cf917+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1533
+ neuronxcc-2.15.143.0+e39249ad/MODULE_b5542aa0c46559861e76+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1534
+ neuronxcc-2.15.143.0+e39249ad/MODULE_b60a34f4644d1f39a41c+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1535
+ neuronxcc-2.15.143.0+e39249ad/MODULE_ba3d6e3fd76f1db00baa+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1536
+ neuronxcc-2.15.143.0+e39249ad/MODULE_cab66edf22efc0df4bbc+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1537
+ neuronxcc-2.15.143.0+e39249ad/MODULE_d400c4285015b3e828bb+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1538
+ neuronxcc-2.15.143.0+e39249ad/MODULE_dfe7e6082eb121381a18+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1539
+ neuronxcc-2.15.143.0+e39249ad/MODULE_e4be9bcec68b9af4d7ce+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1540
+ neuronxcc-2.15.143.0+e39249ad/MODULE_eeea370b5fb22f353681+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1541
+ neuronxcc-2.15.143.0+e39249ad/MODULE_f37ba14e8cecd0289618+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
1542
+ neuronxcc-2.15.143.0+e39249ad/MODULE_f6695fce8439b8324614+39f12043/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/gpt2/gpt2/a98695ecf15fb450e7fb.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"activation_function": "gelu_new", "architectures": ["GPT2LMHeadModel"], "attn_pdrop": 0.1, "bos_token_id": 50256, "embd_pdrop": 0.1, "eos_token_id": 50256, "initializer_range": 0.02, "layer_norm_epsilon": 1e-05, "model_type": "gpt2", "n_ctx": 1024, "n_embd": 768, "n_head": 12, "n_inner": null, "n_layer": 12, "n_positions": 1024, "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "gpt2", "checkpoint_revision": "607a30d783dfa663caf39e06633721c8d4cfcd7e", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 1024, "task": "text-generation"}, "reorder_and_upcast_attn": false, "resid_pdrop": 0.1, "scale_attn_by_inverse_layer_idx": false, "scale_attn_weights": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "summary_type": "cls_index", "summary_use_proj": true, "task_specific_params": {"text-generation": {"do_sample": true, "max_length": 50}}, "use_cache": true, "vocab_size": 50257}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-2b-instruct/1cb3e61df94568db875d.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["GraniteForCausalLM"], "attention_bias": false, "attention_dropout": 0.1, "attention_multiplier": 0.015625, "bos_token_id": 0, "embedding_multiplier": 12.0, "eos_token_id": 0, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "logits_scaling": 8.0, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "granite", "neuron": {"auto_cast_type": "bf16", "batch_size": 8, "checkpoint_id": "ibm-granite/granite-3.1-2b-instruct", "checkpoint_revision": "a06c9a0fef05d8111ca1f77b60f477443c526043", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 8, "pad_token_id": 0, "residual_multiplier": 0.22, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 5000000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 49155}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-8b-instruct/a77e916953a3fe0abad7.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["GraniteForCausalLM"], "attention_bias": false, "attention_dropout": 0.1, "attention_multiplier": 0.0078125, "bos_token_id": 0, "embedding_multiplier": 12.0, "eos_token_id": 0, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 12800, "logits_scaling": 16.0, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "granite", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "ibm-granite/granite-3.1-8b-instruct", "checkpoint_revision": "7f4bb8b56ad1c53b49b07a8f9f0ec43204e07ef2", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 8, "pad_token_id": 0, "residual_multiplier": 0.22, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 49155}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-8b-instruct/d2c65782eb016a7c7d3d.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["GraniteForCausalLM"], "attention_bias": false, "attention_dropout": 0.1, "attention_multiplier": 0.0078125, "bos_token_id": 0, "embedding_multiplier": 12.0, "eos_token_id": 0, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 12800, "logits_scaling": 16.0, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "granite", "neuron": {"auto_cast_type": "bf16", "batch_size": 8, "checkpoint_id": "ibm-granite/granite-3.1-8b-instruct", "checkpoint_revision": "7f4bb8b56ad1c53b49b07a8f9f0ec43204e07ef2", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 8, "pad_token_id": 0, "residual_multiplier": 0.22, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 49155}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/granite/ibm-granite/granite-3.1-8b-instruct/d7f7ad625f88a41acce9.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["GraniteForCausalLM"], "attention_bias": false, "attention_dropout": 0.1, "attention_multiplier": 0.0078125, "bos_token_id": 0, "embedding_multiplier": 12.0, "eos_token_id": 0, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 12800, "logits_scaling": 16.0, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "granite", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "ibm-granite/granite-3.1-8b-instruct", "checkpoint_revision": "7f4bb8b56ad1c53b49b07a8f9f0ec43204e07ef2", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 8, "pad_token_id": 0, "residual_multiplier": 0.22, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 49155}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/llama/meta-llama/Llama-3.2-1B/a08b562da91aa93cecef.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-3.2-1B", "checkpoint_revision": "4e20de362430cd3b72f300e6b0f18e50e7166e08", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/inference/qwen2/Qwen/Qwen2.5-0.5B/7f457366ad13eafe6b8a.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 896, "initializer_range": 0.02, "intermediate_size": 4864, "max_position_embeddings": 32768, "max_window_layers": 24, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "Qwen/Qwen2.5-0.5B", "checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 14, "num_hidden_layers": 24, "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "use_mrope": false, "use_sliding_window": false, "vocab_size": 151936}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/training/llama/michaelbenayoun/llama-2-tiny-4kv-heads-4layers-random/0eb20cc95fb402dd41b5.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_attn_implementation_autoset": true, "architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "head_dim": 4, "hidden_act": "silu", "hidden_size": 128, "initializer_range": 0.02, "intermediate_size": 128, "is_decoder": true, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"compiler_version": "2.15.143.0+e39249ad", "input_specs": {"attention_mask": [1, 32], "input_ids": [1, 32], "labels": [1, 32]}, "model_class": "LlamaForCausalLM", "num_neuron_cores_per_node": 2, "pipeline_parallel_size": 1, "precision": "bfloat16", "tensor_parallel_size": 1, "training": true}, "num_attention_heads": 32, "num_hidden_layers": 4, "num_key_value_heads": 4, "pad_token_id": 0, "pretraining_tp": 1, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float32", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev0/training/llama/michaelbenayoun/llama-2-tiny-4kv-heads-4layers-random/64dfccc36a935e758422.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_attn_implementation_autoset": true, "architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "head_dim": 4, "hidden_act": "silu", "hidden_size": 128, "initializer_range": 0.02, "intermediate_size": 128, "is_decoder": true, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"compiler_version": "2.15.143.0+e39249ad", "input_specs": {"attention_mask": [1, 32], "input_ids": [1, 32], "labels": [1, 32]}, "model_class": "LlamaForCausalLM", "num_neuron_cores_per_node": 2, "pipeline_parallel_size": 1, "precision": "bfloat16", "tensor_parallel_size": 2, "training": true}, "num_attention_heads": 32, "num_hidden_layers": 4, "num_key_value_heads": 4, "pad_token_id": 0, "pretraining_tp": 1, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float32", "use_cache": true, "vocab_size": 32000}
neuronxcc-2.15.143.0+e39249ad/0_REGISTRY/0.0.28.dev1/inference/llama/NousResearch/Hermes-2-Theta-Llama-3-8B/af163c75a04bbd5785ad.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128003, "head_dim": 128, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "NousResearch/Hermes-2-Theta-Llama-3-8B", "checkpoint_revision": "57a73110702e7b05ba3f39fef36297454c680725", "compiler_type": "neuronx-cc", "compiler_version": "2.15.143.0+e39249ad", "num_cores": 2, "sequence_length": 2048, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68a305d1cdc88fb60e2b1c43eeb7d78761a992531f9666c5b68db23dd8d9357e
3
+ size 427956
neuronxcc-2.15.143.0+e39249ad/MODULE_039209d63913e93c1e86+39f12043/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2be217728c00a4fb50ff097f342d339e14d71f045d6f9ac74e440f8cf4204f47
3
+ size 9135104
neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c11c4ecd0fa5f202e5783b39e3c8649491963a0e723f35c288af8a2a8551f649
3
+ size 184812
neuronxcc-2.15.143.0+e39249ad/MODULE_08bf44f19376de227f4a+39f12043/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:933b76fcd0afddcf53b8207545f60e017e3a1e484165f845a0cf640ec5fdbc89
3
+ size 2827264
neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5282bdef8463b48977137e5a0b003bf5832f81f44bede7463ede348fd3fc2251
3
+ size 130638
neuronxcc-2.15.143.0+e39249ad/MODULE_0c6016f7aa301b249715+39f12043/model.neff ADDED
Binary file (441 kB). View file
 
neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd1fd11eaf38deb423ff4f463a72f2f089e65252945fc35562df4d1f9982f2fc
3
+ size 569348
neuronxcc-2.15.143.0+e39249ad/MODULE_0fff2decd536cc6fae0b+39f12043/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29bf7c1dee57b0c2b7c30b4c8936d048f65a3e06be296f69fb6c448d028d9241
3
+ size 5991424
neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ []
neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51e439d7b74d6aeb3ea348698f65c5223071806940b62b7848048b08a329f41a
3
+ size 25736
neuronxcc-2.15.143.0+e39249ad/MODULE_10699447453196921194+d7517139/model.neff ADDED
Binary file (52.2 kB). View file
 
neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ []
neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f4dab6ac5f7e557f5d88e6d3db95a54dc976d6787a3e8fdb79bf05a40e7d232
3
+ size 1219
neuronxcc-2.15.143.0+e39249ad/MODULE_10855203598795096374+d7517139/model.neff ADDED
Binary file (62.5 kB). View file
 
neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer"]
neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f362864d6d5d0fd4a64e43ec04a659bc37751439c207a8359197cdf754c608ee
3
+ size 140419
neuronxcc-2.15.143.0+e39249ad/MODULE_11438465433648369693+cc298dfa/model.neff ADDED
Binary file (308 kB). View file
 
neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ []
neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96bc04422b953bd9a292496414ae9471dd67d193cbd28bcd070015a987a20081
3
+ size 112950
neuronxcc-2.15.143.0+e39249ad/MODULE_1146904795246293467+d7517139/model.neff ADDED
Binary file (493 kB). View file
 
neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ []
neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdd59a43db7bdc9c5ce76b1ee8d8b2d73a0337944747ea8124c233a27f7d4c5a
3
+ size 126962
neuronxcc-2.15.143.0+e39249ad/MODULE_11866581511567855346+d7517139/model.neff ADDED
Binary file (359 kB). View file
 
neuronxcc-2.15.143.0+e39249ad/MODULE_12007993937039433331+cc298dfa/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--model-type=transformer"]
neuronxcc-2.15.143.0+e39249ad/MODULE_12007993937039433331+cc298dfa/model.done ADDED
File without changes
neuronxcc-2.15.143.0+e39249ad/MODULE_12007993937039433331+cc298dfa/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae0d4e1acedfa2f030981df45cf6e2b626601d9719594bae5628edef4d44b148
3
+ size 125892