dacorvo HF staff commited on
Commit
7c452af
·
verified ·
1 Parent(s): 83c8e95

Synchronizing local compiler cache.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +24 -0
  2. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/granite/ibm-granite/granite-3.1-2b-instruct/0211503669c9e68fbbde.json +1 -0
  3. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.1-8B-Instruct/25395edbfe4cb40ed4e9.json +1 -0
  4. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/7a87208395f3db5ba7be.json +1 -0
  5. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/8cd73c74d69aa6440798.json +1 -0
  6. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/ebbf84c3779811da8d2c.json +1 -0
  7. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/13bb5f11971eace7eeed.json +1 -0
  8. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/29904a0c0edb4679ee76.json +1 -0
  9. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/d7892042a1da5eaa0020.json +1 -0
  10. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/6faff6d0347b9b3197ed.json +1 -0
  11. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/f6232f240b5b98678a51.json +1 -0
  12. neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/Qwen/Qwen2.5-Math-1.5B/a5b11f2dd182bd813171.json +1 -0
  13. neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/compile_flags.json +1 -0
  14. neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.done +0 -0
  15. neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.hlo_module.pb +3 -0
  16. neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff +3 -0
  17. neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/compile_flags.json +1 -0
  18. neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.done +0 -0
  19. neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.hlo_module.pb +3 -0
  20. neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff +3 -0
  21. neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/compile_flags.json +1 -0
  22. neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.done +0 -0
  23. neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.hlo_module.pb +3 -0
  24. neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff +3 -0
  25. neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/compile_flags.json +1 -0
  26. neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.done +0 -0
  27. neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.hlo_module.pb +3 -0
  28. neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff +3 -0
  29. neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/compile_flags.json +1 -0
  30. neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.done +0 -0
  31. neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.hlo_module.pb +3 -0
  32. neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff +3 -0
  33. neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/compile_flags.json +1 -0
  34. neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.done +0 -0
  35. neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.hlo_module.pb +3 -0
  36. neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff +3 -0
  37. neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/compile_flags.json +1 -0
  38. neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.done +0 -0
  39. neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.hlo_module.pb +3 -0
  40. neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff +3 -0
  41. neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/compile_flags.json +1 -0
  42. neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.done +0 -0
  43. neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.hlo_module.pb +3 -0
  44. neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff +3 -0
  45. neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/compile_flags.json +1 -0
  46. neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.done +0 -0
  47. neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.hlo_module.pb +3 -0
  48. neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff +3 -0
  49. neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/compile_flags.json +1 -0
  50. neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.done +0 -0
.gitattributes CHANGED
@@ -7472,3 +7472,27 @@ neuronxcc-2.16.372.0+4a9b2326/MODULE_9e3cdf817e494ba86fd4+613edded/model.neff fi
7472
  neuronxcc-2.16.372.0+4a9b2326/MODULE_b2aaa317ae645625c9d1+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7473
  neuronxcc-2.16.372.0+4a9b2326/MODULE_d07d2aeb772cbb9c0ccd+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7474
  neuronxcc-2.16.372.0+4a9b2326/MODULE_ef26a928b1a6003d9b67+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7472
  neuronxcc-2.16.372.0+4a9b2326/MODULE_b2aaa317ae645625c9d1+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7473
  neuronxcc-2.16.372.0+4a9b2326/MODULE_d07d2aeb772cbb9c0ccd+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7474
  neuronxcc-2.16.372.0+4a9b2326/MODULE_ef26a928b1a6003d9b67+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7475
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7476
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7477
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7478
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7479
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7480
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7481
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7482
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7483
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7484
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7485
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7486
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7487
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7488
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7489
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7490
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7491
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7492
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7493
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7494
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7495
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7496
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7497
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
7498
+ neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.neff filter=lfs diff=lfs merge=lfs -text
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/granite/ibm-granite/granite-3.1-2b-instruct/0211503669c9e68fbbde.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["GraniteForCausalLM"], "attention_bias": false, "attention_dropout": 0.1, "attention_multiplier": 0.015625, "bos_token_id": 0, "embedding_multiplier": 12.0, "eos_token_id": 0, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "logits_scaling": 8.0, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "granite", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "ibm-granite/granite-3.1-2b-instruct", "checkpoint_revision": "374ef54e020a3ce208c65e96d6213922a87d8952", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 8, "pad_token_id": 0, "residual_multiplier": 0.22, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 5000000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 49155}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.1-8B-Instruct/25395edbfe4cb40ed4e9.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 128, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 8.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/7a87208395f3db5ba7be.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct", "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/8cd73c74d69aa6440798.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct", "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/ebbf84c3779811da8d2c.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct", "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/13bb5f11971eace7eeed.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/29904a0c0edb4679ee76.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/d7892042a1da5eaa0020.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/6faff6d0347b9b3197ed.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 100257, "embd_pdrop": 0.0, "eos_token_id": 100265, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 17920, "max_position_embeddings": 16384, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "microsoft/phi-4", "checkpoint_revision": "187ef0342fff0eb3333be9f00389385e95ef0b61", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 10, "original_max_position_embeddings": 16384, "pad_token_id": 100349, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 250000, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 100352}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/f6232f240b5b98678a51.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 100257, "embd_pdrop": 0.0, "eos_token_id": 100265, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 17920, "max_position_embeddings": 16384, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 16, "checkpoint_id": "microsoft/phi-4", "checkpoint_revision": "187ef0342fff0eb3333be9f00389385e95ef0b61", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 10, "original_max_position_embeddings": 16384, "pad_token_id": 100349, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 250000, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 100352}
neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/Qwen/Qwen2.5-Math-1.5B/a5b11f2dd182bd813171.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 1536, "initializer_range": 0.02, "intermediate_size": 8960, "max_position_embeddings": 4096, "max_window_layers": 21, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "Qwen/Qwen2.5-Math-1.5B", "checkpoint_revision": "4a83ca6e4526a4f2da3aa259ec36c259f66b2ab2", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 12, "num_hidden_layers": 28, "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 10000, "sliding_window": null, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "use_mrope": false, "use_sliding_window": false, "vocab_size": 151936}
neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa5f11d38562c29cf3284eb3b302c805c799403b793fc04dc4cd5411962cbea
3
+ size 165513
neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b46d912ec0d4ba1d798fb6055147df25a672f32b123053f9dfa75b9ba558f92
3
+ size 666624
neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a07f919670b2e693ad48e3c320a28ab9048ef4d0ca58a28ec377ad4a17c52c
3
+ size 465434
neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e49330035c9c64c1d19cc95d2fde40f92ee1eccb88a2ba3d4ae2be507351a31e
3
+ size 1639424
neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c508e43fb5e2ecfebc578758edfa421749e4baa67035764d681752f9251d95b
3
+ size 338318
neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:249191058af787e1bc95fabd033f90c2fe0c586d4130665f6d73b7e4d9b31af0
3
+ size 2243584
neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7f758ff7ee4c3ca022b464b5ccb1b254357fe32e46425ffc1dc1e81b623f1ce
3
+ size 222468
neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad6ca719717cf1591912264f0ba20fa7336ba8742fb5ad4d25f98d08d9824e8
3
+ size 8469504
neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48eae4af3605d17c8ede02c8932731e95d4e4fa629d24801fb1b6c8f6d2a1c0e
3
+ size 542299
neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8940acbcd0d34461745450fc622691f42f3bbfa99a7405ba245023026199138
3
+ size 3277824
neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:721efa4c0b96b61064f4ecf696b870970145eb8590122ee91a93f24609ec5e0a
3
+ size 355108
neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cf8f95dba796216068bbae29591b027b94a339edac7fcb9f83631802725188e
3
+ size 1199104
neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a8bfe85bf00a03e2819464a9320113afac5c60446bdf86b79028c88b23f1e86
3
+ size 424072
neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f962552dc243f7443af34e7b00b330ff0d7f4d4b37a4d12e64c1a9f7c96f74b
3
+ size 6124544
neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3b59758c297b87ef1706a98e7a672d3006e3d759f23b31b9309e697255b1755
3
+ size 557579
neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95d11208068d0dd63b7222bd523154de777acb813fcea09322cc5a217d9e70af
3
+ size 2274304
neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.done ADDED
File without changes
neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.hlo_module.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93e021f4b02d076e52df35b402056e3245f1cced1f42e6c1de9ee66d692be20d
3
+ size 454232
neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d0794ec2f0110042fe145132157d3a3a3a96765db7ada9d5298d82b9cb1de56
3
+ size 4977664
neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/compile_flags.json ADDED
@@ -0,0 +1 @@
 
 
1
+ ["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.done ADDED
File without changes