diff --git a/.gitattributes b/.gitattributes index 598b1317346f81863cf40df5f9b512f9dc093cae..fa03224798457808e7bd29d94bb85579b2dd154a 100644 --- a/.gitattributes +++ b/.gitattributes @@ -7472,3 +7472,27 @@ neuronxcc-2.16.372.0+4a9b2326/MODULE_9e3cdf817e494ba86fd4+613edded/model.neff fi neuronxcc-2.16.372.0+4a9b2326/MODULE_b2aaa317ae645625c9d1+613edded/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.16.372.0+4a9b2326/MODULE_d07d2aeb772cbb9c0ccd+613edded/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.16.372.0+4a9b2326/MODULE_ef26a928b1a6003d9b67+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.neff filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/granite/ibm-granite/granite-3.1-2b-instruct/0211503669c9e68fbbde.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/granite/ibm-granite/granite-3.1-2b-instruct/0211503669c9e68fbbde.json new file mode 100644 index 0000000000000000000000000000000000000000..4ec509eab38c87a4045e4249d4a32240ef5de55f --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/granite/ibm-granite/granite-3.1-2b-instruct/0211503669c9e68fbbde.json @@ -0,0 +1 @@ +{"architectures": ["GraniteForCausalLM"], "attention_bias": false, "attention_dropout": 0.1, "attention_multiplier": 0.015625, "bos_token_id": 0, "embedding_multiplier": 12.0, "eos_token_id": 0, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "logits_scaling": 8.0, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "granite", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "ibm-granite/granite-3.1-2b-instruct", "checkpoint_revision": "374ef54e020a3ce208c65e96d6213922a87d8952", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 40, "num_key_value_heads": 8, "pad_token_id": 0, "residual_multiplier": 0.22, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 5000000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 49155} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.1-8B-Instruct/25395edbfe4cb40ed4e9.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.1-8B-Instruct/25395edbfe4cb40ed4e9.json new file mode 100644 index 0000000000000000000000000000000000000000..550183760a923165933d18b6132f7fc6d13ea9c7 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.1-8B-Instruct/25395edbfe4cb40ed4e9.json @@ -0,0 +1 @@ +{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 128, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-3.1-8B-Instruct", "checkpoint_revision": "0e9e39f249a16976918f6564b8830bc894c89659", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 8.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/7a87208395f3db5ba7be.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/7a87208395f3db5ba7be.json new file mode 100644 index 0000000000000000000000000000000000000000..19df718351af31bfbf600d879a8b5a25a99ad3f7 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/7a87208395f3db5ba7be.json @@ -0,0 +1 @@ +{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct", "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/8cd73c74d69aa6440798.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/8cd73c74d69aa6440798.json new file mode 100644 index 0000000000000000000000000000000000000000..a1ccee35001f1a90ce1b88f3fc8b4ccff3be3089 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/8cd73c74d69aa6440798.json @@ -0,0 +1 @@ +{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct", "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/ebbf84c3779811da8d2c.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/ebbf84c3779811da8d2c.json new file mode 100644 index 0000000000000000000000000000000000000000..c26250e08bff574b67cac4514f77395cfb690750 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/llama/meta-llama/Llama-3.2-1B-Instruct/ebbf84c3779811da8d2c.json @@ -0,0 +1 @@ +{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 64, "hidden_act": "silu", "hidden_size": 2048, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-3.2-1B-Instruct", "checkpoint_revision": "9213176726f574b556790deb65791e0c5aa438b6", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 16, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 32.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/13bb5f11971eace7eeed.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/13bb5f11971eace7eeed.json new file mode 100644 index 0000000000000000000000000000000000000000..4add0d642146f68385e7da81908aeb98b0015453 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/13bb5f11971eace7eeed.json @@ -0,0 +1 @@ +{"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 1, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/29904a0c0edb4679ee76.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/29904a0c0edb4679ee76.json new file mode 100644 index 0000000000000000000000000000000000000000..281368651ca66c4bfc1f82ceb6b3d5284f42acbe --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/29904a0c0edb4679ee76.json @@ -0,0 +1 @@ +{"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 4, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/d7892042a1da5eaa0020.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/d7892042a1da5eaa0020.json new file mode 100644 index 0000000000000000000000000000000000000000..35c74246d86f3cb3e8c81a9edcbbae4d98fed852 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/Phi-3-mini-4k-instruct/d7892042a1da5eaa0020.json @@ -0,0 +1 @@ +{"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "auto_map": {"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config", "AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"}, "bos_token_id": 1, "embd_pdrop": 0.0, "eos_token_id": 32000, "hidden_act": "silu", "hidden_size": 3072, "initializer_range": 0.02, "intermediate_size": 8192, "max_position_embeddings": 4096, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "microsoft/Phi-3-mini-4k-instruct", "checkpoint_revision": "0a67737cc96d2554230f90338b163bc6380a2a85", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "original_max_position_embeddings": 4096, "pad_token_id": 32000, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "sliding_window": 2047, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 32064} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/6faff6d0347b9b3197ed.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/6faff6d0347b9b3197ed.json new file mode 100644 index 0000000000000000000000000000000000000000..f34aca95159e6a7c5eeb44d14e3d972dfa1b523e --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/6faff6d0347b9b3197ed.json @@ -0,0 +1 @@ +{"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 100257, "embd_pdrop": 0.0, "eos_token_id": 100265, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 17920, "max_position_embeddings": 16384, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "microsoft/phi-4", "checkpoint_revision": "187ef0342fff0eb3333be9f00389385e95ef0b61", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 10, "original_max_position_embeddings": 16384, "pad_token_id": 100349, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 250000, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 100352} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/f6232f240b5b98678a51.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/f6232f240b5b98678a51.json new file mode 100644 index 0000000000000000000000000000000000000000..debe9ae3c303469b2337e1bdea1a4977846fda18 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/phi3/microsoft/phi-4/f6232f240b5b98678a51.json @@ -0,0 +1 @@ +{"architectures": ["Phi3ForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 100257, "embd_pdrop": 0.0, "eos_token_id": 100265, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 17920, "max_position_embeddings": 16384, "model_type": "phi3", "neuron": {"auto_cast_type": "bf16", "batch_size": 16, "checkpoint_id": "microsoft/phi-4", "checkpoint_revision": "187ef0342fff0eb3333be9f00389385e95ef0b61", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 10, "original_max_position_embeddings": 16384, "pad_token_id": 100349, "resid_pdrop": 0.0, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 250000, "sliding_window": null, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 100352} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/Qwen/Qwen2.5-Math-1.5B/a5b11f2dd182bd813171.json b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/Qwen/Qwen2.5-Math-1.5B/a5b11f2dd182bd813171.json new file mode 100644 index 0000000000000000000000000000000000000000..70ca2eb16e0ca9e712202c581b2364ae9117a76a --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/0_REGISTRY/0.1.0.dev1/inference/qwen2/Qwen/Qwen2.5-Math-1.5B/a5b11f2dd182bd813171.json @@ -0,0 +1 @@ +{"architectures": ["Qwen2ForCausalLM"], "attention_dropout": 0.0, "bos_token_id": 151643, "eos_token_id": 151643, "hidden_act": "silu", "hidden_size": 1536, "initializer_range": 0.02, "intermediate_size": 8960, "max_position_embeddings": 4096, "max_window_layers": 21, "model_type": "qwen2", "neuron": {"auto_cast_type": "bf16", "batch_size": 2, "checkpoint_id": "Qwen/Qwen2.5-Math-1.5B", "checkpoint_revision": "4a83ca6e4526a4f2da3aa259ec36c259f66b2ab2", "compiler_type": "neuronx-cc", "compiler_version": "2.16.372.0+4a9b2326", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 12, "num_hidden_layers": 28, "num_key_value_heads": 2, "rms_norm_eps": 1e-06, "rope_scaling": null, "rope_theta": 10000, "sliding_window": null, "tie_word_embeddings": true, "torch_dtype": "bfloat16", "use_cache": true, "use_mrope": false, "use_sliding_window": false, "vocab_size": 151936} \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a89add9669f37110f009e96a6237333c808af3af --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa5f11d38562c29cf3284eb3b302c805c799403b793fc04dc4cd5411962cbea +size 165513 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..361c7cf4b7def437c1e25634e041104a6ea4a14b --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_008512cdad534106824b+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b46d912ec0d4ba1d798fb6055147df25a672f32b123053f9dfa75b9ba558f92 +size 666624 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b1a573d94957230a189d5b47f81e83dc6a59d2e9 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a07f919670b2e693ad48e3c320a28ab9048ef4d0ca58a28ec377ad4a17c52c +size 465434 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e81f0c6e8d4a8b44156c487626a9003cff465b59 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_10bd954bb3f712b9cf93+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49330035c9c64c1d19cc95d2fde40f92ee1eccb88a2ba3d4ae2be507351a31e +size 1639424 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c5b72165075b83a176b05cdd075845c94531b4cf --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c508e43fb5e2ecfebc578758edfa421749e4baa67035764d681752f9251d95b +size 338318 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0932bd22aaa20ebf7d17bc05f9ce06107e4861b4 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_17de9f35d8b452d30d64+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249191058af787e1bc95fabd033f90c2fe0c586d4130665f6d73b7e4d9b31af0 +size 2243584 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9be0e6b21181ac9f610969b30959003912935cb0 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f758ff7ee4c3ca022b464b5ccb1b254357fe32e46425ffc1dc1e81b623f1ce +size 222468 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bec2eabcff25a0141f72cbbdb6fdd88507f15729 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_215d5f9f03ff7f796870+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad6ca719717cf1591912264f0ba20fa7336ba8742fb5ad4d25f98d08d9824e8 +size 8469504 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..737b32a10859e7c07357be9a5794f744b9d1daa8 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48eae4af3605d17c8ede02c8932731e95d4e4fa629d24801fb1b6c8f6d2a1c0e +size 542299 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ae62289aff7f02005b466ea59fbc4ac2c27632b4 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_2e2fefac0330c92cf935+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8940acbcd0d34461745450fc622691f42f3bbfa99a7405ba245023026199138 +size 3277824 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..eca42e4cdd2de949d6bfd6f286f90abb487aa1b4 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721efa4c0b96b61064f4ecf696b870970145eb8590122ee91a93f24609ec5e0a +size 355108 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..08427ce26c4e2b6e079d7bda74b3d5962a9e6d95 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_399d134629eb34a00d43+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf8f95dba796216068bbae29591b027b94a339edac7fcb9f83631802725188e +size 1199104 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..09a16a77aea6f4d73a899e0d40a2f5618b052c46 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8bfe85bf00a03e2819464a9320113afac5c60446bdf86b79028c88b23f1e86 +size 424072 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ec4214c07f281174ed1316838b9b18aab29a7b3f --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_40c932379328aee8b619+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f962552dc243f7443af34e7b00b330ff0d7f4d4b37a4d12e64c1a9f7c96f74b +size 6124544 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1b49f87f29495a49fdc21838c01402fee9e68c43 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b59758c297b87ef1706a98e7a672d3006e3d759f23b31b9309e697255b1755 +size 557579 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d2713a3d398fb533c317d6f5c96ed2757bbf30ee --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_41bd479e657e66f398e1+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d11208068d0dd63b7222bd523154de777acb813fcea09322cc5a217d9e70af +size 2274304 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1708cfdc068a3d3de2ee81e73d3908749d1ad110 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e021f4b02d076e52df35b402056e3245f1cced1f42e6c1de9ee66d692be20d +size 454232 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d57c4999f08f6e2ad9c748c42bdc3a41d63d6b46 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4723142e6e2041791232+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0794ec2f0110042fe145132157d3a3a3a96765db7ada9d5298d82b9cb1de56 +size 4977664 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7f1942d89d2fca6890546720dfe2ad2747fdd508 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00d9a3a248a49de28028535a049b7ccb89f33662e60859a3118084ba500eb361 +size 307963 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..67ff262a125916b82ca2a0225fc0e8fb9c5c4068 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_4ed4eafdd8b57b2a58ba+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed14fd191433ab42d1c2fa28a5f95e9bea6f5058c4b436bb281b849d800e8c5e +size 2274304 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..533cc83d0d64dc26cd1be46a978848c10468c630 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762b97c9c6924c976cd169cceaa529fe92156e9c78b973ee8a17402f125953b7 +size 442251 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f30ee7fe6378be416f443597ed3e15c92c7c0fc7 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_626306e0d30994029849+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd99521a70ea27e19c2e4eb4dbc77fda2b308d4276ce747d2c4a21b4242a181 +size 22662144 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8816c620db08cb9133c301bfa32b54646a39b72b --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0c314b49c161be98a3bfc5f10f6f14b781e07f6e9da8cdb01bedf7322401b4 +size 427661 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..eb0587864c94c27d47b175bf8610553bc9bf82fc --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_66e776ad8f8401a7fa1f+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d86fd8db6f8084fdedf5395b7e5d4db15d2b7c9c9b214e64ea4e40d59b141c +size 9729024 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7bf8cbf156df1ef38452543ea62083a727851484 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee18731f09bac36cbad24bcae52a8dab998fd1a6d56c812d4edc6ecf505770b6 +size 181102 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..67d44c7940a2ae96cc981755927e0683f8378f60 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7323a70130bb87727b84+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad0bb5c2148ff008ed74b31ebfd98febe3f79ad762e9b66ee971555cc30bcfd +size 881664 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..956dd29c5f069f181097cc7b76ad635acdfdfd2b --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a538f89d259b2080257109ed42f1c162f52a0103c6f52c922235713ecc62b59 +size 243895 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..762dfea66250aab0c2ecd050dcfc053daae8722c --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_7f54d4d3885e2a479ab4+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f31c274b9a21adc9c2ae9bc68b74f963296a314ba94c8a056b11e4e2dae351e3 +size 3267584 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5d14a73dca67541eb559421a8d232c7ba9261924 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d45302a9ecd81e541c5c931cbbfeeb86d2300db835958a2807d62a51d1fb9f2 +size 181166 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4ed9a0ec14e2e360eb4cd556f27a79afe5ec4926 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_827f458fd58fe6442166+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d08ff08b2f619f9ab32cccd8dbd8901b490e84a0df8bc96c6cef3213e78b13 +size 943104 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..72b0b816e36e9e0dba7e050c752d556e8480d90d --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7653bf5cb766a55c4466f9f4dbbee7b92bbb8995469c0682d77f2fa06d62cf8 +size 568423 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9bcd011976499f0a5687a8e89242dd315f09ccd4 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_8d1befe3d92435e31fdf+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737d6c87a3b801a881c6e22411587c16a5c38fdf177dfbb48b4e845396af6b92 +size 20788224 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c6833df84554faa49238785c612546a71e217bf1 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2b4303852062995e9c60172cc6e87715bb7ba138e991b25133d27354ba6ccc +size 432583 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8bf35de2061427042184a4795b1e455569f4c85b --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_949152ff315aeb616749+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9d4c17d4a0282d20f7f933e3f53dab5e438d6f8ffdb59cabc1056ea4823006 +size 22447104 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..38d7bdaac3006f863c0cdb56e22240aa5dd4175e --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61216a00d4d80f539ba155714bb7cd8c3bca57a5fade7a7d77968b45352f0e9 +size 199884 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fb13ed464a4b6f20f3995a5738889d104b436fa4 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_94932be571ca32c0d6c9+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7130267cdace7d0f4312a631e0c907beb085cc8d580f65a745516c9cff620ef +size 8715264 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f31de6c7bd5b8c9d7322dd28c6d89deae422b3e2 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0311b2f6cf93568da65687c069ef1710020cae34665db6ec948f0d47e11ad58c +size 307067 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..29a18d14fc37f3706bdaadd744946badcd5ff316 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_95f239593a81a9baed26+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68b18f2b91d87b7c8f9dfa26279cbf0eecdb252322ad212719eb39b0406d56d4 +size 1895424 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0f4b0701008b9221166f0f68be952a43e8d9bc05 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f80afb79a1851a44429f3639acd8520c7c35a5a199b42e02495528dcdc6c8e +size 348304 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e4150d54b5bf083c12843dd097a4d2b1912a960f --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_a307a86e0d389d7d8d9e+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2186d47af994a48be3d9c6c97e9372c044516963ced97f626e8aab1a7420e11b +size 2202624 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f727de232d93821e58a77f8604ee6abfa95e8653 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff88e53093945e4e85d285bbf1e141c6d99c7ee50d883af6367afa3506a21235 +size 222404 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..292c1a283ce65c4c2233136df2c697ce5d68ed9a --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b3ac85ee34a5d9e564ba+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9172abb725e4bf4252b11a326e33a8c9b220247a59ba23eff4281cc0d375c87 +size 8469504 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..948be61bb91c5fb521f9dd11115e33f25b7508e6 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f84243ebd4bd860e5f1448f0515a979f65a2f03fb0780d9efedf588e1cbe799 +size 432393 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..33e92947a3c9d6ecd2d48472d3b4df24ca2c9889 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_b4a7a4856dcbd900d6ed+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76667c15f54eef78c5a17ed09bccfb6f53ef15658154a02fc06e1d9f122b16c9 +size 21914624 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..03f3c72504fa83c96a330d365582a9072c4a9fff --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706bbf477c2dcf229273f55bd2898f39c210713cec07c6cf5624e61247a17ce5 +size 386860 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..227687971f9bea075232fd472bc03e4dfe11817d --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_c0740fe961da69526f92+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860caa8537813d427e365c845d0872d1f03d9d4046acf51db0a4f095e5ffb739 +size 22897664 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/compile_flags.json b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0c655e4bcad17c00d4d9ec479b31fc9e637d4287 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"] \ No newline at end of file diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.done b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.hlo_module.pb b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b9527492e192f48a06d66b6e24496a56711bfd0b --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:955d81ae424ffcb7ddb2401bd64744474b062da05b27f1a470f696ea47ebd08e +size 338639 diff --git a/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.neff b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0b02661d733cdf34f49c6082b46de30d3c668a63 --- /dev/null +++ b/neuronxcc-2.16.372.0+4a9b2326/MODULE_f914d922823d8ceace3c+613edded/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899f3a92aa103caf6aa05c2479ce5f8170d60455ff5ce3566d0c31b8b2fc0c72 +size 2366464