diff --git a/.gitattributes b/.gitattributes index 377a954544d49f374f0107b87ead5ee429ff6634..86cc25f0027bd26e2296c39ba1f5f658d55b4567 100644 --- a/.gitattributes +++ b/.gitattributes @@ -3361,3 +3361,68 @@ neuronxcc-2.19.8089.0+8ab9f450/MODULE_23d27f640534fb2c4304+5be477de/model.neff f neuronxcc-2.19.8089.0+8ab9f450/MODULE_23d27f640534fb2c4304+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text neuronxcc-2.19.8089.0+8ab9f450/MODULE_38ed63d19a6b0761a692+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bce7228204bd2d4577b+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.neff filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/38357c754f2cbd1d382e.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/38357c754f2cbd1d382e.json new file mode 100644 index 0000000000000000000000000000000000000000..58da43d30f7e4c8421019dee35b1198e377eced2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/38357c754f2cbd1d382e.json @@ -0,0 +1,77 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 8192, + "initializer_range": 0.02, + "intermediate_size": 28672, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 8, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "checkpoint_revision": "b1c0b44b4369b597ad119a196caf79a9c40e141e", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 24, + "logical_nc_config": 1, + "max_batch_size": 8, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 24, + "vocab_parallel": false + }, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/89acac1543511de63934.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/89acac1543511de63934.json new file mode 100644 index 0000000000000000000000000000000000000000..68ea8ffd46933ef1094de106382722c06e902017 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/89acac1543511de63934.json @@ -0,0 +1,77 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 8192, + "initializer_range": 0.02, + "intermediate_size": 28672, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 4, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "checkpoint_revision": "b1c0b44b4369b597ad119a196caf79a9c40e141e", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 24, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 24, + "vocab_parallel": false + }, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/a91139c3aee28b0f6c94.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/a91139c3aee28b0f6c94.json new file mode 100644 index 0000000000000000000000000000000000000000..c3c030ce11fe934a47ac9b35e592c13020f8cb04 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/deepseek-ai/DeepSeek-R1-Distill-Llama-70B/a91139c3aee28b0f6c94.json @@ -0,0 +1,77 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 8192, + "initializer_range": 0.02, + "intermediate_size": 28672, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 1, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "checkpoint_revision": "b1c0b44b4369b597ad119a196caf79a9c40e141e", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 24, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 24, + "vocab_parallel": false + }, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/29f3c7ef0e6a87f35788.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/29f3c7ef0e6a87f35788.json new file mode 100644 index 0000000000000000000000000000000000000000..f906b4847deeaa55f332d7cc289ff425109a9e0a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/29f3c7ef0e6a87f35788.json @@ -0,0 +1,78 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 48, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "unsloth/Llama-3.1-8B-Instruct", + "checkpoint_revision": "4699cc75b550f9c6f3173fb80f4703b62d946aa5", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 8, + "logical_nc_config": 1, + "max_batch_size": 48, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 8, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/6d3aa041c08b8396ee41.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/6d3aa041c08b8396ee41.json new file mode 100644 index 0000000000000000000000000000000000000000..3320bb51b7633791b098728cde07ea6abfe899e8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/6d3aa041c08b8396ee41.json @@ -0,0 +1,78 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 16, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "unsloth/Llama-3.1-8B-Instruct", + "checkpoint_revision": "4699cc75b550f9c6f3173fb80f4703b62d946aa5", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 8, + "logical_nc_config": 1, + "max_batch_size": 16, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 8, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/7523661354aea5f66d6c.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/7523661354aea5f66d6c.json new file mode 100644 index 0000000000000000000000000000000000000000..0690b8f1d1626134a6c57eb6f5f37ccb7620d0b3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/7523661354aea5f66d6c.json @@ -0,0 +1,78 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 4, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "unsloth/Llama-3.1-8B-Instruct", + "checkpoint_revision": "4699cc75b550f9c6f3173fb80f4703b62d946aa5", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 8, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 8, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/7c2b4b0f296eeda524b6.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/7c2b4b0f296eeda524b6.json new file mode 100644 index 0000000000000000000000000000000000000000..86ca282d2159a873b578dbcbb1b6fd419f5e2b4b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/7c2b4b0f296eeda524b6.json @@ -0,0 +1,78 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 1, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "unsloth/Llama-3.1-8B-Instruct", + "checkpoint_revision": "4699cc75b550f9c6f3173fb80f4703b62d946aa5", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 8, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 8, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/9932c1d05bd91a781c3a.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/9932c1d05bd91a781c3a.json new file mode 100644 index 0000000000000000000000000000000000000000..38e15bc6511de9330dbe671939236a99927cd1d2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/9932c1d05bd91a781c3a.json @@ -0,0 +1,78 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 8, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "unsloth/Llama-3.1-8B-Instruct", + "checkpoint_revision": "4699cc75b550f9c6f3173fb80f4703b62d946aa5", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 8, + "logical_nc_config": 1, + "max_batch_size": 8, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 8, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/ad521b5b119cf355612b.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/ad521b5b119cf355612b.json new file mode 100644 index 0000000000000000000000000000000000000000..bb118701c6ce26fdb8f2ee3223c204ebabba33c7 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.0.dev2/llama/unsloth/Llama-3.1-8B-Instruct/ad521b5b119cf355612b.json @@ -0,0 +1,78 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.1-8B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 32, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "unsloth/Llama-3.1-8B-Instruct", + "checkpoint_revision": "4699cc75b550f9c6f3173fb80f4703b62d946aa5", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 8, + "logical_nc_config": 1, + "max_batch_size": 32, + "max_context_length": 4096, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0.dev2", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 4096, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 8, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00333196986acf2eb79a+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00333196986acf2eb79a+431f5505/model.neff index 7ac01afffd3a1e31b35326141be0159314a39a66..a978b7c3d2899a1190213986ede5056215566c22 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00333196986acf2eb79a+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00333196986acf2eb79a+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cbff3da1a4453ede6bb6031b73f54e913150e13a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52c0497bb2f9417b413e7407edf5d7eaa44ba4fd866fea870205954a6bf774d +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..245ffce78607a2669e6c2cf8b4fdb5d9c85e3a57 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_025b98fcff252cba485d+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65982d84aa20c84c91ec97004a8f2b70161dc19442039b7d3b45b734229b981f +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.hlo_module.pb index b50cb77334cc1da0125a0e0a9ac31a79029899e9..cd7cab5e446deeea38d51590e68181a708706cca 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bb13bd85a99f6c51fdfe0a6b857954378132608531c1b9d446ab1844ce1663b3 +oid sha256:0677a23025fbd7931d9195daf02d5312e2da1158a7927ddd283ee33bec101024 size 858046 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.neff index 8a6316ce7d41f2162c6bbbd58ae8edf66f22a1a7..6824c454ec2d20f885be236afcf1a454a05320ca 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_061f22ddc7af0a5d29f9+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:283b815f75d0bf82f38196943cd73a0a564b23e0dc4232018ff3998c97a9bb7c +oid sha256:e22c01e02854f21979862b09571130be0a7968089cd9166a4240ddcb7d25e926 size 5786624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0661e1d8741e9ead0d5c+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0661e1d8741e9ead0d5c+431f5505/model.neff index 6486c44fe0e20d402a0266aca705dcd1426f02b2..839a53667f3f4f343ea297c1cbe012c4264c7452 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0661e1d8741e9ead0d5c+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0661e1d8741e9ead0d5c+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1769023600649219383891c1cf3b3c5eb2086dbe --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21e28eceb37cad9ca93db5b7d4d33ac2b18bc4a10b72fa6f41354d73a93b5595 +size 1661172 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d816afa2abd2658172be706dd3e8f82fdd35111d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_097b7e476646dbe13102+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf47c986e05a6b4ded732905e78b6b71cfd0a4c0ca2d802a0cb3922ac35f78d +size 3881984 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..40eff9e5e06de68280863f354dc58b1f474ebd91 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..48c060bfc566a2808b5ac053f2c6154a586b957f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce55f9f3b779172d357a166157f85e849aef70cc86fc56962d5dd729022e4b4 +size 773433 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..62d24c7aa08c4b60a05048a9020aace3028272f0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f0e297edf120891e834496626c5249d3a4c8b3d00fdb313de6e8c25f5f3422 +size 6237184 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..88c0f9d3936722ee015901655cd1eefffc11dcf0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0aacfff4eaf4af570582+97bb129f/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f130cf2e0d4e49d2a5fd646193917cb290dedd28df33ebc0e15f76afa7ed7a93 +size 6375001 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/model.neff index 0c52d88bca62f0471680b6ea35f28060f0fb71d9..e6e4d2c7b03e73224b0bc3065fe7a6e07e22bbc6 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a9904275e47a301a74852348f3d191d476260c0b5a579e942b475fd35d6ff849 +oid sha256:e3c3bbd7fc867b9903f6cb1bb028ef67eaea33732fc7afde7b4124bb04d5a50d size 1434624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/wrapped_neff.hlo index df9162eaee431fefca3ae2cce0445a8f1ed9da18..7b1e746af6e6e55067773af976dec10b2a05acd4 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b8b4fa5620a4855f332+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:598bf6c94994c9a09461e25689b995599f60fc7d7bca903cd5ebf32bce07f30e +oid sha256:5062513634c02e3976177b97dbfe83030caca965f6d94efff0074585baa8c022 size 1521594 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/model.neff index 242c96bcb2f4d88f08229248d6789749cee1cac6..052a5fe066dbc0db1c032f62caa0c132e6d71ad7 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:804ad495b5912a48b919944f97fa6d3ce25d83e98a1587d964e2742b4f814924 +oid sha256:1ab9e2f02fa29415c2a584da7d3a0dd489fa46185414b6a6ceda1ff02a0b7e42 size 154624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/wrapped_neff.hlo index 9495291a429dc206137b0254d8d5425d6314cc22..20944d74b5cd685ec7b965885660f201eb827749 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bbe60dde8eaacbc8218+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cd2d02036e8ca0155df726e5a3621617b893f38bf98f7747d64ed53a1bb5db18 +oid sha256:12294311aab65c8b1e1b69aefdf4cc623e27bd53029218381ec6a4cf66f7584c size 162285 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..3b2493c1b26278a4a34ae718e13972384636c4bd --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..44df9812265ba3722fbd610f911fe0228e6ca70e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b93fe1412edfe43e4d0b824ef6cc3a483f918e718f8a2140d7e8627e0d8e510 +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ed7d11536c193364516bf27a4f5de2053c5df5d5 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f259e869c3d6531c373+c2cadba6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae0036534d76e1308381c4a5a3a6429b663681816fd0898c056db27711fa981 +size 31171584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/model.neff index 7d42aa8914fd151fb77ae74d9de965e67fd49289..3d82017293d30b3ab28643e0391cf340c913f781 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:01872c9e47bfe8cd1de7112bbd8cc81654293fa719da9e5241fde748aaa594f2 +oid sha256:a89157420d03816ac2f9222a89bce907177f1a5ca48f1137c20a533f8fdfb10a size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/wrapped_neff.hlo index a0cf3289c89faa1c816e01b320583963288177b0..66e566163971ea284cc8f027409911616b1e7982 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f82fe03a3af29dff8f6+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d38053203fb2172fc6fe741d07a9c0155ebc44c2c2b39e08ab0ac71d98670ff8 +oid sha256:f02bf62809adc55ce64637129b796e84a3032d0036f542bf94e0f21ec5512b0e size 244319 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f1dcc172b637a7842a3085071ec1f5c0ede2b2fd --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e6fecd547e8919f61a673b54a175c4eee9fa33b8a93f82e2a7bc3ca585e952 +size 874711 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..330d44757f10b4167a12f9077c8dd4a1aa0d3fb3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_0faba5d4e9a33c984547+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9c0d90c5c4235c7dc27de50def577fd4fe7b292669b6019f8d21e54f20cd64 +size 31028224 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9fe9205b7b08a6659c20a690e737079ec28924c4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3644d3a934ba05c8e98acdb2da8a63f46c70f18baa46f9904fc3b29a58ef16ce +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..659ca112adf9de579aee583fa64e042cd6ca3726 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1845adad88a4d5ae3381+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbd13ab3d6e75b38f4b6611de0bf03e1e699ab03019b554122deab152bc17a6f +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9932c70d27d759d781be88485b74b17b49b4c04f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options=--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c4dccbe1d2bb154396c4f2e11e90a4ef6f5623b3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5928e1e3d71165915a25d2d9778aedfc58cd57ef9ba8621279558be58e16fb7 +size 136713 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f5ae81f4dd5ca9ae184522d91afbef8d505bcc2f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d4ed11977011ce5e7+431f5505/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8049cc5f3ba1f19852a0d85515d2cf31cd6b4ec3c6781035d679f01bc934104 +size 2315264 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1bce819dd943e86ebacb+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1bce819dd943e86ebacb+431f5505/model.neff index 936f1b935b5c3abd921c13c1f1c00b0f83e33619..5468bf0b8ad489d1215ef2ecc721636ed168cd8d 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1bce819dd943e86ebacb+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1bce819dd943e86ebacb+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9203cab8e6d7541d1148063a1b41e11e4b29248e4ebb6de7c273d6fce9386218 +oid sha256:b5877e7d3d6af1d8f7e8e8c85f364b45abe57bc0cd8764fef18529242aceea36 size 1281024 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f8a9f009f623782ff35dabeeaab840ffa02e24fc --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332a9f5be929101fd9b4daf5e31dbfbe4f953698ae1a2f981a832e76a33b9622 +size 772484 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..eb9a222efe49b406b91c024bf76bbd727892c8ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1631d9704457551bb3ff42e765aa7514fad478f7eadaa1971aa7b94b7533dbc1 +size 2018304 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..d567f803aff29f344308794c27aa9f697032b75c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1cb238717180fb6073dd+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71535347737ed3efae9ba23f072f45490b5353400eb86ce76280ce32f5b92bfa +size 2156630 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1d687728a717f87883ca+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1d687728a717f87883ca+431f5505/model.neff index 764fd6ac326128b4f7ea5aea5380d301d52904d5..011b0d7fda00e58143e76644f75ef7ee615644b2 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1d687728a717f87883ca+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1d687728a717f87883ca+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ed7989cbbbbeb3fa4ac55c13af2258e03687224ee83ce593ea62cd98508bc48d +oid sha256:7620edb3b2c01abe336f904cd409b85732204a2bfa44a10ccba787a4a0b474e7 size 103424 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9e22c8cdad672f2b554b19790a5f92c560ddabc6 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6da43545b6d9856455e6319c643a83d46001a0545d18e21faf9fb8834c1ae0c +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c5cbffd36f8a51ba4555e6619d221f4e85c8fd21 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea6ee6758cc98aa0e89+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13fc0a07b3ff0f4bf204a5618cd739509cf5a5faebc9f737ab8f3a8f3ede44aa +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.hlo_module.pb index d67af13a5efaa11a5ceac69ac7b0b50af8159476..07ea5de8d4ec025011e713c79a814335038dc333 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:be30440dcb0ade880599dfcb928ec84de7225b98ec2da5c608bd894ff8be8526 +oid sha256:bb3f3c80a1f760b0f801aa56dd94adcd18f8703faf4fbe1cf4629086b0f3ced2 size 87785 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.neff index 165ca7d4e3a3aa9d4a97b92ab9b90504ffbc4ca9..742722e53f4fd051a3749048f32e1f71c0a5aafd 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ea7c53c16e767166083+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:958720d92df0c3aff14bfa33e9c2145416bb60052fb1938d522f70486cc76d49 +oid sha256:7bcc37564d8330894550bcd1c560c819f27452fc9a2dccfc5012d25347f52f7d size 246784 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..48c060bfc566a2808b5ac053f2c6154a586b957f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce55f9f3b779172d357a166157f85e849aef70cc86fc56962d5dd729022e4b4 +size 773433 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7e25ff158905791cbdb93cf6224daf81fd439e86 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f94cffdbfea4fc0336ff9ccaf90dc03a7bfd77d3a71be20313da0dc71ef9497 +size 6237184 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..38d09ae4d4dad4c7a3ffca6637aca99a7057fb57 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_225aa072d587f98b83e9+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bbbea7128e540afbbea21b386c191de188036d19746af61dc98d04747f462c +size 6375001 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/model.neff index 69839474a29040c92a41c69b7a1add0dd27e4610..46bf13757be27f687533bbe52663054aa1449305 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df4eb1e63cd1ffbf4ab279d7e12dd2e33b64282a5c61cd137c3b3a415fc8c22f +oid sha256:8c09b60673a5f6626e5e43ee91b19cdf385f2dc3113114ba3212f31b086f1fc7 size 216064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/wrapped_neff.hlo index 8b003de1fd4936ec5846cc6af6c12301a4481ad5..aa33d546563690ed627a67157abce1c79029e277 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2371c90829406a620831+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3fde0865fb4c144e713bc17c222aa569a5526c4314f2932f74e8ab8da6f592cc +oid sha256:6979a724da90b05c60b1f6049e232b513dd03d8d1a531e9c0704643c8ca737ab size 223770 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cc99646ebd68dd496f026d8f1acd22e08ad628b2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b48e07355c617bc22621ee00de7b4f93dff6de0c903824675c3140857a0793 +size 773033 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3929331e9e493189742684d53a1cc6ad9c0106e0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c7d6a586432b3fff46f9f556c01d44ec0a178ee9fe3076053e86a789f50c31 +size 3113984 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..75902d715e1aeb5b40e85f68ca153a14861c63ad --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_25b514ebfb24f7862617+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66f4d15672a836e4c406438cdb87324bdeab2162f9222a2a67ddcc31b470522 +size 3251801 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_266c5c386fd48dd67015+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_266c5c386fd48dd67015+431f5505/model.neff index 61042b7da6c0e8b7f8e44a85675c3ba0066fbc42..05d17b15f3dde62ddbeb6352d704c4fa97d8d9f4 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_266c5c386fd48dd67015+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_266c5c386fd48dd67015+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..aaa604e938fd44a4b5268ce4abce8f799574ce04 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4293200d1f2ad90a66c02cc4879fee2b3bfde501b7151fb610370054aa2c3da1 +size 1789812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..47c53bba9cbbf4c6148338cda2393f7637c835c4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2716a18eea591aaf4f20+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8d4c62cc926302eba61b35b1e5cb663382805dcbd2e250be83d3c6a825f05b7 +size 2520064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.hlo_module.pb index 14ee441a033ddfd1efc8fd33c43927334b4ef363..74f4328c100742b54a0da08568c623fdb58bf8d8 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:edef0cb1face52bb242d9a790c72d9759b587093514b2c8ce8008dbe00073dd7 +oid sha256:291711a5dd69387c68f5d90c715f4279533a4c872e22ca0cf368e4e452231d49 size 81323 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.neff index cecbba8fcc7aef777908ee336af310694e1b0d46..a0f98f0612db6bf34905e5bd353636651630cea8 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2af3b88e8bfa7573c510+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a821a9c6a2e0b3a220c3199148c0356162db26c15687b2a2a52f0cfea43e84a +oid sha256:21068e94ed15da4166d08503c40bbfa65fb0b048bb3ee873fde12b233f4ae681 size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3d632eeb2d0079a9127c7bb3bcfe943348eb646e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d93d20fa61a0b1774c81751ae669689205e1ce1d74e195214aa95ae5623ce6c +size 2143984 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..87d025ac7ca3f12c0eaf76b716e1fdcb7f709988 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2e79c5faf457fd022d25+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb94912614a59b8bf4dae70448481973fe25894e3b3ea66d75e8caa7366f9d0 +size 3482624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/model.neff index 6fd6b838fce471ed900ffd3cac697b95d6904f4c..02623580a92f2986a82d058e771cb3d0a5146d8d 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d40d0f953b8e8f1f8da278f4840189454eeeeacd84a81ffe76ced44ee38a383e +oid sha256:f01ec781276063d1550d6620dffe2d414e727480955959ac21331622c17ccf53 size 164864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/wrapped_neff.hlo index 1f69fd409122f53302a446c123f554de4410ee09..c405456691ce1123c5dd9b686c63ac696cd4efbc 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_30c8e5dffb371f5a2fc0+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3b3ddbeea4fe6cce73c76a648a2ff3fbc2f5e478fa82a21b74481c444ed044a7 +oid sha256:bf1d4d6bdee08e32a94cb51eb0d019d7f562f7dc69546a7cba310828a021e389 size 172461 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_32b878f811b89114a743+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_32b878f811b89114a743+431f5505/model.neff index 0ea80b705f42e6eab78f8230ce416b6bb8d0b0b1..1454977989c2fa71c93b44467908fbb896400e21 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_32b878f811b89114a743+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_32b878f811b89114a743+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/model.neff index 737867f4ee9f025a78b6e0b039a50635064baa71..73639e4d4c899bc446f9c311deedb8d76b90879c 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:245e36d2cddc4bc9c22b69541385aa3e931374a536043a381fec31e4ccbc1519 +oid sha256:2db38c3dbacf8dffddd1a131f519bdc432f2789f24be07d612ec84ba1ad86e7e size 3533824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/wrapped_neff.hlo index ead0b92f12ec05f3c11fc30c6a542e4e511f2110..0bcc69c52ea9550a11cdbf8de1b63f6d741470cb 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3596a0566dd0e4bfadf9+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5310fbbafd14f9cbc517e97502f85865cae586e232929b62f1caf36f39a73bf8 +oid sha256:203853af4a81bc46f26c852058a69008bf1d1640987f5c88a0b498e3a13ac7b6 size 3663806 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.hlo_module.pb index 2b2fd0b66e3352c17e64c82b94cfb9afde0123a0..357a09cc68ca787b762d016946e1b412289ddb34 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2df4e5b5cfe0c06198f58152217a38cf59b80fef21e3d0b9045459d9a86d80e9 +oid sha256:785ffb37d0114be58bbff93596d1905917de36982edf639ad3f6b98cd5e43415 size 82573 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.neff index 9689c2e5ddebc0c78f506a5d9e63cbc3464dedb2..36c8e8e483c611c945a8f4104c982de48893bf5a 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3829e8e6510db07ee7eb+c2248236/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:420532af544c0d6e179ce7f817ec1dd845218ebec9d57a9e92bc858aa0c6be63 +oid sha256:f2aafae91ecad0ad9b888bcb669b64acb2929ce33065e9452bddf2d2d8ee4a14 size 359424 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_39930d0c2120289c9c3e+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_39930d0c2120289c9c3e+431f5505/model.neff index 1e4da87676368be198737969517768a68fdf16fb..168e202205361dde465a8b78023a14daa268811b 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_39930d0c2120289c9c3e+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_39930d0c2120289c9c3e+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8dd4666666bb38ca96f9f028a3d44dfd55b6ef7e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6467c23f65b4e1cf85e7d8d42844debee91b8214cf4662ed17d093581c5cc12 +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b58bc15d39dd97d877eaff16dad024c563a71805 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3fcde42e05c364259ae4+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c564da4ed513820fea7e8a765005c4a821894e8798cbce881638c90592aeb3 +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_40b0c067485074fdf48a+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_40b0c067485074fdf48a+431f5505/model.neff index 5bce122b9e62156a4a01e31200964db7dcbaede9..2ffad384663ce2da0b032949452d86872fafabd3 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_40b0c067485074fdf48a+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_40b0c067485074fdf48a+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_46b9d2bfbdf1b2752484+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_46b9d2bfbdf1b2752484+431f5505/model.neff index 159edba0ffe591e88b02ddac8a1d6b871ba1e258..692bc10dec58b206ccaa112ae651dcbb650b3cd6 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_46b9d2bfbdf1b2752484+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_46b9d2bfbdf1b2752484+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c726262234763accdabd975e27c9948bbbf4cf1b2c2918b9fca65f338ed6f73 +oid sha256:82b6371144cf9c14b0241c348d02996e5997df9694353a59d7657009aa4a0626 size 1168384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4c948ba1d275cea9b124+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4c948ba1d275cea9b124+431f5505/model.neff index fab3264107bdc6d1074ea95c75cfd58030a7baab..95dc9d108b7a7133bb92bd1cdbbd17fb92ff31db 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4c948ba1d275cea9b124+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4c948ba1d275cea9b124+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..d0de290d4994cbbffbdb4df818224f3488d981f5 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ee5302006f5261c8a5364810b502e977177edc46 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e09d3057909f88c501b6ace030dc0d43bc4438e83932d587b19098ea653e9d +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..07b0b9bba7b31b6503b216a4ccedcda45b3875ce --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4cc296fe1b7abcee7c5b+8afcc287/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d53f1696e8ef5162c366e0fcfbbaf608ae7bed8dfff739649d482fea118be1c +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a9edf7c07eee7492f09299b1504b8a8e8057215c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9892ab17c6774324486a078fb89da8c211495929fd88b6c08aac476252ec7aca +size 773033 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..baa5bb8cffb53b11be20a272c0305f515431c3fa --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2205e1fb7956b6c78549ca304ab2e432a4223d7cdf4ef3445b579f18991224ed +size 2499584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..d2217f7a418fdcba02761194443c865ade8282c5 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5011cce3a1b686f14b46+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d748e5bab7eb9bbfc7970c4d11ee7b29d507fdba2f7593cb5e6169ef10c4f1d2 +size 2637401 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.hlo_module.pb index b86e1122e462e3af04a6690772b2052f77b4e0e8..2125dd117f8003a3eb43d47d4ebaf3b89e2a2059 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:203bf226d003dfe6501f325e9c71e2969bc4353247115a6f22000287a427b0a2 +oid sha256:e8dc89c6b2f228783a4b7a847c419d01d23623bb1c36c7346580d9b8f877269f size 456914 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.neff index 0f86aa640d3cc2f00da3f818b789ca1b3a6cf256..fd3f30a45f7c18cf8857511196d8e984c32d92c4 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_51d7ba87477561ddf31e+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b6cfc1ef16a092af729d7198d8c9f7fc4ca7dc4c26485cea0ae06c3cca2ca0bc +oid sha256:8e6440704e13e17efd6a9115b3ee8306b3906f06fc8106d08f762dedfc26408e size 31376384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.hlo_module.pb index e1349ca59f40e551ef72414ef1c32524a43711bc..25bf0ffdc848f50be1bd167e231c8b4a4cba283d 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b703bac247d3385d23982597cfd18d0a2c6be31f48417b503967416a76488f9 +oid sha256:9ba61c6d291ec0b9899feaaf7fd7f0af72ca6ad6e816b7bcde96849f93307a29 size 843436 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.neff index 8127823671c575b5e4d3ab5f5682caf5694bb79c..bfb3ed8cd577524763afc274665ccd228539c9fb 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_57e3cfa23bd65e42d62f+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:efda9e5d532093900037dbf17bb0104b642ecd584fc05b0bf415a5d09daafc79 +oid sha256:fba7378f7fee82244d0057a8d4f97c6bb2f886fafd3fa380709a9c9dd8587016 size 35533824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/model.neff index 61d6e1dba10430541093fc57fe2f8cf9065c9282..bd52c653d8f5762e01ade9ed2f069497869146b8 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f79efa214162d017c10988ea700a1d92682a164594b65debb46aad1dadc2e8b5 +oid sha256:39311f8dea15b407c7820c48887e5274479782b917cc9281bbd0f759f206ba83 size 185344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/wrapped_neff.hlo index 52ddf69610a94556508a2b3967ac77aa2c11f9e9..d6a9f07914f6426dd66dd4a1b5c8d4772d0bb0d4 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5a10198534c5f2725fd7+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3aa3b1e98368fe8ce7bd6bd640fc378543434f18c2c1df3c23b2f0a4d728f759 +oid sha256:dd188af2314d5a7eff13ea15abc949171cd513fc3e3d699549f36bf39dd1fa32 size 195507 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..351cd71e8997957e0ede64a72807c5fa845feed8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2711d1a721a01baf204ea9e97eb708195a15f240d8bd65b796009607fe80f099 +size 1565304 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..65012ac67c2e57d90c3d7a44676e69763f87b9a1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fefca4728e29af5f535+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b627b538c817e80aaddca5082477ebe73c18498b028bd8aaa50f9acb99785b +size 2591744 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/model.neff index 7bb7878e0ba4146d27a50a36e200a0800e523b41..0fe22e64e38d1b291a4c4719e59494e661f54328 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a4faa2b4c682ddb3d71a021c1e8a1fcbc810c24e0e06b449e0941ba7e48dce8f +oid sha256:4bc6d1bcffc98a707063849584bd777524ab16d99a9b36f43a0c97a8b85341cb size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/wrapped_neff.hlo index 47f99e02c5ead76e5942c3fc31a65c99040f91c2..91def0f685533e6ba7591af6311eedf398f790eb 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67377aec01dd303d63ef+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4873c291e5cb4f8469b3b41b65165dc55aef5ccfcd217d64b4ccb2abd6f8599d +oid sha256:4dee33a8f0104c3005b67b596d1d3ef787e7cd23850f1ffac3bde7c6b31e3c85 size 244319 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e04c4d1590cbab0f681e2026f4f0d82cef535697 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334ed4956be2b358f129ee3db200a4bf138f5001f29d06574c83c07ca8aed4f9 +size 1789812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1468c55d94b245d3df14a6a2b9744696b6af1e24 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_67660d190a903f2f351f+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b0c0f835a9225f92e6adff858bdde2e2dc5ec4b4775b9ddb26c9949c7ce61b1 +size 2520064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.hlo_module.pb index 596f025205726b8fafe50ab8d26d62459dd1b4f1..6018009af437dee58def76e11803ee14b43862eb 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:21a3f8e14c1aa8040ceca813acc17e532d6fc18e01594457ccae96067e2dc429 +oid sha256:8595de39b60526028c04b4c6d00125d4521ba64bce786cf02368b76977ffdad0 size 50076 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.neff index 127381ac01a184953d866956a3f2acbccdf4a230..a989d8e45cdf8d4232e0c3fd3460bf86d69be29a 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_679852c8ccd2cff92dd1+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fa74edf92d2bf09eab45b626bfedaa14a2cb593c0372ac5bf4bbbeca3043419a +oid sha256:69ff807748f08a32821febafa966cdfe8ba5def5c664d1c6d02826fd2ee94358 size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..c3996d6ba369f652f0f05d1f183ca3c9e9f32acf --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..48c060bfc566a2808b5ac053f2c6154a586b957f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce55f9f3b779172d357a166157f85e849aef70cc86fc56962d5dd729022e4b4 +size 773433 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..caab05a40844a1c2036faa8d3a2775abf3f25152 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327275d915349b86fa5f5466da49d9bb1753645c98344b17f688cef2a78df53b +size 6237184 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..48e6c1378f6f3d730c02115fecb60ec36f0c54ce --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e4efecaeb594ce776fc+651dae50/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053b08cf17a262168a05ea5c80012a256d92d76bcc7f95fb55ba7bcd3b248f6b +size 6375001 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/model.neff index b15273e4aa3d956522fadd4bf2e9fead71ea2669..7a146599bba83a46134c7b71185ca33d6d65f95b 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:555984b14655f0861a0339c74f5710d1f798c50924c82e902ef0b828fc4b161d +oid sha256:8fc0b3513bc9d5aac316a65397b2ca7cf9324435e864fc965bd48d5b8659044f size 8725504 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/wrapped_neff.hlo index 5f833f94ac27bd3815e24da36e04c2ff0617115e..3ef8df0021469c03c13a0cb7c87b682e2e8cb368 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec54d1cb60ff01fc2a1+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67ad730cce63a62597856d55747fb4851ed4c2752d0480964116efc51a8ec7dd +oid sha256:97b0bb5c0170043e3f760308c54d4c96cff4c66b0fdc52d19d064e8bbd6ba438 size 8862755 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.hlo_module.pb index adb4fcb03b178b88e5c191ac4b567909b59fb5c8..72151e6c720e2b3e99604524a20905c9a077fdde 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8623fec92564afd3eb9768c1d5533b631a2419b8ab622ddca1f2c83620dcf8c3 +oid sha256:b7dce04cf5169e7d7109611eebcc65efdf248fcbd2877b68f27e8f5211549484 size 1072456 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.neff index a90bda1ac218564baa696563b5b6dc120ab8cb1c..8f86a635d0094443c0dc6c42dc1f92fa063dbde0 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6eee1d2655983d3e332f+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0d017a1e367859eb5e59126b30a53d4c2233ff8abbb5edd4a43cd95f53af8391 +oid sha256:ab674f3130a691cd1e9ac273cc21f5c8cdeed34d59d5ca471aad26ace63bbc32 size 6605824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2b9f372659ef1a96c4404f7e7e73242988f391b0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2a710f566a2d1f59f90dba87a5350c8ee8e8d21aba309ce32afcf049aa0eb5 +size 745782 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2f29f69c7ae427c2ea4d6de6486d97bdb2f7f806 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfefac025bf42101ca37f7d1740c85a4e7654c060aa481339a530960b7e96fac +size 4998144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..ad0aa028c21e09c7baee63eebcc55fc6bdcb1a1f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_73ec31085ec199e0bf87+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c85276620308cf543f4c870d3661766b5b6b4fdd85dc8c562a0500034f9b1b +size 5169870 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.hlo_module.pb index 9b12403ebcb229ec08ef28102b4060b3a9a8cc43..f6f45609d733e98fa628e247cbf4f4c64040b3ec 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:34d4e10bc888050ec26d9c3e3aff814775107d3b688ba44c41c34c4a61b6d37e +oid sha256:3911b9e19624e2d62f7d180667f966981db8d75fba37e5f97e83efb5bfe119da size 87785 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.neff index fd76e7f02f2922bfcd9f01269bf29b5aadb2eb8e..55268d0057a121cd68028b5e0ae16ca474cd9c64 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_761b3c734083fe56af68+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a84945df255da71d092b420e2646cf92a7f33ec10f41dd16b79373641d3d2ea +oid sha256:3a1d3978e4569f994a020271ae0831bc5643a917923e45b4c3348aed583775f4 size 246784 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.hlo_module.pb index c68e5b1ac18247e502a07da37dd9bc8bdd990d41..1627088221d0fa812c4a968a72bc1273c515f7fb 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b56b00da30a983c25b7e4e0142e6e79082a607608bdceebe17aaa8a061a9516d +oid sha256:65b142d87d876dee57b5b66d54c21bf5a9bc73b3d63a32d4ffd01c46fe2c82e2 size 80469 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.neff index 482fecd9eda6a4eecfdd38f0e3c4c063857e900a..721c228ab64a1572b175cb9581b751dad03b08f3 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7850f8c16172e0c763cf+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:26e6633856f2b6f2f508f3a55080c9e319118be18dd49f9a82973ba6988171d0 +oid sha256:fc5cb8e6b7db67bf40c1e0170697533b941b247d1324c5fc287abf11640081c4 size 205824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/model.neff index c9d9ea1bf392ea3a67c45ac3c1f8a0adffe2db22..72ee4ab9b23d858eacb53ec76014f8351f2bb05b 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:083a85082fcd636e5983308405202e4f0c67da1f77b075861736362fadfb806b +oid sha256:d0224d883f8020fbb8be6d472705c13d81bf4f3f1a27ad3bda24aa3146372572 size 185344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/wrapped_neff.hlo index 724d734316b5352ed3d15e3ab5015fdb81218da4..ab3fffdfed99a4ac8d5d16069e703fa9e8f45088 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_791f80da2052a6cfa05d+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ea66972c5360b773fcf1fb6b81bad2ede8c4d596df08ee43e37ccee8bc597104 +oid sha256:eaf33660ad2b95a5db5021c668111bd025d45020cf0a23ccf8fc049154b661ea size 193114 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9d315b00a2533426122184731c16d10c7c3aae75 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd447798999fbb97fff82cb7a5bd0cc8bf0dc8040472a26ff75021bea7ece392 +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..90d99f6315288179985fc3530042d3f4e443476f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_796c64ab3e80099de463+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:defd23921a1ed328d7549614718da2702e6d68886399d0f6baa4569889c336fa +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c7c536a078a2c0f91a7+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c7c536a078a2c0f91a7+431f5505/model.neff index 356343012c68907bdbf9c209143ef9279bde82a2..1610224b254f298cf5f0e598b58480b909b2701e 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c7c536a078a2c0f91a7+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c7c536a078a2c0f91a7+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6d65eaf41e0d913ac1ed0ab5b10ef1ebf2c03c39 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ad0025306f4a788a5544f116be695c8058e05259f57ae3fbfbc8978955ace9 +size 1888271 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d7d2683361698b14926ea4082ddf87ac99612485 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9122130ad37e5e9b751c6d09dc45e7d9cf9e45740c95fcadf87448b2756ecf4 +size 6534144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..769fe00d2884897c18d5d54e758b2b8481ed2702 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c80fa99c1314097c5ca+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74623aee5b9cbb27a4b291bdc59320b756618e07f60dcb01433400d1985acf8f +size 6965264 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.hlo_module.pb index 4602d1f55c0efe5a8b8a381113c0e2d54e715592..2d16df4d61f7ec5889998b2629acc4d936367f1e 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3d4db8c0c8c7732595c80eb133486be2017caffae8cb7d5f0f89628c1f218f1a +oid sha256:f61eab86b4c8d3ff91c00c1739d222c4ed2b688e4625c4bd8cda0e80dd81d38b size 83368 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.neff index b2f974d792727afd4811311367f0183fc2a73901..f84dbe31ca5f0e7ee9964afc1d5c138ed65435d0 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7d84a4cdb76e9616c2a7+c2248236/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6cbe5f9b4439f98065f40d0fdcd9cbaa50b902c0221d1b3171a99b67b85b4f04 +oid sha256:a833e92f3439f4b0359cb62519c02c51dda934079f1cf31e8ec2b8fb2f091c51 size 420864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.hlo_module.pb index 261fd2b1900b5c7f65a085fe6fb226600609d19a..b3e09794147aa46cb3586f8df0df755a69e7d0b8 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9168e842c91c40ca70b37cfedb1caa5f11783d458ce905b3e1b5a54ff52a34ab +oid sha256:b8c3291c3028b7cc44e790e359a20c4a356dc8317135a8920091635dc195987e size 53803 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.neff index b091d90b20997c78ff0244445dddfc1b7f83bce1..c9f55811dc28e3c37363b9de0fa5c277e5e69327 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_81e0fb8dfd58e42d4ea8+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ee2ec50d9b46eb7d0289314a5b6d41bf772b0b83fe8feac3ae2816007fb972c9 +oid sha256:f04718f2195a2c1b43c763d1c97db3bdca3078632c6d0f8a05ee89c442b6f708 size 164864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/model.neff index 0f36b2fbc61e4e566d10ba2652913f8ccbc7570b..dc0ab807fa4ed801936b627edbda12c79d239e49 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b846ed30973986650b0098ede9be709e3c0b79f1efc72cd94d13c864998b4064 +oid sha256:4041dffc23fbfabef08cc959c1cd21aed5b8ad5b9ac0dad1a8a4cb6faba17fe9 size 185344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/wrapped_neff.hlo index f3837b7e96558df5344393353198cea97f66c3ab..8a814d634dfa89551774d83bcfc3c116ebeb0a85 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8bbedb082fb6a65e221e+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ce47d4b752466288d1630fc4dbc9bc577e997116e9dee7ac3af5e135e32e5a8c +oid sha256:e7962dec34318c62eafebbb03c003a1515a174f5348826c9b222ff2d8e3947dc size 193114 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8f8f2bb409247485b54f+408096d6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8f8f2bb409247485b54f+408096d6/model.neff index 0d796feeb7a0c9ba71c54d66823b988468fa117d..44930b780879e9685f9edbc28768de7dddecf942 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8f8f2bb409247485b54f+408096d6/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8f8f2bb409247485b54f+408096d6/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b33f95fb786aa7f06d31f3c6af955c18c15ccd3b5316d905e00eef71750bc1fa +oid sha256:e63314ff7255f981bbd68fc19cedbbbd15afdc387680049b8d97f3c03edd4bcd size 2683904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4e40528b2c1be3a27a14449d0ba0f52562443620 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c0c1dc5cb13b2021125ba93d8b556d84bf6c87a60e4f795c4291c81fe88f5a +size 745398 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7cdf73e4e939615292b01e39d20b03603aeb1221 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c5c1d5d0b195b6bfd1cc96f77e336a7dc7c21e2eed0fde6e08f1c9c05b55d1 +size 3820544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..ce003f78a177a5e3c03edd5002221145adafab6a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_92cdc4fd3b2c266a1f01+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb18671f4a5a4444ad1077fe5df0c4c2780f1297bc01724d237ea14749be0a5 +size 3992270 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..31998095ef5da96d478d824cc63f0f03d7474ac1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287ddb67e3d9191bf1a53454e958ae2301a287dc4b2b02047b1637341772e767 +size 745782 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8b68c1cee78c5a5bc41b7d59ef606a43199cde35 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b27c9c07e348b863966047feef36dd6726f08397a79367c8ebdca107df5342c +size 6339584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0f4e2bcac16e9491fd498d8cb0ef92235d758f43 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9461a71f0b134dc8d40a+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251cde90cc98ce530bbacfac62e4d22c0447107450128460a03fbb5aed1eef70 +size 6511310 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..21ec3dd36acf696ce490381ddbf4b3bc612add5c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55ff68867c5bbfe5baeb0ae1da8e8c750ebf33f6b0a7eeb15b3e321e3341c207 +size 1910639 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8a0365632e966c04402e874fd4dfd92ad1d63c39 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34d28013bd783aed785e0a65415bd3e6a302b9e71e725e981673f9578b547c82 +size 6738944 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..db90daaef2c33ea0f56fada7c120ea9eca0eea7d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_94e031bc9e9d532910fa+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e701f41a85478a6bf91c13c18d8210ef864faf4379a5d45f67b84374f68df9 +size 7082519 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8bffe6187691159db2605f30cafdcfcdcf53a100 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc07323d8dbde3248d4aadf4a9df1d0970b39abe7d1123e0ffebab560f9c193 +size 643836 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..19f14bc663f04a5f5af353b7304062f3fd97fe79 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0608993395a01bc5bad1706fc6360f1eec0a791b250e6c6aa9d5bad4dfca8a01 +size 8725504 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..799db8bc3031b12473dc63aff2f544b108c38b1e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_951c8a5cf15504464697+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:997a46f7771c6ebbb8c2e04128eccb78adc3b01a8b9fbe7ec1621604a482a110 +size 8862755 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a042dec7c8f1bb9bb73+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a042dec7c8f1bb9bb73+431f5505/model.neff index 775809132a87e1e0c838438c4ac2cbd7b6545bc9..bf4c14732768a50c46be5b0cf9124efe046b04e1 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a042dec7c8f1bb9bb73+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a042dec7c8f1bb9bb73+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..465a5c9f13c760886fc4a7728a5aaf3b20d23801 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1d004a3cc933a8e48554473fa7c83168bdcfe66f5286ebeea67f8db25e30ae +size 2327880 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..92ba90fa6fd2f4d64c5d8e90323a292c82657e65 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba292be7e7e441b703f+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af0e2b1e464816f528cd197528a0c07a22ab283512fd6ed5f87b99c561f8073c +size 3390464 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.hlo_module.pb index 3b402c4112e8b7d56c5a616fd8f54abb4cb144af..ac1c1cbdeb45a22e8c938abfda2a718eb2f8ca82 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b6908d54bca8a211d0dffa4cf560854b7a4be047dd1bcafa722b6042b61dfce9 +oid sha256:9ba6755f76044cc182adbd3f58b2f88e3647ebe64d521e294bee38f33cd7d099 size 82571 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.neff index af8d777e0669adc47cd71e77afa3b93f2894211f..7a7036c035482c95fe179591398f40ab70c3844a 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9bef1303fb9e21c6cb66+c2248236/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8f6644c9cb41ad344495d66338defb8e23dade921574e01b2a8754de58a22ac6 +oid sha256:67ed7c62c7882a05f20a82c1070ccebd3b96ebccab601e9985d0d9d470ae03a2 size 359424 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.hlo_module.pb index 787dec80dfee21fc28b4e3f2033cc880123ecc79..1654cfc00a632ac0cb2fcf75f4d89dd2d5d75c8a 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f1708664f78e976e8175f18544260a1c733680a8d6e7c311029aa765eed8d8ba +oid sha256:15a1f8e05a86a5c8f515e1c034a06442d19fdc3f1674c0fbf0e3499011b528c3 size 83920 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.neff index 066ccc7123a88fc1e38a4dc4b5bb3443e414de73..21da0c1439b8cfc9b6a7039588fbd4d8c7a400b9 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9d325789026e6ce273ae+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:22447903b596e506900050be53f7d84f0f7f89280f3b27c43ee2f29244455765 +oid sha256:7d25a3804d66b7ff656ecf5199d0baded3622f17e660ef4f4736e8734c1b0938 size 185344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/model.neff index 3ee85c05842e13e541b72d3064822b9a92daba0f..fa00256331c0cabf14d56a463c8d19d3b5f962d5 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e1e12ec9c623c659ed43c52a9114f67490fdbcc082437851105518bf1623b20d +oid sha256:dbf462cdeb496241af30d672b2e4f91b7541fd490d67691bee195c614e1fcf79 size 308224 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/wrapped_neff.hlo index b09c7ca21e06fc59827b7ecec66858cdad7b5db5..f767a06770c98dc1cce417af3b62edc988cb0a19 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e2025b598171192a3d4+ca355898/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bccdb46848f74e34f44d7f485f601a466cd58dce8fcf657c58697c0c52ec3744 +oid sha256:7f4b338c58fc56e5397fbe8016b2b3780f5a925cafeeb733a1e0554aae0c5e48 size 319522 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.hlo_module.pb index c8860a02643a0001de941a19eca194bbd6207194..bae7532e62f87dd96aeaa2c2011979cf73338534 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dee883d59326309a6a50fd855082eed95da01f743fcf5dfb4da4bcc046074869 +oid sha256:44b160039d090f8d029b08fb98b9ef3a9477eb4389b4b08b4410dd67a09e9af6 size 80469 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.neff index 372306fbe5b8aae0ff985d52505134946c61a572..a1a861c4ace0aafa314e00c9e59e651a373e19b5 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1746e7481045e1ccc37+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3f7a43c440b008cba04126a1cffb18954ad029882e4533f562f2d6d10f756c83 +oid sha256:4972af6f4c52b9f9229ad3866e5d54a272391a1839aafc8054159655bcad7619 size 205824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/model.neff index 9e00a7374e9f673b890606afc5a94a3a87deb5fb..c15965095c8cba5111015087b355d4641c3a756c 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eaa215446b250eebb0719b48f07d83dcfc26aa97ecaa8bd347ad1b87cb5ca63f +oid sha256:ac1f5e0c4b538ef4d33b7c9c03dd4d8c636770d739a6395af324e36dc2a9fedb size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/wrapped_neff.hlo index 85e4f5d945d4f50944e4df31c56bc5c24b57f34c..99896f8625b657e4bed8991e55de90449186f481 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a20343aa93b3e4cbf95f+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:444ac0bdb8e8a884cca9119742efdcf34bcc46232786a13def6ff0fb569b19f6 +oid sha256:c7e47c8d6011c2921e8cb2c32b61ce263b5c06e42a22d81ade3f0e63d0c49776 size 247153 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9932c70d27d759d781be88485b74b17b49b4c04f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options=--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1f84c3b89b02315c1d279608f358dda5906af751 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef71906b1d021844eea2415d9928668b43bf018232964fd9029a064bb9b0ccd7 +size 136009 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7892eb8da2a6155eb3dda6acc33924c84dc59f36 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a3410e1989f6ba8dd0bb+431f5505/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9175f5fa3964832e96703af015bdef337ac74d03a8d50b3fa6f9850f4b6f8c5 +size 2192384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4b7d22d92e285308be8c114ffa5887bf3be0bf4c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59cf7db0eead3c13e358c6914e26d5128c90c98f9c72406f37ad1b0832396c3 +size 744990 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..effcb2464953e72ab1cf8351b611b26969badb59 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4f75ccbe5415a3bf4126696c9a686960eef46f097aba02031461711ae474fbc +size 1997824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a66a23f5f8ef2aa3912d178dfedf2035ff37c0e1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a49b12b082ce2bdd4394+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ccc971d29fb445fb7a519fdbef9850ec9cfbacaa6c2b3bce66863da44c68c2 +size 2169547 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a963e9aa5a33fdf44b01+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a963e9aa5a33fdf44b01+431f5505/model.neff index f59c36b23501b034b04a981da079fd7ff23320fd..089d2fe0f250f49558924ccb8fdf25d122a634bd 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a963e9aa5a33fdf44b01+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a963e9aa5a33fdf44b01+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a5e76972a894223f1a3dc025a3f2535d6befa859aa54d854153fd8ec1f91a0fd +oid sha256:01b6e95760b38f249119c0916517c0021346d8c7908b5566fffa0ccb5067cd11 size 103424 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9932c70d27d759d781be88485b74b17b49b4c04f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options=--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..76102661e28b8fa2b7042c6b4336c1d62fbd85b4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd97a5178f1294bcc60c1a3a853d5892aa2f834138a2cb73035a98c01302618 +size 339944 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c02649911b7bb1a002faad4da699504a3b8c8dba --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_abffbaee6c01c4e3d2c4+431f5505/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922850e7a45fe1ebd7ba3df3ecd0e7f8febf582c9c538e7e78cf7afe20a4f645 +size 7711744 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d7470aed79d91cfa86f4f98fcaed3980077956fc --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a21988309ab35c792ff07095595756d5704884e71a5b0cdc3b7f38f42939190d +size 745398 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2d502fcdb8c182c0cc9bcb18644c70a8397a544c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735b085988e657797e4baa665bb99948a76f80f479c231e06baa536dca53f266 +size 3083264 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..5d5a53f2adf2b11983697cff479d2db12f14c91e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b19bd1cae910012a5fa6+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:247da6fe93a0c8e1d0d534ef5141d56dc23cde617f9b4231c3fdea1f67e523a4 +size 3254990 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/model.neff index ee8ed64d46a7c0816ddd41009e3a387f050b205d..ffd9432ccb8b448b3edc8fae5fffd501c107267e 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:042b1d0a13e7ce4add4997eb51c95ff916f9d5a1a4e9ad372f61ddab5c909dae +oid sha256:e99b5e875fc8436e3e28b9aa4eab699c40bfe177c512cf00b8642f94c9cf0995 size 1455104 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/wrapped_neff.hlo index da92b4d323b4f54de8c45e26fcd94d9839b72b7a..27daa0ea1aa2faa26612044f80f53b7ba883f5e9 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b254587b1ec9eec17e0e+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0abd160f3e9d722e3de25250bcf7c8b5f106fb35dd64ff3e6af665f95324f3d5 +oid sha256:a8a24fdc65289021b8b6e1a20c0e107d16bd3cecc62faded4b1a06ddc1235f51 size 1600015 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5c198c977e9ea4944d4dbb3d89a549ea06998dcf --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20cc6faf99551296c87aed865cf33e7b5d9d680545b16bdc0af35824a6cbc7ed +size 1789812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d46517079276a4dab359811006e2ef767e591b47 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3922fb6a70df3e2474d+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c93da2b0f65324f182111345b86306629d670847120811323a5e36111f4b7a +size 2520064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..910fd42341c7a91026feff8e73bcb6563572229f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec344eaf4f9b146d749fadc8eb5f88bfbf8405f8e64c52e2610b0c71e684c97 +size 2327880 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f20a2894c779d49ad3d7f2a604faf7996c184d43 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b3972df3e33231af7683+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f15eceed7c2c2faead9e79476187e1a2bf97e85c98989781e687d6217daaa9 +size 3390464 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.hlo_module.pb index 26ca69a8732b0147c2737a5979901724ad2e0819..b4e6c16f42b5841a3b416a34149ff1004ecb23d9 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:891688b9e7c4937c0bd5b89684410d71676642526c924b6d34f1f79a63450b14 +oid sha256:78e4287bfc92bf850eea4d10461af2352f2edc23a29ebe6782591e1b850f075f size 83920 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.neff index 3cf9cfbcc859d5236e0e88aceea5af4881c32442..5c576b737d9ff722a68ce0d0067e30e98e735637 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b77e0e7f43a3603bfe9b+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1a7cfe17a5b512aa64841fede6451fbdfab672809be3a4232b95fb763f29e99f +oid sha256:284a5071c265c48612d234ce96a5c2855f346de8b297018766db228865277ee9 size 185344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.hlo_module.pb index 935c2936544ee810a2462f0c043e43b4295ae508..a05db28aa1daa64e1e6adf1788a0b8c7cdbbe8bf 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0e94e5e24d1f1d44c1195aa6c0bc815443caccb88c58683ac324eff51805978c +oid sha256:700fdb2999174103945b216119818f393e43318102778ceea42408cea535ef67 size 81323 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.neff index d71329bdac1688ebc0f8b021ba397075134944e2..5bd62aa52442ddca10951bfc79c87e8e11226db7 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b8997c221d74ec4a7842+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5d5b4953b7516509a2c02818a2480e4dae09aa7607074d07b4191acd30a1a83a +oid sha256:57afc6cfa83683d461e4e7a29bf91aa41b051b845bab370323414a6a7ec44a6d size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/model.neff index bacbd1355710553f0e49da0f13ea69c378462d8d..f0ad67ca06668adfbd0292f90c3ee8f2b47f9816 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db627f364f1509a3d35851947572abcb533b5792049a30253d8912b97ea10bf6 +oid sha256:42979cd0ec9a5f3294698a306d1083ffe6c98f8a98fe89bc2760dfab9097396c size 185344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/wrapped_neff.hlo index 005615e38294c271ac4486bbe957bc674352bec3..b248385fe494ffc7cad59a16508e903029cff1d6 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc0dc6318052d18d4f59+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2b713e884452e0dd669bde4ede5d8b18f59d3f4ba99485d593af4bdbd9cfad7f +oid sha256:b5ee20aa4f1f1686fd0bf72fcbb970e56e5afd7f78ff60bcfed24affa4a8fb80 size 193010 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e5429c3c1bfea143c0553c0c5b99573952190748 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38fd4d07237114f1e5b7b152b9ecc9e7faed11bd73abc539f18a609261d2fcc2 +size 1911064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8b4f28026983fd4fe77b23cefbc7cd306f7fe8f1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd9b5e25d91bca9370d52607a23e2e1e2888ddf185e2809c4d075ebc16a6724 +size 9944064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..b33048b2c0e28fc431a271dcdb143f56c1adc1c9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bcadb50ab85e2fba8d71+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99de851664d7db2ffcf1ddd5a51897a67461dca7912bed4cb5becfd72f45f322 +size 10287639 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..60ddcc80e16080ded570954fe3fc17240221f2ab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..39174d7dd5530fffae9e3cf826973d855720c57f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9f7682a68adc61d2363757bcf548c22a5f8b5a3bbe768fda1e8b80b7ca34d8 +size 944123 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fdbe243a82f26ebd87a6bda311deabf7164cc2d1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf2b84c02a9cc5486e3e+84f3e719/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212eecc57bff1679126e3bf0b125d0dbfa9f17ef653f818ced0553e11cbdf586 +size 31140864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/model.neff index 0fad72d05a723b55c15bb12ba79172041afd40a6..804e207e2418e3f4545d81d6c5531911c6bcbabe 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8429cecb2b4044158b1e7ed02765927d5d8a30edb021eb4c20bbb25374179c82 +oid sha256:a8b633e19f1762738f127621ff50d126405e0aea355b8abadbba521b3a4adcf4 size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/wrapped_neff.hlo index d89d9573700e4c451fdce28c9a323a2facc843a1..be98b35c896f791f6941cda19904560394773a3d 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c2d3f01e87cac25e1312+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b13184a09bd49144b6e04beaee93a50cc036b78b3d0f9811ad5c4f1de2a5f4bf +oid sha256:44e64ac581f0a7cf925adea4b412b0e40d764dcb011500119d451cd986f5d4eb size 247153 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/model.neff index 6ec9c76e3050ae8d5c8d658f6c57a14f502dac52..254b4d5758463f859280b44471b17b0c07d895c3 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6f26982e448868bb745d66f5dc9c4eac5495e2c1b45644dddaea3329dc6e4039 +oid sha256:1503c163901140c3c6cff34a88574d3b16f0cfcf93e5776aa6138f4c5d31702b size 4885504 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/wrapped_neff.hlo index 3b488cd73b88c7ebde6130d8e199b6ad3a3c0908..53e1d10bcf467986e7fc1de78f4ff805d2856a38 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c58c3b1c9745cdc8b7c7+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a4feb23c1fbd958fb7a2e6ee6f804d4f0d0d97a54b068d936ac5458e06332439 +oid sha256:c5267323fe94c9128dfe2dd422429248faff4e302101e83bb92f78c0cf7fd74c size 5058549 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c7b1afc8cbed0b2dbf01+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c7b1afc8cbed0b2dbf01+431f5505/model.neff index bcaf3fb9e78fb2372af8278e3d2023bc3fb6da56..f6c9c6a98043d9e583d7703d88c6b5e9129fc399 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c7b1afc8cbed0b2dbf01+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_c7b1afc8cbed0b2dbf01+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cbd29f12a931a6034fdc+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cbd29f12a931a6034fdc+431f5505/model.neff index a12afd4db0c9a0280158065dbf44e711dc7757b6..96d2fd66b7b404052a3f52202f94fe5485d46ebc 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cbd29f12a931a6034fdc+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cbd29f12a931a6034fdc+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cdb1257943a078485626+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cdb1257943a078485626+84f3e719/model.neff index b8adef5794916f499b0c16c0d3e45d3020642aaa..f873d0e19407cca45f6b19c609f413dd39372b57 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cdb1257943a078485626+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cdb1257943a078485626+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f49a570369624a9ecc8b9e186c88cc2aa8dd6821c27ef20822e2145aae9172ae +oid sha256:2c81b3204ab5b0f437eb9ffb073d99229c72ec5f7e4185a891bfdc8e767b285c size 31867904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2c5fcdff9fbfa35b7d64f748cbb7207bbcbe6ffa --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0cd76ace5e6f1a3df1193b16ac13dc0b6c893919326dadab8f4c9c2e702b50c +size 1911064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7c12909a82ab224ab2b0684417b140d2dc940084 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b907ab33b50f4f3d212d6499b5144bb73a30d3c6c4888505dfd28886c0677952 +size 8233984 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..fe1a536c8a9e846245b917f73b52f4dd1df0187c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d265ad478c2b4276dbcc+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e34beea364bce7e13b6ec51555ce7b79cd692014e00032cc5100e4ff1c63332 +size 8577559 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/model.neff index 12313fe2bca2004e356160ca4098ebb31108ef7d..2d43f71f7fbeffaa6ff9deaf124ee62df29ba049 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7f1b7f0169d2b9e38e0505e94aba7f5c35c3bf77540664e8434f50c97d74bc03 +oid sha256:5b1ebf710d7cc5b0de84ef8e7920dcd8eb62252bec30e4f2e0da985dd31de9c7 size 216064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/wrapped_neff.hlo index 303855757e0025fc151776513b7d355def6fc468..7c4d2866082836642c5ba9e5cfcfe24ebb8cf7d6 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d43edcfa396bb5f7fa37+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33d30c98bd7251f4cc223426d859552a205bb86a56ab8b541df5b93dc3f77e57 +oid sha256:d42680fa0b68c035ecba291608b9ee78d9dce3a1d8932fe01a4eae9bf2d77e4f size 223770 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..12c9d702c96d2d3d5d79fcd0da25323e8071ccff --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c4bfb4a3a80783b2a17c61e627c81e514f5fd14b92ec0d4f5e601794825129 +size 773049 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..71b0d375a8ec791470e24c48ed1280a02929c2f4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a07eee4f4ad79222aac0a031687e6f074f85e939e3c6a0a73a761f23dfb7509 +size 3841024 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f53210580e7ca168dfcd6194ab25754d3eaff686 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d51b8cc19b9784687709+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6fc751ec3a222237c1b39a9c068244dfb1b597cd10c9f00f0a2a61d8f841fb +size 3978841 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d6c19a447da67dfa686e+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d6c19a447da67dfa686e+431f5505/model.neff index 64f0b7078c724e74d8c7e18420cfc96cb67cbf2a..d67d9acd6b2a6fbe231449b40669f6c331329d37 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d6c19a447da67dfa686e+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d6c19a447da67dfa686e+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ec04796190477a39934d9f899e8602197a22cbc9e101dc0248dea5582b4469b +oid sha256:12baa0e6a5c8ae2d90ebf56eaa45a53f8085068dc450b5613927eafcad8e1350 size 103424 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/model.neff index 764f9cdbba76e3c31f8cca151ee2227f2a00a16d..039a66e561ea3ef85fc422e11159c84552cbd1ef 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:68adc92264f879a6a3c2ed4866a1def6023f6041cbece802067a56430225f206 +oid sha256:90011a7b74cd8cedd21beab5f0105b67a975dcd1c99a509a7b76832aa6c4c8ae size 2151424 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/wrapped_neff.hlo index fe8a4b41e3d414e237f7623bc2954f7c9cd95ec9..110a46367a74635e4f2ec80e2b4eb234e05c4d8a 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7e2548756fae2419754+5be477de/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2380ec34e81a57b7dcd09d2cef310b4ae7c27dbcfd4432dc05771b536dcadaf8 +oid sha256:930529517954a020d452a7d3cb9ec3fc249379cf44b05340e8a7e2993dad6a19 size 2221053 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d84f59502564753faaf1+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d84f59502564753faaf1+431f5505/model.neff index 8fb2d0c5b526ec051bc2302330d63ff608034012..6de944c18cafd39bdba5e04d8a922a82412fed84 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d84f59502564753faaf1+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d84f59502564753faaf1+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:57148812c2312dd95b5ddf1007ffd0f756fdc5881c70266129af49acfdd184fc +oid sha256:6879d6759e2fd04da1faf21f3b48689a6aff0a67926deed21a47bdada119584e size 2274304 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/model.neff index 2da852a38c74e4dbf48c0c6e77c6849e4b0743c2..63d3a49485f4766ae4f97ac71cffee3dc827081c 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a9d85adba2658d4625af536d31072f39991b231227cfb17c745adc0911889f64 +oid sha256:7614258fc592bd21a671fc29fd833fdf6321eab9923b28bdaa281a03ea028aa0 size 246784 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/wrapped_neff.hlo index 844816dcdc5b6390f835b7e75a060e090f6312fc..b72fd7079202294281d082b853096297c8c1f04f 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_da644c4824015946da20+ca355898/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:626da706ce9b8c4d7c551d6a4bf4b2b0ec5f085a91d62cc5692c8469f2e6fef0 +oid sha256:0652c2837255ddb07aee5fdffebf5b8ae68da37845f1e83aabe3f152b2b40db6 size 258114 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e493d501dab7626cee2a41ac607c678ad06bdb44 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07320203e12321430e926d11e45f841c5dada2dcdc4b9494ef6ce64d5ae37a6c +size 858046 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bb35d5f9d0236fba65cfbcaa32dbd3b2ab97c1c1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db708956da7a3174471d+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070af26c182dbd87738d25306473305a2e2e20171fdf6d04bcbfc2fdab5ffa43 +size 5786624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_de463290b0cc81f3e50a+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_de463290b0cc81f3e50a+431f5505/model.neff index 41653fa7ea418eb718f73a4b8d4c1070a9a16242..d7ad88fc9e26890d00987e59616603c6d6a0420f 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_de463290b0cc81f3e50a+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_de463290b0cc81f3e50a+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab5bcbb77f5aa563aea48d1f0d2c61bff08cdb8376e6a773d4e522532cf0f6d0 +oid sha256:3848fcec9b32af2021ea06f33bd5924122b55f43a41b7fe1e76d97d0215fa4c8 size 594944 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..107cebd2dc9223d7d557c2256bdd494131263beb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=1 --vectorize-strided-dma ", "--lnc=1", "-O2", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b25ba34ceb75e44194415a1b72bd90707c39db39 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f599ce69d962eb886127c2db10ab5c5dacd77051234269877f5c8ad84f473e +size 745398 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..248fcf23f3275f35cd1731ca59683a829e917d0d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7305d37ac4aede1368287e2e62ba519682ba1e3cf145273ff960470a8b342aab +size 2468864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..05a9eee8435fd128edab04f75392b92d11bb6f07 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e09b62be1d6d8ad18632+617f6939/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74d67e1562716284c3832f66d415f62749f6b3c57322035535309f16d579e4c +size 2640590 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9932c70d27d759d781be88485b74b17b49b4c04f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options=--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8a554e1b77b9a7df908fa74bdc87045aa82e3fae --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff9d6f42eae55702201bb0e47eb34ec59feb160a18d9cd679c5a34266c5256d +size 339944 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..26053178883b79c7517ec4744b80fee78620c017 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4125c11885b90ff94c9+431f5505/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c1b555dfee8836335340f096cf1e165c95afdcf6b22edca04d598dfa2053988 +size 8182784 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3bfe984fcdc978e129c8ea5b82b56a969aa19f82 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90219bf03934f40c0c8753f2e706536d262abb06db039f0e806a238e39b6a3d3 +size 1789812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2c0bd2f7e7c2545669b56b69754c921dad93cff3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e48df5a1ca8b2b49e13f+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b909a79a3a657d1ff90463f00c789bc37a5f0f958d50f7128eae8ea05697051 +size 2520064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.hlo_module.pb index faf2d305a3e0018c7110ca30f5864323a5d5eb35..b45c639e4a7e818e4d96f69f71149d19b10389fb 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4c0ae40a2d1e2306a933fdea473d674b57854e26c6608172c516da401a559618 +oid sha256:4eb25c443d6cf2fe2e2ab55b05029569a1aa3e75608c0634a8650533b06c46b4 size 46622 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.neff index 51f8c849ac38a168298d1c58dae3a62033408963..9e203f494f922b8f4690c863f764105ccdf6534f 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4ae034a0e6bde8dd152+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3b578b3c5b81bbbf8b7a20009bf45e82a4fca470e81c11a6da9240fa40cc4033 +oid sha256:23194ec69f19c8f3023e75314b47e31e462b52c4e3ad5482c7c5871a4fce399b size 144384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.hlo_module.pb index 4a436b9c2f836dffec88e39c4528b404471aabc6..9cbbc4c635ad7641dfda536147ede80bccdcfb89 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:afbe904f71746cb80e822a0d50f8263f88b82cd9e0cd1759620046bbb628b58e +oid sha256:7c1606fd12d57efa1a8823b5f6cebc151cbe7fabf201a575f62206bebe1d973e size 715372 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.neff index d0a2dcd40c0c85b85ecf9e16d6356d7bea211904..dd6e80c40c08f1909407b70c00598082e7476ad9 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e6cf0fcd9a16a4306e4c+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:796c26acf7cb1d1320884e10cf9f764ecfbb6cfe557d24348151b3cb7a85175c +oid sha256:4f8875e6a1fdad78dafd4d4808f2ef48525c34c0f1b30f6af4cb1743c8d30e82 size 19835904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.hlo_module.pb index fff590726b32f7b074886a9a2639593c34aaae71..14baac76b252c4f5619625e0bb51aa8bcef52a52 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3b75d37483883ea40ffa8ca5df68499478139b9b0c5b415240667ec36afe54a8 +oid sha256:d4135cdf3a474d12793ab55474180091c957ef032abef7de650b0a277cb2048f size 47478 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.neff index 8a6a56e0b6373b6f8f38aa0c195ed9747990e5fd..83b0124ec96368bc29408c631698f5485dd1a727 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e9c7a317b8ff33889716+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a0db86f94352a9b9001fde493191928bb68d81b78cce34a7c40b8b2306f8dd6f +oid sha256:1b6c609b2232870f2babcf7c062f4312c306563a2d58f3f7cc7589af54486206 size 246784 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..48c060bfc566a2808b5ac053f2c6154a586b957f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce55f9f3b779172d357a166157f85e849aef70cc86fc56962d5dd729022e4b4 +size 773433 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f3e3f12d2391de22aadf092dfaaa037fc832ff68 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6969e3652e9d4c9605bb9b538e7467a7e51bd5ceba9981fb92784f0e28f225b +size 6237184 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..cfd28983eb686b722181e3b5f0d7587f7d0c4e91 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_eb35938cbfc781930141+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05205d1e0412418e6181ac619583bccd7ee5278736b7c9e959c32a236245b46f +size 6375001 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..91776ef5712b5571d1de1baff244a9c499834010 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffccba216823c3cebff446b9b6a9b9faa3fc2e76552e65e0df5499d0a03a273 +size 1789812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d90108d89e43372f408f85c098fa8a88e6c1a0de --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ec3616cec65f8deb284b+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:636bcd5261129fea69900483b03b798ec23da6207d24586bab57257550121d11 +size 2520064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ed6180267143dfea9183+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ed6180267143dfea9183+431f5505/model.neff index a79586b2377752509482627cf5fbdb97e8f51036..3811d7917b56c964461723a18a924339eb13ffa9 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ed6180267143dfea9183+431f5505/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ed6180267143dfea9183+431f5505/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ef8771b8447d48519ae4+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ef8771b8447d48519ae4+431f5505/model.neff index 09a769b90b84cb98c7e5be1c1dc4c82e94ff4299..08da78d525f1f719d5f8bfcec45e8a2d8257b4f0 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ef8771b8447d48519ae4+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ef8771b8447d48519ae4+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3f111aa060cdc7f6c5648eda137df09491ae67418906aae99d80996bbf627fc +oid sha256:2897ded479757c09958822fc780197d52175739e8c36edd6403aa2df5bf5a1e2 size 3974144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f101d5f6b79e47ea24cd+431f5505/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f101d5f6b79e47ea24cd+431f5505/model.neff index c855e14e68af9f24a97ec092cb220491f50720ae..7aa3afbfb6d25f3e5bcb147742b0ed5b1c211f52 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f101d5f6b79e47ea24cd+431f5505/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f101d5f6b79e47ea24cd+431f5505/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:afba2a97ccce705a91b19a8cd604a872fd0a2d9002e3b4f36ee1f4beb347f98b +oid sha256:ed3ab87f52d67ddded78138be2135b0830286157aabc64d3453ea73f7e2be11d size 1178624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.hlo_module.pb index 839081bc58795f75b84338359e184c9d07d2c811..58f4cb07f3acaee9b9ff560d4a8dd98c7c66196f 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ab306ca3554c7c2a6e317ad92aaa6fb0edec08e7300665f2f603656289cabb6 +oid sha256:b086f89fdd83c753893ea4f9e290ae3ae7da3856dff528cc953936b24c590426 size 427940 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.neff index abf832d13640a625dcdd701b9637cfcd017caba5..155ba5d163d42cc1e434103225ff618d1b6bffbe 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f407a744f5f40980a494+84f3e719/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2136c4058f81b4b50d81d437353cdbbf362989256e37362d38d0cca62735c7a5 +oid sha256:d75b500fc075523597f5bfd193d2c9e702baf6f46d03ce9798321e780b0cb123 size 31120384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e24f877fd3bd437b366557076d7c7d635759a2ca --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-dge-dma --vectorize-strided-dma ", "-O2", "--internal-num-neuroncores-per-sengine=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..132bc422001def92d60719e338da0d0394dd4954 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1360974675cafa0d38921f0013c9df0c9639537b0d0076974f045646fa23e3 +size 773433 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..139ab3407aba884e4ca62946fa17a53e272a3469 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:302a92c6f3fe621df127d000505e65a36912809c3216fadc23836a0cae7266e6 +size 4926464 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..19f565814dccb9b7cb99db680878ae0e37dd9d74 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f559b4b89708afc7e809+5be477de/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236f5b7aba42341d1994d355b4f5bdeb2a0c816c819758d2b6e070f2ffffec6a +size 5064281 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2078b3647f01aa3165babe7ccfb751b4575e61 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "--lnc=1", "-O1", "--internal-hlo2tensorizer-options= --modular-flow-mac-threshold=10 --verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4c7a25ec423eb9ecf78aaa32e5870966efd9e309 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f904043d81d836bd0374acd05de056e257e0d854b36af66b646aa6bcef23ff9 +size 1789812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b65d1a7555d57fbb856abc6b859499a7c9d52f05 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8cade1575b9d31c15da+ad9e832d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b58e5f3568be6c98ea11334ac31a3b989f6ca4cb96275027ffc845199b1a1ab +size 2520064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/model.neff index 5a0cc4be521d2f28fc7632fcfe89761c56e8c219..4237d3675e8adc880406ba92a59b454ebffd67c7 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d949554b84305800c99daa634390481e9a90870b437d5a62f955b44e5a83fffa +oid sha256:b0257059d9e332b0a165601211a0f5a11c8471c1f55ea42fdf23e2fae04d278d size 246784 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/wrapped_neff.hlo index 323ed18658d61f30248d6811fe80ad85bba87f86..c74a39bc36ecc53c7de6692932a6e7762b124356 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f95e3cf0271f5c661734+ca355898/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b73125970ef192ad54cd2e87acba14b1a56c7d8febb88c8ee7ee54f8fa4087bc +oid sha256:5d618b554d92f95543e636879190f32bf698d8094c33e0a648cdff00e7a4e58b size 258114