diff --git a/.gitattributes b/.gitattributes index 0989f66791939045c68ec822f2b4189585a32498..93b1dce0d720b67e9d9af5e184a08d7f8a740211 100644 --- a/.gitattributes +++ b/.gitattributes @@ -4777,3 +4777,60 @@ neuronxcc-2.20.9961.0+0acef03a/MODULE_f68e835b3390768bbcce+5aef0af0/model.neff f neuronxcc-2.20.9961.0+0acef03a/MODULE_f68e835b3390768bbcce+5aef0af0/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text neuronxcc-2.20.9961.0+0acef03a/MODULE_fdb7516de508e42d4f39+97633c67/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.20.9961.0+0acef03a/MODULE_fdb7516de508e42d4f39+97633c67/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/53100a81701818c9be88.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/53100a81701818c9be88.json new file mode 100644 index 0000000000000000000000000000000000000000..1f04ded78d7c6424dcd43f445726fb47da0302b7 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/53100a81701818c9be88.json @@ -0,0 +1,221 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 8192, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": true, + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "interleave_moe_layer_step": 1, + "intermediate_size": 8192, + "intermediate_size_mlp": 16384, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 10485760, + "model_type": "llama4_text", + "moe_layers": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "checkpoint_revision": "92f3b1597a195b523d8d9e5700e57e4fbb8f20d3", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": false, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 40, + "num_experts_per_tok": 1, + "num_hidden_layers": 48, + "num_key_value_heads": 8, + "num_local_experts": 16, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 16.0, + "high_freq_factor": 1.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": false, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/5c9a7ddb696911cf7f93.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/5c9a7ddb696911cf7f93.json new file mode 100644 index 0000000000000000000000000000000000000000..d92689a963c368816e69a96cac020e3e773c33a9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/5c9a7ddb696911cf7f93.json @@ -0,0 +1,221 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 8192, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": true, + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "interleave_moe_layer_step": 1, + "intermediate_size": 8192, + "intermediate_size_mlp": 16384, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 10485760, + "model_type": "llama4_text", + "moe_layers": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "checkpoint_revision": "92f3b1597a195b523d8d9e5700e57e4fbb8f20d3", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": false, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 40, + "num_experts_per_tok": 1, + "num_hidden_layers": 48, + "num_key_value_heads": 8, + "num_local_experts": 16, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 16.0, + "high_freq_factor": 1.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": false, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/c958eda2360716f886e4.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/c958eda2360716f886e4.json new file mode 100644 index 0000000000000000000000000000000000000000..0136042f9dd3484ebd68c867f612c44cd726b085 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/c958eda2360716f886e4.json @@ -0,0 +1,221 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 8192, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": true, + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "interleave_moe_layer_step": 1, + "intermediate_size": 8192, + "intermediate_size_mlp": 16384, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 10485760, + "model_type": "llama4_text", + "moe_layers": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "checkpoint_revision": "92f3b1597a195b523d8d9e5700e57e4fbb8f20d3", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": false, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 40, + "num_experts_per_tok": 1, + "num_hidden_layers": 48, + "num_key_value_heads": 8, + "num_local_experts": 16, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 16.0, + "high_freq_factor": 1.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": false, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/f9d1010b22a4e5da4bd5.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/f9d1010b22a4e5da4bd5.json new file mode 100644 index 0000000000000000000000000000000000000000..be707ea121d78147cb14288b8132cec52e5635d0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/meta-llama/Llama-4-Scout-17B-16E-Instruct/f9d1010b22a4e5da4bd5.json @@ -0,0 +1,221 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 8192, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": true, + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "interleave_moe_layer_step": 1, + "intermediate_size": 8192, + "intermediate_size_mlp": 16384, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention", + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 10485760, + "model_type": "llama4_text", + "moe_layers": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "checkpoint_revision": "92f3b1597a195b523d8d9e5700e57e4fbb8f20d3", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": true, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0, + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 40, + "num_experts_per_tok": 1, + "num_hidden_layers": 48, + "num_key_value_heads": 8, + "num_local_experts": 16, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 16.0, + "high_freq_factor": 1.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": false, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/tiny-random/llama-4/585b1c34b9a47c8c0a73.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/tiny-random/llama-4/585b1c34b9a47c8c0a73.json new file mode 100644 index 0000000000000000000000000000000000000000..40a2fcb344d9c4c7ec8da973f3b6df1f2f903285 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/llama4_text/tiny-random/llama-4/585b1c34b9a47c8c0a73.json @@ -0,0 +1,82 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "tiny-random/llama-4", + "_task": "text-generation", + "attention_bias": false, + "attention_chunk_size": 128, + "attention_dropout": 0.0, + "attn_scale": 0.1, + "attn_temperature_tuning": 4, + "cache_implementation": "hybrid", + "floor_scale": 8192, + "for_llm_compressor": false, + "head_dim": 32, + "hidden_act": "silu", + "hidden_size": 32, + "initializer_range": 0.02, + "interleave_moe_layer_step": 2, + "intermediate_size": 64, + "intermediate_size_mlp": 128, + "layer_types": [ + "chunked_attention", + "chunked_attention", + "chunked_attention", + "full_attention" + ], + "max_position_embeddings": 1048576, + "model_type": "llama4_text", + "moe_layers": [ + 1, + 3 + ], + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "tiny-random/llama-4", + "checkpoint_revision": "9e716f5d4d1ffe0a44a15f46f4a12b840439aba4", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 2, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": false, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "no_rope_layers": [ + 1, + 1, + 1, + 0 + ], + "num_attention_heads": 1, + "num_experts_per_tok": 1, + "num_hidden_layers": 4, + "num_key_value_heads": 1, + "num_local_experts": 8, + "output_router_logits": false, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 500000.0, + "router_aux_loss_coef": 0.001, + "router_jitter_noise": 0.0, + "tie_word_embeddings": true, + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 202048 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/0dd3b941d43fb01b72a8.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/0dd3b941d43fb01b72a8.json new file mode 100644 index 0000000000000000000000000000000000000000..496555dc7246d4c4673d5bab6d17605121cee633 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/0dd3b941d43fb01b72a8.json @@ -0,0 +1,66 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "_task": "text-generation", + "architectures": [ + "Qwen3MoeForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "decoder_sparse_step": 1, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 6144, + "max_position_embeddings": 262144, + "max_window_layers": 48, + "mlp_only_layers": [], + "model_type": "qwen3_moe", + "moe_intermediate_size": 768, + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "checkpoint_revision": "61082d4deaa4785f64943b443cbc2b5de7524fad", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": false, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "norm_topk_prob": true, + "num_attention_heads": 32, + "num_experts": 128, + "num_experts_per_tok": 8, + "num_hidden_layers": 48, + "num_key_value_heads": 4, + "output_router_logits": false, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 10000000, + "router_aux_loss_coef": 0.001, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/5c776e5f1eb55e76831a.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/5c776e5f1eb55e76831a.json new file mode 100644 index 0000000000000000000000000000000000000000..21d1d145bcefa5eb378d526e82d61d4b07b37d04 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/5c776e5f1eb55e76831a.json @@ -0,0 +1,66 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "_task": "text-generation", + "architectures": [ + "Qwen3MoeForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "decoder_sparse_step": 1, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 6144, + "max_position_embeddings": 262144, + "max_window_layers": 48, + "mlp_only_layers": [], + "model_type": "qwen3_moe", + "moe_intermediate_size": 768, + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "checkpoint_revision": "61082d4deaa4785f64943b443cbc2b5de7524fad", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": true, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "norm_topk_prob": true, + "num_attention_heads": 32, + "num_experts": 128, + "num_experts_per_tok": 8, + "num_hidden_layers": 48, + "num_key_value_heads": 4, + "output_router_logits": false, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 10000000, + "router_aux_loss_coef": 0.001, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/99615150643a9e903722.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/99615150643a9e903722.json new file mode 100644 index 0000000000000000000000000000000000000000..4e98ec6cb927ef1b6d95fa16388d53cbaebd8243 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/qwen3_moe/Qwen/Qwen3-30B-A3B-Instruct-2507/99615150643a9e903722.json @@ -0,0 +1,66 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "_task": "text-generation", + "architectures": [ + "Qwen3MoeForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "decoder_sparse_step": 1, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 6144, + "max_position_embeddings": 262144, + "max_window_layers": 48, + "mlp_only_layers": [], + "model_type": "qwen3_moe", + "moe_intermediate_size": 768, + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 8, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "checkpoint_revision": "61082d4deaa4785f64943b443cbc2b5de7524fad", + "continuous_batching": true, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": false, + "glu_mlp": true, + "local_ranks_size": 16, + "logical_nc_config": 1, + "max_batch_size": 8, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.19.8089.0+8ab9f450", + "on_device_sampling": true, + "optimum_neuron_version": "0.3.1.dev6", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 16 + }, + "norm_topk_prob": true, + "num_attention_heads": 32, + "num_experts": 128, + "num_experts_per_tok": 8, + "num_hidden_layers": 48, + "num_key_value_heads": 4, + "output_router_logits": false, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 10000000, + "router_aux_loss_coef": 0.001, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/15f7e443873c3474a6aa.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/15f7e443873c3474a6aa.json new file mode 100644 index 0000000000000000000000000000000000000000..196770eca4fe7ca59d8e3cdb1e5011aaebc20f75 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/15f7e443873c3474a6aa.json @@ -0,0 +1,91 @@ +{ + "_entry_class": "MultiModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-t5", + "_task": null, + "decoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": false, + "output_hidden_states": false, + "static_batch_size": 1, + "static_num_beams": 4, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + }, + "encoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": false, + "output_hidden_states": false, + "static_batch_size": 1, + "static_num_beams": 4, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + } +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/5d5dadc2c2138bf8ab44.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/5d5dadc2c2138bf8ab44.json new file mode 100644 index 0000000000000000000000000000000000000000..ad340944f5e935a03d11fbb70d890f003f6b9d7c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/5d5dadc2c2138bf8ab44.json @@ -0,0 +1,91 @@ +{ + "_entry_class": "MultiModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-t5", + "_task": null, + "decoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": true, + "output_hidden_states": true, + "static_batch_size": 1, + "static_num_beams": 1, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + }, + "encoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": true, + "output_hidden_states": true, + "static_batch_size": 1, + "static_num_beams": 1, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + } +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/d83e395611ddc3a29d9f.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/d83e395611ddc3a29d9f.json new file mode 100644 index 0000000000000000000000000000000000000000..1981fa74bf11c72a546e1c357d3afa293a9d5485 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/d83e395611ddc3a29d9f.json @@ -0,0 +1,91 @@ +{ + "_entry_class": "MultiModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-t5", + "_task": null, + "decoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": false, + "output_hidden_states": false, + "static_batch_size": 1, + "static_num_beams": 1, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + }, + "encoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": false, + "output_hidden_states": false, + "static_batch_size": 1, + "static_num_beams": 1, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + } +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/e57cbde649dde732937d.json b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/e57cbde649dde732937d.json new file mode 100644 index 0000000000000000000000000000000000000000..b550d3bc9697ef54eef3eae64365e7808b7dc281 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev6/t5/hf-internal-testing/tiny-random-t5/e57cbde649dde732937d.json @@ -0,0 +1,91 @@ +{ + "_entry_class": "MultiModelCacheEntry", + "_model_id": "hf-internal-testing/tiny-random-t5", + "_task": null, + "decoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": true, + "output_hidden_states": true, + "static_batch_size": 1, + "static_num_beams": 4, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + }, + "encoder": { + "classifier_dropout": 0.0, + "d_ff": 37, + "d_kv": 8, + "d_model": 32, + "decoder_start_token_id": 0, + "dense_act_fn": "relu", + "dropout_rate": 0.1, + "feed_forward_proj": "relu", + "gradient_checkpointing": false, + "initializer_factor": 0.002, + "is_encoder_decoder": true, + "is_gated_act": false, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "neuron": { + "auto_cast": "matmul", + "auto_cast_type": "bf16", + "compiler_type": "neuronx-cc", + "compiler_version": "2.19.8089.0+8ab9f450", + "disable_fallback": false, + "disable_fast_relayout": false, + "dynamic_batch_size": false, + "float_dtype": "fp32", + "inline_weights_to_neff": true, + "int_dtype": "int64", + "optlevel": "2", + "output_attentions": true, + "output_hidden_states": true, + "static_batch_size": 1, + "static_num_beams": 4, + "static_sequence_length": 64, + "task": "text2text-generation", + "tensor_parallel_size": 1 + }, + "num_decoder_layers": 5, + "num_heads": 4, + "num_layers": 5, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 8, + "use_cache": true, + "vocab_size": 1103 + } +} \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.hlo_module.pb index ff2add9228e02876f3420c76e3459481645507f4..782b82bf9a4a4ebf93378bc32956f4660440a70a 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c4b6d089df781e3ab0dfe911812cbb200f2dc1d358cc2d49abd01f7222601b25 +oid sha256:52e2ac447c53f64b1d6c2ffa89ba1c66587cb89fa087c23a7f9e266d3953fca4 size 497603 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.neff index af08051da20c68315921439b2e9724d9fbe8630e..fd9e391547b485b90e4741b8eb08a9113ef01a14 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_00a086963636c3805778+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a9cdaa16cfce3a4b868994f3a379ad2cc60becae6b12accc37ba0c6e7b5b89ad +oid sha256:7d38dfb588e27e16a260ab31ca8eff6551c9655002dbe77ebf52baf8f9396af8 size 31345664 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb53ce53583cfe21339b4bed39f5fa1a679cddd1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..853451f0393707d9e09b5c04d0791e824f2d931a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67438285964b08bb19d5cc976e3c54297f08d1b0df76c2f3fe542e1624483de2 +size 9670898 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..040c3bacc222cd32680954d4f4827f9bd485edda --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_02da278f167522769f43+253d6470/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:851ad19d69a28aebcb76eeb4e4529f9d13bd810ffc4849ea085036f1af5e2beb +size 17439744 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..39c2c734c0c9a1cf027e392c557504b6f5a34ff2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a42e5d8e63342a8132a9098c06cceb024a7467006f87a370d54b32c22639217 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f89153b1953a4299dfe4f0ec2ce50fb52e5fab05 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10118825694329555156+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e50431e6e3ec3e6317acc7e994afa9cf40ee1210 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86311f9f0a00aedc439bf6b1a7e72130115305331deaa6d802b2852f929f1b25 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..19703429879a7f3bc5d59e7b5079982adb34d518 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10149811978412508127+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7fcef3c41c0d6edeb3832dd09ad315e34d1c3b05 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3772c9b53cf2c833d0d1c07c90e6b645617324394ad76cd3936137a547c93adf +size 1144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6ec3109636bd5d62ae10022a8f5031cda60cfbf0 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10449065838075029877+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..bc7dba47c95bebece02d0288cd8935858c400394 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae138f6fc3e7b0cb4fdf2453c4cd8579723d427253d4f54a890b46ff7e1df6a +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e2d87dbe4210d24e144091592315aa159015a48c Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1054760819228113117+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..262465c49748bb91f8bc2cacb35de9ccb0cce94c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cdf21fbdf4fdcb05b1a22e95aee811e40354d8145c54198b487140629ca097 +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d28fe3a295751f72cdec335e8a2040ecc21a2f35 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10665707039599941067+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3bbccb1c0369f1c21fb06543a454b91e3c62a475 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eac431d89ac5d753c6c7948e2d74f830fde1dab9bf7d7cc89d1878ad7a29689a +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..cd31b5d2291ed05782d345c505f4be131938aeea Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_10855235522929658999+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ccd2f94f5984921811e989fbb95e83d9518803ce --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3e5d8a329342c24bbba2d50035e229e31a2376adb622342e9d86956cd7408a +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e7a66ae2692072c7206a3a84b8050a92ca6be1be Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1090664928465068038+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4ddaad102731278721b6f783da50c45d424260f1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a896dad3fa2c0fa6a2db99ab90c4b5edba1ae9ccb09ee00f41e99c511b14541 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..da7c433129dedcbc0a0c53169537632b5e9d0c4e Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11202137614579807680+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2cf74a4202b1ae1308ad55ccd45438c72e8c1749 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092b80157d518351dfb8d5dd0c0b1dde38d23e902bee644d29f7666f5d3f4892 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1fc47775867e1ec9a550692914354285691c624f Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11277182249750227945+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4edd5d9a069278486ab901ecd35a433607127fe1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b2fbc4b8ef776e0b5bc8f2a97a91e3775a1451e3b54eec5a1bcb8b37460595 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..25bd96ef0478d5500baf6d1a039c638093bb681a Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11434367459596307593+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b102a1d0de592826766b33432a3aa79162be57f1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3428f502a287da892ae564e12a0364d236abb2b133c6a7d79b419f19582c424 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..27e2704fef8d14dd88b7a4326e6cf9a713b1948c Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11620898142083431840+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..78b7516c43435cb9705f91c72e2d3fcb300b3da8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e7bb1a2ae698c9cb728cbc2763b153dd03fa2b5747fbfb418d4989c502a885 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4ee52cb351bf48393554fffb5e143662e5add8ed Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11819691844502964612+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7bba865dbec7e95ea91468c2d5a97c49df528617 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50844827e4f02bbc6f1a8f5cced9c8cb36e9855929bdc3fd3d5d5b1491ff2fee +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0df361c37c9d06191ca712fd756bc16a90ac3e27 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_11949607074455821922+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8e512d9b350f71d61580af9624c8e618457f80f6 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dac28e3f7ebe7579d25eedc525ab122ad6859dcd448c798929190baa40b7b67 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b7cb0d7bb4fa52abf86ba0d64e3198d02cef0df4 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12291785342055497735+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..86186414e79e4a5c24b2629e86e20de265e29b46 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a3873aec9c3d0922d30abefbf62110abe7dc6b32896dbcd91c23420428ece2 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..76ab8878677379e8a1ec80e65f3563c7acc09a2c Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_12858209690589865209+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..906bc6541e7964254a83672ac6149f3c99f7e406 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab3f9c95ee2facf77840c5a7d904d47fa5a46a3357a9d58ac551123c76dcd8f +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c34c852675a9a8faf47c344c2361e882bb3fe2e2 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13298849504190979618+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f283430fe535f609f836db5e2010a8f5441f690b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc8ff919893cccee58620b063b799fbf3548c59f0c1d6840e4e1391d9c31a5e +size 2861 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7cff05637a8bf7e97027d0ec918592ef01bd11a6 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13708481322180332252+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5b665fd26512856f41d9ff5f4c28cdc774168db2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ead735220105699b2334a57958d25734e9bd86cb5ba67dad31e66e9c3ab5d204 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..124407dbd7717c8483a52240ee469262f15ed4ba Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13837596457087810475+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..62e96717329b0f35eba8936a3baf1c3da9e38f0e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f6ad81d3bb99d5b3f0fde132e512790135e2299ae8666dd544405693fd15df +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..71e44888e6a1f6c7c6caefacd65ac4a30a37e8d5 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_13856630914759037234+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..dcb949f8c35940d8f604c37d029a7419395cb738 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:719f8aa3529c519d75245493496aa89e47dc178486a6333dd3d93a573d444f9d +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4854186dd84ba90e3bad6922f35c0d6ecd3cb072 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15261586862706909689+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a1fb038ac2a04f0a549497dca45b236bf444fb28 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7b797e842693cce6c65cbe434bd9d3e09bf967a3623fff8b14ba5a1bfb0590 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4558c5215051e79dc812d7ff44b036622655d2fc Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15294796227089169965+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..14aa67860cc05058197eb0d397a115fb67ef92b6 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8910c0e31207508f5190f2b1bada1d933456fe8cba5adae89ee1c0f6fb8ab34 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ac153364ade2c08a03377bbb97c0dd230d974890 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15383404534416318704+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1f615ae21bde0e83462d58e60e93cc7036fa4311 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b453d9412b470017be7adc71575130eacf5a7c8277a6b4424e0751ceecaf33df +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9946abee35ad2701c02c5ae84ce0958dd7798ecc Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15704081915593163079+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..509e50c2b377d4012d29dc2dcbcc87f7a2562cd9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6011200a05558b8d896f11050898479276a557413676de70326fa9810afbacd4 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f2e858e6059eb6212f6cb9b24d7756d6abfdaa9b Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1587399457649203969+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/decoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/decoder/model.neuron index 90dec5f3231ef0fff4ffd800319701569415afa9..fbf87f430a4bc62c87cd8328f3f66961f1d40684 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/decoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/decoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b788d306aa621145bd4c1b566e270308aa9d03f560b54a659020c5087dc28413 -size 1190094 +oid sha256:c062fb6a1f3d277faac7225d1bec3b60dff7c9c7f780cc21ef74a345ad1e0409 +size 1189966 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/encoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/encoder/model.neuron index f48894ddd94baff7166ff9c85ca13d95057e5c6b..4ca805b61a2ba13ba5cce95ec5703450a11d5f3d 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/encoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/encoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fd726585ac540b16f29cf45b77f7fa0beb2fa5363f3d09a5a0c25c4007501304 -size 349882 +oid sha256:7c3b2291d6e1e91d862de919369aef0c73f10af7f0d3d06bdac64df2f247ceb8 +size 349818 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16364384937141820797+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16364384937141820797+e30acd3a/model.neff index cc3145ec179a1d9ecbf09975819dff6290577cb2..e883da46ae19f3706a5c19f9feecb8c67415cf4b 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16364384937141820797+e30acd3a/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16364384937141820797+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f9287944d40128c1ec671204681b511e75f25b60 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3e0bc5a3c7d16f319499949a174246d04450f8cc2080d819fa3aa4bceecd678 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..35284706e21dbfe2cd9996cf69edd1085a914182 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16774151007614265487+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d7f57ca2ba84f1cb98fa7fa791dc6ac57e243838 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cfc19f1b309d6a8d5805d5f4d2996e55655c88bed387674b3a369598c40518c +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3c6d10388cd293fcdb7a28d6f0203b0f30699e6c Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_16963083935060167100+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6f597d61e71506d05a43bbc7f786e50e1f8b90e3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8a1066be3228bbe47e1228ad7b3defbc6877df254c70d9c3772ed60075b1a15 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f84af9cd830acb23b46d165c8edd23fde1e412b1 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17127091050305702058+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..77d5f743792bb4c45c37d075ca8d2819322eba9f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe848e2380679bb760f4392c5e43fc5915960275d98ec31e95b0d48cf433369 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..93f81fb08d08b3ea9c47cbc6316bb477cb54bf90 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_1729176184418632850+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7d1c4f6767a01ae80f4d152cc28352723ca9dfb8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7752379c4a6681e6d736b9466fc50ed1167744b11c729dc3ad44fdee1021a38 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4c433638ec9803cd6d76284d78bb934668e185b9 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17313106528817084385+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cedcae31cd2e003e183f6c87d0d439039ef8b01e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d761528ce6886a8b55d0c5ea938e8bedc2b6e7a1632afaae7f26549f37e571 +size 1369 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ef08330fb1f7895036af3f36fc914f96e447ac87 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17369777196536189124+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d1a6a25662366245e230217e58aec1ec02b33934 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928fcca6423e3e233e6fec41fe75a3628dbeba9b4abc2fef942b0976f42880d7 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..236572121e67db8368bb787f2c4dba95d8d8a1fc Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17428083197400802541+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9c4111cbd1e8e50de49dda93d637f2c5f0b943eb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c211fc5277964b7bbc67d57ccdf857ac3e17cb508c34045db4b2935ed8aabaf +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8f8ae5147fa9d8cf7b30f6b3103c3a04c622d2a0 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17557006053795692186+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7dd9349c009c754bd318a617a382b45a148a8fbf --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c172e3fd432c1b7bbc9a605173a704ae4851f588357c1ac13919d74cfbfb7c +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..de6431698b400435af16ff0d69168be10f003454 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17563204255823942492+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..71eace50b412cccce65fe73ba7507243777c5a1e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d265c14a4e669b74aaa8e5d9578247f2de04d1d5210e6a981c95368c8c87a026 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a799099075a086d4cb10b1af0bb95d65f7a3fa2e Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17663242194127898969+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d560aa7836266076df3bf4ce364a30646e0838a3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4243920bcc2c2a24a52dfa8987ab9473deb4d78a4670a61445d473982e64db7b +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4d7357512ccf5dd500a4626d09f4e2e27bbdb570 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_17820036763001301806+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5cbe3dba6566c3bebbbee6980d17a189ee78ab42 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bcafe3bd7cb039293067c828a6cf4bdf13c979e1a00b27bea63fed4f037178 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6b6d1123082c030f0e2cd70ddef09fde015aea58 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18065335321178308811+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ab5ff6e160a511c3acbe0fe420597dee642311e1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293d0ac96beb67db77da03ff32a557fca6828445dcca222378824d2306810592 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c7f3765ae5c5ab9ca205c91ed9b41946c56041c5 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_18132732170084255670+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3168ffbdbf1762cd60c4ce40e547f04290f350f5 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab014cbfaedd6071dcaa1fca0d83ce2f63df59982e5dfabe27f4e74caadd4179 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ed1b22e505daee2fe09fbb4721a2d061ab347e15 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2019660303511744503+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7696047ef5a6a0a1fcdc117db4fe2ca5fcbab181 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f545ae7d060322f5989444c0528b27ec2689a53b32d9d11cd53376fa63d3a8e1 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..53494d0e64df4873f756fe655ab06328996ecf86 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_212973925893596393+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..631c21bd4f2b45ad54395106e6d57bb16abec40b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c72e93d823b706748e43edc828dece2fb7b6a98a58e5bbfff127ff47325c1884 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..74a019caea04b4042e61ca278a808edb49558ce9 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_219872634856243073+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d357aff629b30b4aa881a7a0cb6691b3d9b46f14 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e65fb7f1a7ade84bee7263415a7c03f3ea40431bd2e36430b339a378445c4d +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9323b34ac91dcbd57fea02913c4c4a0864422405 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2213217598519524012+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7b2c7302cf528c77276ef717f2e1674456569c85 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f66cf7db42deebdd2e40a2d8ffe21cb944546844f0da4d13c53d3cc1b9a5d9 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9e9c1846b3eef86959da95c349278d28653186e3 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_22971814024490892+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a297a9b52f229a9d9ced2a6a4f747d96301ab5dd --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfc4ab0cc5bb46d9eae97062bb084835dd03a2cc877999bbadd1a338e38874e2 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5d10d381d0ef1ad8b021a54e1b1a9e9dd0dce3fd Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2312007082139657764+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..bffdd3ff42ffb62a3193a19e15071208accc14a9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddfdd3b97bc014c3753edd934bfc9558878a8ef0a424799cec49b546e76cb5c8 +size 110959906 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/model.log b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/model.log new file mode 100644 index 0000000000000000000000000000000000000000..0c20de5c3f2f5f49c47bb991ef422999f81d8411 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_234b5c34641e778cc5d2+ed72d204/model.log @@ -0,0 +1,3 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_234b5c34641e778cc5d2+ed72d204.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_234b5c34641e778cc5d2+ed72d204.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '-O2', '--lnc=1', '--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: [XCG815] Estimated peak HBM usage (18.327946) exceeds 16GB. Neff won't be able to load on chip - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. +2025-09-10T13:49:56Z Non-signal exit. Backend exited with code 1 and stderr: [XCG815] Estimated peak HBM usage (18.327946) exceeds 16GB. Neff won't be able to load on chip - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. + diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1d8e0cf5e2571668f7d7cee05675933afe117313 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a7f9c47700367d81a831d44663a9ac8f3dc98eceed9c60caf63caddab83be0 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..09a35f290e199cc84c5a3e3146d2786653688f60 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2629259027206010953+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..99527613aac38a9ccf298d52516de8e3f952863d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4991138b51beb424eda5df96a2eacae9bd7006b90f569b37a2ade355cfede5d0 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bd4df58aed1b16573ea72ae9a274e8b6da6a906d Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_28619913331587313+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..66da87c89d00861f29b565c285a8c6e930f2efac --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793f2df54b945f68bc082b1e306b1a2fe648fa0e3da939c30cfad4a53718b44f +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..cbbe79363f9dfae450bddc13bd6de98c49b62918 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2891572966407268505+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/model.neff index 99d05194538b98a7645a8d4b22f39aca365734cc..f0bca55acaf985f48688bc71b117eb04eb39fe6e 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e91897d7e182db481db20a167fa26449d101b3447eebe99c4f8aea88b14b0a93 +oid sha256:d696c6e1c6a435e974c340b8aeea0e33de2b79717cca902b329b8af43cde4048 size 4977664 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/wrapped_neff.hlo index b05a40e5c9d905fd633bd247a2218d2c5a2f69d4..046b08a6d73ae052c79d5cf0b87c42ac4bd2b8a3 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_29c699a35eb0b8dda4d5+a9d440f5/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fa0f0cdfd33f14b3d65e28e1a97bd48a3fe3ab5964f83e8e92dd6251b1e9163c +oid sha256:16b0dc07f8cdc682944017bd5092bef88f0434e6d2ebe457ac93e7c81be5774e size 5134205 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.hlo_module.pb index 53e6c1ea9eb6ba3979f5354d81db9ec6306c9754..b1301e1978bb740fc8c68e603fe2b8bcf2ddb281 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4bad8cce0aef7eefd85d29624a01be2a07ce8aa67e20dacbd17a14186ea0daef +oid sha256:547b24ae1b39d13b71277a5fc16204490d540a8e25c8f73e779a7a808a3dd1fa size 430182 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.neff index df700ca3b3956e06e0cb7c5cf2004db51fa1581f..0a5662c36a60aef8d1162db7fa2059d6b9e1344b 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_2aa08aa6793c444a88ea+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5c4be9f40c1db625d9c6dfa4d66746efdcb10ec00260f6623a94a751b5a16d3e +oid sha256:47a57a75086bc877641d3bb7f6c2c96061248289c618c5e500ede12e0ee9d836 size 31120384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e01c4291c9bd46d805c1ac8d99a7501923af1414 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed64af1de021c762ba16eda1c7ae28f24f316a384351f1f4aaba2e5c119d33c7 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fa511f9c4bdb54a630aff9aa648eac0a252b88bb Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3010567314445873136+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..88d214ff1dc9f2e95ca012bddcf0bdf50fac0e8d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:210ec47218d2f9175c88442e04911929a0d59767cd11e88a600b5f7456924061 +size 588374 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..061338531e68c94010ad760b8013636d2addeae9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea05809fef4aa7b0e9fa8b0f792d3213c9311a9d3596b550c30ad0dce35dfd07 +size 1209344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..2cf45fd53d8cb7523cb2af22df69d9d4be5e5d7a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_308ca0aab5adbc4e264e+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d516c0670b2ae7a13894debac59ce93272afced1dcfd99676a316f94837a5d5 +size 1354255 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93354bd42abb66b9b6e56b127441174baa403534 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..eed265cf35a8a5290ef80a0adeca7e07950b25f3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0058240e54b46c6b0db4c14f906f09f3ec484e7e04c3f2cb6e1f8eda3c5888d7 +size 2507590 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b23ece6c63b461c1034f4025e67b54bb93748985 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74f90bab7cf259aea0daac2a556646ed4ff30addb7831a0a31f1a3b3cb58934 +size 3533824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..f40f60c89bbd8404b66748e996c003733b896506 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_31248f3f93aafaf6dbaa+cd3419b6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd51c5d89811b2361e4f8267cb657832f235da127ac6940aed8e0a70761b6052 +size 3783895 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f6abc0c89c3f16e78b3869f4813496b26c2b7f03 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abadfcaa9eedb2f185ed24c904b658ca490e28180dad7f310939be00405a3b78 +size 2861 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ce1bfca19713e24460a829bd4fc26f841a4c6e48 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3274027993637618360+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2e001b1e998ad609ac00a61566013878fa450772 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21cb4011c120f03305205b6cbd16aa9aaa3c4d3bb8d862fe6904606cbcaa652 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e38fb945f5ebb69e35b7254a4aaa1770a09e84e9 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3296693401617587065+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9c8d892b5e1b7919d439c3785e8a20da90b763ba --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227368435c1e8ffe2b46e4b822f1332a212bf4b5c866ef534ea2b225694482c3 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bd2dc03e15cf0bd3d9fa93a9bb5beb14c3844465 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3584083482496600619+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..bfed03255b01b35299ebc637711a8d58c05ec462 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5918ed79a90b94d93d230fe9d9dece2ea3674361398f695e39ea12bfcb7708 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..be5b0ee1e3375299af6ade04ac833bdec572bd27 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3677608697266465166+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..52a840c9dce2ac86d66b1b83342314024acde28e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1de91ef640d5eb13a673dfdc9be9045617c4aaaedb9e477fd8814ca7018e94 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b6de9517f4390ecbec781c554337dacb1a32a6e5 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3726318503065748382+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..096fc4363852567724093d958f6244ccbdd7bb10 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8799d2408fc1465ce0b6131489977ad21e63e23fb124c534cd3f2a643466a2c +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4d017f25652d596572bc2827e6c4568878a4e57f Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3733582788604956194+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.hlo_module.pb index 3a937948727ebd33b6e71c467d98be772f9f4205..5ee8001d0129cf64929c75afa235cc6d8f47e115 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:004a842a6a8f26ded0c2a3c6975d382b36cecd0007fc63d53f39e61f0285c1e8 +oid sha256:15d80f68cffd4942710961a2986779fbc3d28a33f9945875fcd0d503d25c6d75 size 1037449 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.neff index 975ce27d16f059714def1027cd9e0bda00ae20f6..3a25633198e3f9243edb6f591c2193a1bafac275 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_38a491bb249cb0a65a66+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7d2c3f962dd9545304d485267b9dec3f68a33752177089d19035c550496e9d99 +oid sha256:8965232110cbae756f3f06e1060c457108b9643e1e119a95cab1bb688e79f3b2 size 6626304 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f843b77ce5aca3d08dddad1907ddb8fcfcdafeaa --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4cd8c9bb30b80bbae17c37817e07cd72864c7431ffe820db04cc90175ae6c79 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1f111324f84432a3ba54d04f0bf6ed600d5936ff Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3973195210839298171+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..77fe912990ecb3204d33eeaf82d249e6dcce79d9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12093b664d384d4f227211cf30520c33cb2f168bf18efd5680e7a6f0759e3946 +size 103130389 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b8ccbfdf034aad4a8dbe268d227293c4cd972073 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fafff6c8809235ac7997becb99200b923ac6f9c9084ee79e97d7948b30d87e8f +size 7803904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..9160deab4c8483e48f8bfb8cae9c213dca3115c7 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_3cbaae1c02abefd7f494+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4013a9888058e7c0e8ac2ce33000d806be95273272575932d5e51e724e37a029 +size 8121064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..45a15c2b2d9db06c7f04d66cd9b4f2310b9ed477 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b93861fc70f22c6400c8523b59472675ee8994ba602ffd3ae398ddfae4fe189 +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..22a7de79a2bb5595d7a8014d3611c27aa4424b95 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4029365533398324907+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4ce37aac5f1fde5dfe97deacd2f2efcf2156bf06 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db4125f63f109313509b125a9e78c5ebf9f0f81584fd65adc5d09a5b3cb0e4c +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1eade5f76e45e97e5e6252cfdf10e02d22ee773e Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4102306456011547160+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7087c149ab10d3e6623e4141b6ec36b9d4b463f0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039e9d48f7f34906d77484e66a1bb4877dc8c917213d93a22dbd116de1187039 +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6970e65f20d81dea61e66fb2827d4bc167b81ca6 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_410348709543574224+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93354bd42abb66b9b6e56b127441174baa403534 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..475e9fbfbf5b38f298fddc13e8298d8b6fde22a4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b145a643ac4afcec643c5a4cf0003579212a43c2ea7b2cab1f7635446c3c40 +size 2458664 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6e49d477e0aa8132d206d4e5de1cbb0db484e609 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecc4a985b50e6be447dcba49851f6869f4bc0661ddb70c5528f11b5a721ac0a +size 3492864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..951aaa09cad090316c3428760fb681da1e21e92f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_43116d82b5805ba3ae20+cd3419b6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58e441608e9340359965eeeb8e0d0229dfbd7a847939c284e69325334c98780 +size 3742824 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ed1574fb23309367c7a33ef2b9dd26cef56326ef --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66fd38fc8debaca681c6e8b774eed44b00d15ed3ae3a91a59bfbd7787ee2dfe0 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..89e24a099fd00af11a6144b4d66d6c693fc8b7d8 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4475477153125485388+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f0e99b73455431d4ffbc13231cd3aa086c125d5e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f845b504c0b19d058472e862c0b64990746c7410873d9b166dc87bbf767b086f +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5917b95c3d098694b420fee28f033963c57a283c Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4500629659777983660+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7a53155c3a843137a7789da264b465d33d564550 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb66bf82d28c84e4a5b045ecdf4b1020fcfe7a56c6081899742b495d7e5e81af +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8c90c4b79fb2f8de55fdea0f2e029a59e6abb5bd Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4597534921574083181+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..784f0110ba100a90eeb593ff1f371b0082fb5213 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7fd7987a874632f4273335e8533a6eb70e4723fe24ff54c239377415003ef49 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f2d95e05bf505b4bc03372c5d34c3295b1e8a00f Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4845384173285952555+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4be9c9441c70a6497381a14a66cf92d2a238a41c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c677c7bc44e425031add4e8c2ee5035a5d8e3bfa4a20b9206a9280479719d9f2 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..558b6e1843201702c01b1bfaf5f3d9d4028270bf Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_497689108418605143+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c9c6493aaf3cafe305f72691a8490215089d8aab --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df61ac9ae7cc3b8d0b92f84adaaafb47ca0c3968defd912edc4a081cd7c233d6 +size 104317794 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..21fae107ff8e57321fd16dc67fab42c1cfbb2f53 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_4ab214a26135c9602b57+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2632ba92083ecea71ec19ae561a0ca4e56249ffbd65c624502bc366b7b3cb3d4 +size 38933504 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/model.neff index acb3c198a477b12cd675d865bb92ad6a5dd85727..cf1cbf30b6a89edd651cd279901e0545ae430391 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e5625dfa5e600d8aef4ed293645867163112521fe828fc0e5856335ec28d4a4d +oid sha256:58a936ed98bc686ae01cd1153b9753578c84db9043f3fa8a00427c3dfdac1541 size 8827904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/wrapped_neff.hlo index de540af2871da302b9f59ee3ca8a3057a26f294d..adec45a4b132092023d227244717d74368594cca 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5062c09b51ff9154f184+a9d440f5/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:129017e8e9887bc15ef819527db3044b0bac79a328316a8764f69925a2ed1a46 +oid sha256:47691a6ce998b1727a0ba56f08b8984b9ec94b2eb6b2124dea4846a9bc9348b4 size 8965270 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4eb6512c8c76ac8737c6519403b66c20b91c275e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faad67f60f451d7be3dc1de8b30fb20285e1c8e09349dccee964d63daca6655c +size 1582 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9295dd9e73171cc011f67c61dff5b54b2ad0fe18 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_514904626320229970+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..77de4f4bd225419e1cceb41761e42d784794d0a4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604974ae0ba20745debcda04b0dbfb0cb379733289d5afcdddd9e5c7e110388b +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c263d6ec49aa16f7a202c70b5c0fc03bba902754 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5226137176673983632+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..e8d3af0707b6329fc79d8c4ec9acf0691b2de059 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_05fa1c72-7802-464d-9e26-0892c34a0f54/compiler_workdir/Llama3RotaryEmbedding/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f1e2473c54cffac949ecf31d3b6ec636c290545b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a29d4cf27aec9af90e53324eff9ee69e033679482f4016a9dd3e5416c7c68a +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ab28b5000cf8134123b05e9a1074757177b51459 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_552d1a3105a0e273b50a+388b7e4b/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0bc51e5f7b01eb5992ce05e13f8fbe0e68baf913 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df936becd64dda0177d3f57cdc28f9f36c9b4ec17b364b1eeec0f2869710a0eb +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2ff114ab0f0f3375e2d43aa154ffc40eeadbd798 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5533629969901078552+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ec3e04f0ffa8bab5b7331e2d4b877f2031e844da --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d001874c1cfff56a7406c62ab384aea6aaa95dfde55a4fdfe5b23b9a21f01ed1 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..01c3cd4401bba2b65bd48ad39c9c439981549124 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5562114832786762356+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..052b6e009a7e46218f341bc8c2c1e7ddcee4f23b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3882a8d688fef84e1e5f2e7a376a851fafb60860f697b26f47b109236267833a +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b2b633ef0188839994b6d60615c4a6ad94ce9cdc Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5895476730067979013+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/decoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/decoder/model.neuron index 98dc7748d0d8480bd13d93c318944c36a1cb55db..d45c38a214bccc8cc84cedcbaf685e0d3a87f3b0 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/decoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/decoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8e7ed179c776a09dd00aaa5347656ca55f30a25cec07b7fbb278051a49788c69 -size 633172 +oid sha256:a9d1936dd388b9f965a4e1b24fedb24fb7c6a748789332d0d885bfbff8eded56 +size 633236 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/encoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/encoder/model.neuron index 972416c09677f07c83e9aa8e43b6e74510c21ea9..baf05a201ecf596a763c9179f155b1851be99b38 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/encoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/encoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8bfc4ed25f9998aa656120620c0a3c0ce35bfc8aeefd672bc1695585a6bd1320 -size 351030 +oid sha256:12ca8cdd5d2f8186de84a66171ac1d9d021405c8a3c6b37c33e4945f018f175d +size 351094 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..806c1b44528c71e535b60fadd883a19d07953e23 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20f04fd44d5c3c60b41d274465832a19736ef191f8bb0e11d61ffd319fc90dc5 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d219390357a114c67e8de70ea80b71355fad35f2 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6041836500170073779+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0f549bd30b89ae1398077ad99891f27c14c15c6e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:352ab657e2f088fc7fb97e52d94260befdeb0c4e7827b7e4e2e661696a05f9f1 +size 104207293 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9294319ed90b5da452f4c0ec7c4d4e762a93b949 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_63cd0b95d5730c3ea2ff+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63edb5697fe7d15cfecfd4fbc02a257c8c5b7778969bd81dd498e64221b1e039 +size 38892544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/model.neff index aef624e96780b8128a84328a86e64754bdf2ecff..cfab72abbbd4f636c20ec95531306f17cc606b5c 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c2ee99ed969f1b132ca9cc586347645f2327b3c508bc60094ebbb5ecb4a229e9 +oid sha256:ad19c98c3e197f08503cf5b7f699cbc34d49fe85c2eb037db0d5910839f04be4 size 1434624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/wrapped_neff.hlo index d319aa149fafad6edb33d2db73c3ecbdbcf4b797..f6db22ced5efb7460d0894cc68803e016d0ec01b 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6642d35addb60ec085b1+a9d440f5/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:539ad2a559b69dc9d11d0151d61aec1e60be16b36761018c710b2d6ac0eb002c +oid sha256:49c69b1f275e71c1fdb46255940ed202beb451f5843b221202dc57b2d924a214 size 1521594 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..bbda7847f15c722522e0633fb35886058b796503 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c20b03b5f808b1728a8ccbe18b35db71159daf9aab44dc54a201ddec4b5ce3e4 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..665e94ecd2eedcdc2f9ab264ecf860fa2e5801e3 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6808350649031706313+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..341f984b86cd0d9198450dfd971c77e4acd21fc4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7deabae600784856e767b65d057075165713745a080fc73088104d5e622ae7e +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..880e9f58ce9375b2691f9d2456b875ae5d265b13 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6819259119391355174+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6085784586e5c531d521096883b6df01c2dd7e88 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4941f7a4c2773e1e362c0926b970972364cc6a11fba521df1bd85f6be5c35886 +size 103130005 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0b82921b88315425b06a9876e1dd89d67227a9b3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9909a5e54b3523d9adaa4e07bb3ca58d752bf840ab774ae32b9f61dfecc922b2 +size 7721984 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..79845144dc34aadbe2d2b59cb649a6b052f684f1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6972265ccbc24ff4448c+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96ddf0267cd407e73f8ac27a10f628bd6861ae452af4627fa616a624cbb99c3 +size 7996904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..691358a8696986b2175a3ba92c1e7716f5225be1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a428bd8f83c4a722785ed440b47277011681572669d6eb5771db9d093585f13a +size 104067050 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..aa2c39e05a9b2acc7dae86228d2ab3e233d5c3d6 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0fc0d34f44ca4b39e2257e2fc912b5d9662e0cf5c5772c7343dd108a85eef3 +size 11377664 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c16334ea6373753c8d4d4e18a651af93ea7c8982 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ddd5b729b9e4ecede70+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a48a1ffb1043c4f172ef65685fbbcae53db0a3670657a8f321d47245718a5a9 +size 11652584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a078c3548bc0f03ae31ae83196df65bd7e392080 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8bfff8477709368ce31a7d33f42990e6a2b02331bea021ebb35636de81cc5e +size 588374 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0962cf8cadb8e758368adddb3d5f9eb1b3656cc8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73bfb1795a540ec325918d8be5f6353b1ed9b72acec14786fbf4a5bd3e497694 +size 1444864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..1a77c064d99dacdfbe7f11b3fd3bb0e9b1a83213 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_6fcc6140d0bae101d7db+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbebe9538a508e045da52637fd9411c30a6712987f6551864b5977d9c860c5f0 +size 1589775 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3d4c69632a75fc4f250328eb60993734b08f4c80 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df760532a487465927f6e3e04bc6493c7457718f0dffb3e3896e3c092c4050b +size 2861 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..711c5b85019914d620eb4d160a407382b1498c15 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_746058432585752165+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6da10c7d19e56bcbe9a2c06c2bcbff2fe71f666a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18454f3fd66c63f196e97f6d51c70a03d817c5adb05a90e131b763d7a39f3e6e +size 705694 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..311bb1b8511719351929ad02720e2c1681e43afb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7492a59ff398cdd8c726+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7cbdc249ada77157539793ec5d2fbbdbef8f31417dd8503f1ea022f7b250ef8 +size 19631104 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb53ce53583cfe21339b4bed39f5fa1a679cddd1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b0ed93ba7fc61080e22cbea3a0ec2d008be74bd2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2553215122056d902b1c55e7e737da5a9dafdc192698ac91c466be727a94caf7 +size 9674651 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/model.log b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/model.log new file mode 100644 index 0000000000000000000000000000000000000000..438253edebeee7c1aad6e6132f142d782fb65a32 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7557177e60b224d7d0cc+253d6470/model.log @@ -0,0 +1,3 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_7557177e60b224d7d0cc+253d6470.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_7557177e60b224d7d0cc+253d6470.neff', '--target=trn1', '--enable-saturate-infinity', '--enable-mixed-precision-accumulation', '--model-type', 'transformer', '-O1', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2', '--auto-cast=none', '--internal-enable-dge-levels', 'vector_dynamic_offsets', '--internal-hlo2tensorizer-options=--verify-hlo=true', '--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: [XCG815] Estimated peak HBM usage (17.053570) exceeds 16GB. Neff won't be able to load on chip - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. +2025-09-11T08:10:18Z Non-signal exit. Backend exited with code 1 and stderr: [XCG815] Estimated peak HBM usage (17.053570) exceeds 16GB. Neff won't be able to load on chip - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. + diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..07a875780732ce90dcfcccf4eec00bb91d737f62 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42a0912a6557ce89d664bd248e9616169077869e62b88b1fc1bd091849d285be +size 1291 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5e5a1e06fe9e208606fb927b234c84ce375accfc Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7565122625112339535+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..262c1aa8943e6a2a3f9296735a32dbd09d1131f4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a2f12f6bccf30cc2abd7dbbc5b47b3b17004020bd177e6b4e76cbc51f1b577 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7e856ef66ed0ee2567689bf77ff60d459e38ef49 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7619465509971901533+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c4169c7a9a63acaafee70d76e3d484e282f53713 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa596c0a9f77d8680ca3227ae5069e643d3eb7d8cd8e6233c2c3646a33eb26d6 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..67dbc35183a1cf223c19be7ad41c10066cd93052 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7731931779321626430+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1b55bf771168625cafc7c7fd42e95db99e727884 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e21d06bff81aafa11991b58f80064dc5a04db71ebd537651d4d03d6a7b862b9 +size 88413 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6e7a825ab6fc3b259cadd8bbb6b55cc859221ec5 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_7c3334ebde4334499745+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14cece69317980d8decf5a3c4ed9965738503f20f8988596601098e37fb3fffd +size 308224 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..306076a9bd36c3ea5fc0e515e72b3e5ac5234475 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ea22281fc2add77e3c3c6711d133bc46cf99b3ee28352feb135c440d5c9170 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e81989c12d6348bc2e5d21a385af226620842e69 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8121416822490248166+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cc23fd3402c8a943a80f911e7a32db50aeb22f14 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e849d859bec3a78845d8d8edfb39d11296a9cdfa2632cfc46fceb0d4c17f2eed +size 107879818 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0d325c26a67423043949b2a3b82afe3979f37052 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_826fd2949b06a672b9bc+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9271d2c6a64d31824da4da9ab85b1f57769e801aa053e05b8b63109c5da7ab5f +size 42476544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..db71d4e3106206a25053761dca771eac1b1131e4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19706837fa8f629355d388fc369e1998698d2c0f03aa9a93aebce4592bfd2715 +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1abf05d24ed9d94e0c13f80903b1bb189c0b29a1 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8410360898827170920+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.hlo_module.pb index 7891f4c9a2c75d1b782d9143d6b23b30bbec9dcc..a1a266c9d0f31ecd5a9e5f08e8ddb43834bfa43f 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6ffeb8e9ece16ac41c4cf88706d49bf0b121145138f40c6107f5f96f3cb6a275 +oid sha256:97a37fa929a4e10a1de1ddba776b80db22cb13d5ac4565706dc0e73a706f4c97 size 847776 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.neff index 21921bff2561bdb6bbf49a3af3b97b0e63dbeac1..35fd902f5a055890c60156dc5729f1ca431d22e9 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_85a3b00cb47dd0b8aebf+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:134d14dba6aae5338b4dbbc3b448710798a58d8b15010a09d424dfe2f7a911b5 +oid sha256:d805b88f127c5709846c5f7ebdb89770d1623f5a5e6016c3033a40eb3aaf934e size 27546624 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93354bd42abb66b9b6e56b127441174baa403534 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4e68c099ba73beee04e489e7e95d36ce8ebf6264 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e44bcca2d0392946b04d76ea0c08920b2977dd8ebbe62045de5b09475eb6ee +size 3545413 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1383d31f337094b7e15f113a11a1e9f17bd207e8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256f25747a13b5e7d2d90243de1bed6f01d5792cd4a0597b5a4816d086a85af6 +size 7035904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..156a15f92251fc61f68ca7961394d43f878e3bb0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8671664c95847cf8d9a7+cd3419b6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e2c5a5f4491cfbd43ac527c4b0bd3a0b06581d2b6f4dc4cf9ab1700ec82f2f0 +size 7287366 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_869715862416998377+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_869715862416998377+e30acd3a/model.neff index 8cff81234109cc77899194125e20071944f55496..d5aadd1b622b08625382568c5a3c9751f5850b5e 100644 Binary files a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_869715862416998377+e30acd3a/model.neff and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_869715862416998377+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..dfb3f9c17cd0199cbef0b85ad4ad19190fdf01fb --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4672984557a6f98db9bc6b045a165de6201d8bdc3a5f28d5f23a500275add866 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fab50bc52b817727587654f34914b7ae09ceee41 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8730286359330870368+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a7e25eeb37121b478d999b750fbcd88e0bf27d24 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394ead2842be9fad710a8dd2987593d6340a0f6bf739f2bb6bf829d1a65712b6 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0311dbc94d6d0f14e3d314508fe0f55d0624df98 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8882312230130555847+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..1ae3fdfff2e5d4e617bfc90376a07f658b87060b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97438df91d4087b7d810d80603732d393604b9705b49b4adcceaeffcd4fb5800 +size 719452 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c427c5a34b89c4b57044daf5565c467196d42600 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_88c363db429237aad147+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1477221ab961818fa4293d5ebc1a25376bb914cd17d01b5c5979c4575aaaf7f4 +size 19835904 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5ddeed939f2f1ae57441a94835c1c3e372b31b0b --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ee5278b859b36037969c475b41338dfd901468e1065d8fc4579aaf4c13e158 +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b9fd29fc8a8c1f310c8b8d9e6b8fb19293d19635 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_895360613944277627+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93354bd42abb66b9b6e56b127441174baa403534 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b7c399964b3ec27bcc58726b07bc431a2dd3a471 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d38232b18f13a6843f2572e1d5ebf9f675b587693f6af9893523e2a2c0e3e63 +size 55986 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..bdc93df5a26530d93722510506e94cde951b3836 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04f368ee98a74d289c5725ef9e76b3b8204efb107e50754aa4c57e0b9f8ff0d +size 297984 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0b7a92060e44418d0fdf405bbc746a3f993d27f6 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_8954b51aa51e21a41d91+cd3419b6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75baec4f7e9174eda684e3943cad7e2176f45d2c9dfa3532a1c21fb68e24b48 +size 306898 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93354bd42abb66b9b6e56b127441174baa403534 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..109bcc0f4bf744e8fb75d9cdecfccbc5ae8c880c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1baf13daf477f131f4a0605183ccd7855c12e7fad5122e3634807a697266aff3 +size 3548477 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7cf9ca59f01baecd3f94999e4f1995245a080d00 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d430973d6a80a63feebf4521fa290aa1860acae23fb344a68c94f6390b9c13a5 +size 6083584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c599afe31ec2df5646d4c787ecd7689cbdf52f89 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_91ccf5a53294ba164897+cd3419b6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b708e8d335217684701b929f706c8d5c0c7a625f4027602d07a952a038d2dc +size 6333655 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0fb4f5a0968de7f41688feb865adf3fd1c65cfa8 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95ac4cb2f31241edb0bbc24e895d46e4b98131b4e55e5380122c86ce200b2f0 +size 1146 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..98cd7787c5be4b7245df47d7c5dab3d9ec6e9f65 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9386326336670335099+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb53ce53583cfe21339b4bed39f5fa1a679cddd1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..53165f920319a3c44d2da0c68c8939598f4e352f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ac335630a721f2e3de37d63a053c4199b2c39ad751a52b3e7c05ee260d9efc +size 9665709 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/model.log b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/model.log new file mode 100644 index 0000000000000000000000000000000000000000..c98ccfe8f51f8a32764cc444cba74ed9b6ef23df --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_939df082e49d595a3158+253d6470/model.log @@ -0,0 +1,3 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_939df082e49d595a3158+253d6470.hlo_module.pb', '--output', '/tmp/nxd_model/context_encoding_model/_tp0_bk0/model.MODULE_939df082e49d595a3158+253d6470.neff', '--target=trn1', '--enable-saturate-infinity', '--enable-mixed-precision-accumulation', '--model-type', 'transformer', '-O1', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2', '--auto-cast=none', '--internal-enable-dge-levels', 'vector_dynamic_offsets', '--internal-hlo2tensorizer-options=--verify-hlo=true', '--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: [XCG815] Estimated peak HBM usage (16.329037) exceeds 16GB. Neff won't be able to load on chip - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. +2025-09-11T15:00:22Z Non-signal exit. Backend exited with code 1 and stderr: [XCG815] Estimated peak HBM usage (16.329037) exceeds 16GB. Neff won't be able to load on chip - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. + diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..934b21876914fcdf9aab30fd43c5d2d458dab872 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3caca14697a55e9d583316a1e5009411087bc4c2c21ca1ba38bd1d90857ccbb4 +size 1585 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1fe7bade1fb53e8f7918dc8cd3b870ff8029528a Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_958184176017870682+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5a9a496595b5357604e6b6a2acc95580f996756e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada6b6503422ec5090ed0ed680e54be4e4f63bd6e02f8406896e0b3978536633 +size 665847 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7036a39c20bde38ea3787bd2c5df264ba7771066 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96aa20706930df3658e1+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951c556e5bcbd4830b7d098213dee36b17d08bb83852f566c21134da5f20f4bd +size 21648384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0e4e764c67b2b733f69ba66834bc26e694ab9473 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffd42f55cc5c81b6313f96e55873674d2133e9043a79afb6e612b5556ccd1348 +size 90039 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..aadf5a9f750f56ca0779fbfdd84f77a2b2da48e9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:599762ae4b0636a1734145c644de6d9b73a0b0fbe8ac978b2bb8b60e78a53d8e +size 236544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a2306779787c7af0ffa2ca58209574c1b9f66270 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f456d652b2d2b5604f+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f71e39c17a3411e18568c55b52651b53ab17e1d4e8b529b9ac921e9cee82761e +size 247185 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..53106159b41032be7c47dbdc5a3c64a8376b0ba1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfdc0760a79380ea1098fa4aed18a291ebcb6762914301413e21bf0d01ae0bf +size 81089 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..96fc08cdd8288b538319c02e4ce83c17b7deb53e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_978910d0b56af3a47501+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea708693657b4495fe8c265dbfe08ff697b61c8937de5b2b0abd16b63663a0d +size 226304 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..32157f229be17480afc9e02a7ed48ca0cbc8f22a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6fd01a462989bdb0f9262cf9df66ee190b67e888 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5db9875bfb45337adbb610dd67d5895463189bd817618cec70e55fa3a40c26a6 +size 1584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..3c890d884c056a40b01de1310cc3b253959a3976 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9817560555747346786+e30acd3a/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..640a81f6e36a80e7e418419a201f1be054ddc5ac --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_37cc541f-5422-47c2-bfcd-2c2315456b7d/compiler_workdir/AttentionModelWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8496781848c02ecd308b5b2c5a3c342b702425e7 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e79a5cc325f9a317d158d931d75ec73ae1cfb16a4d83343a2593edd95d0044 +size 8979 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1ea58ed387a4a9be184523e080dadc16aca6e43d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2921a248a0a6d5ac64fe039f2ab144f42edd9de9726386085ae64fa04a4abebb +size 195584 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a23a7e653e986e39df5dc10e6e17f49231de607a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9ba467e042d35e9b674e+183b369f/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3bb8d33675f04c83039615c88efb0b98876a94b4057c272d3ddf2fbde3eb98 +size 198230 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8fff47b5086ee5079a230a53eb41a92acac61499 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4068082d0b537a4ab9ca1b9bbb4463fd32fdcde75aab900c7ef7212ed55d98 +size 625621 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..96025dc2c721db659d1380875a741ecbd6e43eb2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83363cfd17c5c2e282dcc95246a712b4efd20bdb2dff7820bad9cbf508e9a6d3 +size 1168384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..878eece4f8d62eaa3e6c0c74ae4428602b39db5a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_9dc23dbecde949377e19+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec0bf25dd121c1fae30f00e47234de4dff684e44867a34c29fcea84ae6704e2 +size 1313410 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/model.neff index 5629b4356295d92253421403b140dc57b4e15466..58fddf08f26149feb57540bfb4b90f99030133a8 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4ad71d8b6338ff2c14e47e9b22d8cfb8d91979355c7cf8427e6452fd95f370a2 +oid sha256:245bada10f4582fed1ceb499a5080110993224a0103d5ecae5a07f6863258d33 size 2233344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/wrapped_neff.hlo index 2559fe3b1db79fb84eae71fd231ba345d2f05441..157566be9c1b1509d132a3c49247b4807c32707f 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a063942b4ff1b0d8f4dc+a9d440f5/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ef2a9d2c8684d1a2494eaf6e20339f67a87ce9717662b111f9434525ad99ef4 +oid sha256:d4c95c102a8729ed58b78094ae57d047361ccc53a7fc3b96336843930bd4a291 size 2303088 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b5b48885de03cb92ef95ca0e2d8b065a979ca57f --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49db54c9f59a8ed22017758ba4c3885791e87ae22f6aea1a65af2d2fdef1e90 +size 581894 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..254004655177d848463d007923eb35b595989f72 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a8844fe97439b2667680+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0207bc53613864486455ff22206b0a4f31d43ccbbc342dc4f56e2d9bb9154c +size 2724864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/model.neff index 62c08c0dcf65c3a657bc6761c5570bb4d2599e37..77112ea337b384246bc1cc5e465864ac7b3ac42c 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3943a35d4a79c83f1ae10ba16c0785b81d73494ad9f043f5c51ae1e6ccb160ea +oid sha256:b303572e10366024665d0c7b8a998379ecedfcf0daa4c490590e33e3858238e8 size 4998144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/wrapped_neff.hlo index 7d3ff5c29bcdcf392e80bd46f9e323f37b752710..50e0ff2876dd4a82dc79687f5f3483c3a528e5e3 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_a9b761f317f27ca2c845+a9d440f5/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f06dfa5266a83fea6bc8becedc14e5393fd3765894bb33dcbb1381dc870cc22 +oid sha256:5af64a54fc92984175f1f6d3cf1aa627df4ec8abe31d4d3c033c61a8c9ab55a8 size 5171427 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb53ce53583cfe21339b4bed39f5fa1a679cddd1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..80148f1d687144285b6b69f925994b0242431520 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2332baeb0d308febdb97fcb05ef1ad4e1192e9902603bb488b0381d1bf94380d +size 63776 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e4715ebbf1325b1f2a278f25831fdb122cac2f33 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ae0fabd3d0b75f0150a0+253d6470/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215b39aafe9a55e761356d8ea81883bed7b6f85983535834c3564e379dfd694d +size 318464 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..705784f85650c65ff8d1c44a8e66b14b56a345c2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f3beaed47689b723e87507fc62eff03bc6babf99ebff995ce214d8f73eac33 +size 636354 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a3a571f1bd26cba4919495fa47f35036477c9071 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26ef1c1e63da491f0e2d1480b95e0e2666d55ea047709aa20d737ad3132927d +size 431104 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c722cf9d1e081d2709c9cf81223a66083e828fb5 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b576f2782b3f3348dc52+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:586be70deca88721229e2ed7fe145b1a6f9d21b9ee7a9b02a7fe62f8a938adc3 +size 449015 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b75a1633e11cc79ab173+677eeb9d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b75a1633e11cc79ab173+677eeb9d/model.neff index aca14539804f206fbd228a8b100b7570a87f900e..29bcacf6bf3f8f8e631e5aa30ea9b6766f0693c0 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b75a1633e11cc79ab173+677eeb9d/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_b75a1633e11cc79ab173+677eeb9d/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f1f7416533727b1fa0d82acbb80380a8156a7a8e53fe897f87fb3a7d309410fe +oid sha256:0dea24cc079d5f17838a99d47df885b1511b36498593e63aa19a6510d978c264 size 2694144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..de0707bd8623b511536894ce23bd06617ecbeb15 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f660949bb2cab99b5089891b82c30be2231452ec8de9805200759f28a28d883a +size 104367341 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..622fcd4513272e80a1d9268edb2d1226fe34fa94 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bbb0c02d6e06f337e549+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9293bc3c4e67b2d20c5686b8c1fb26107ef467b1c29589845f6639e1dbbae0f3 +size 38984704 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e39362994c1679aa5165c7d5a6df2d8dec1b4c80 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15362c6d52e74b24ac0eb1eec6b9301b4c06a679a07d8f7d9c8c08ccde70eb94 +size 80739 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..7c14608b0f8ccd6253325aa5ed50905410f6f63a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e68a76f10320ff5d42f050fe1c47771ba6cbacd17ac69f38f98df3726a3331a +size 216064 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..16b339ba3687a755a0b13cdd5691f2dfba9fd212 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd02c2f7c4741c76fe15+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd62275e4f4cda20ab569c4cf4400e0cf00f54a14dcb048cee54fd347acfa501 +size 223802 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cb6ef7b1205d1d19bf46+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cb6ef7b1205d1d19bf46+ed72d204/model.neff index 9c3abcd4b1116e32c1e8b91daaab7543c1bee18f..9db050ed48195749898ae0cad8685be0fc268329 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cb6ef7b1205d1d19bf46+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_cb6ef7b1205d1d19bf46+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4492649f3ff048845468a54a5c5784fef7a4dc5f56df87f811e1db00990653ba +oid sha256:a19b13f8bbad710539910031ea87d11b9923f862a5d17bc149fc0657894a76b9 size 31878144 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ec00951bc7ebde2143dfa72345eb3a44ed20f182 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd153213a2751e0d15100aa0467bf7538b94a0344bd9890daf2705e96ac1990f +size 103179258 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2815497496f5b360643569f55d27414adbd66e0c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be1d76828f4c564ad6225fc249f3ddd933295963bc2ef353ff97a48c337e4ea +size 7742464 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..57423eeb950cd6829a93d4a532c610c78db2a82d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0af99bdae3af4d95a22+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b434e9136e6af6215840183871c0f74e8652f547f35b2793081455ddf8ca610c +size 8059735 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/decoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/decoder/model.neuron index e508428cb594c801349275dfcf5fd1e3bf8b1caa..96ca96eee14a7820a06ace716cdf4f74ac59ea93 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/decoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/decoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a125074fe97f2423bbd01a6203536371aed73cab8724c49156b56f13ab714258 -size 621268 +oid sha256:b016e529b0db94f982dc684c6cd597ff95142018c4401531e3d45c334ca808bd +size 621326 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/encoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/encoder/model.neuron index 501702fac626c05876e6664d6955f70236f3045d..2516a5cf490371a0afceba1f02930b588ba9fdc5 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/encoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/encoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b783ea6ed00b83d80a1c1f7198ccb054d0a458fb200f6721567b144aa81ae53 -size 351030 +oid sha256:4dd637aeb4e611e2a48213ff691ba79eaa6d693c11e6a71733df8ddae343641a +size 350074 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..55f45c3a9863883a7fe6038b38e200d534136a49 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_21aaf1ef-8433-4296-aec1-8c76011195d2/compiler_workdir/AttentionModelWrapper/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a11cc062167102b0f4faa9fdf16388d72d9e0015 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4590b82eb167fd46963abdbb717cc18cb9511961a3393d100eeacdbdc45b0243 +size 11280 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..58be1555d80c8c6cd79dd9505d6260bb1772e2c7 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c76bdb8b377803e1cd75e7006f8021eadc4675562936c50cbb4be6c7648f4cc +size 1096704 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..0919735f41c436aac37829b035450689e61a2c1e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_d8d9690a1b9d2bd4cec3+87c2f0d1/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986c0b70d2bf415feba62be729d104a13794be67c4cb653c733fc426dca5f95f +size 1099577 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0d2ee3ee46bf15b601812f4712bf5a60de58923c --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c077b146c093d1094b99be7d6233d2a6d03d77450a33172f6a69d844f35002 +size 665566 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..09a3c46ccb7a631ba4b7ccd46a1976a29a273b89 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db25850f47f3c97209ab+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a435429abb26d37524d78bf65172fd6ab2172cbe033df03f49aa8d073542eb +size 492544 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..91eb5b470d3095d426b6ea9548fecd0d9bb4c161 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c40a64710bd37c5dafcaa17195416b33bf361c0926c511a6c157106f56e657 +size 578515 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8eec58394bb37cbd1a4c3c196fc2b459ebab7ec9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6376ca6fb4233ef52b9ba16a63525458a28a39113643a6428e024b3e198d01fb +size 1444864 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..c86a717be1bb0ed8c7f4a43e5d7fc659e39ef102 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7f53e8fbb89bd8136b+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae053162739c06d034e10b5b8c093fe5361328f9817cc130d884d84301f50c4 +size 1589890 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..437c307e7f1d7194897bd0ea577862fac5f47750 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_5a18d9d9-d482-48bc-afe3-652891d43a54/compiler_workdir/NeuronLlamaMLP/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e6084ce6d845ff91b01c0cbfd758d24019f38ef9 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a99355de7043422bc03a8df795afecf586999ec744407bc4fbffe63f002ba2df +size 1931 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2b18d78a211a997c4ecc2401ccb0b3901feb12e2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f5e1064fdb76a26a16986136d6a624bc088a8246ece8d51cb1029ea58ec10e +size 113664 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..a088eb7f8a8bb13d1bf2b2a7f8de917e0f97806e --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbb440cbea65d345491d+e4fc2c3d/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7149d47a6240f4a48cef14bd8b964a41a5fff71250018d71e660358ab25b3299 +size 115643 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.hlo_module.pb index b8a9679d389721fe5e0b7e823b10ef0e15f4dcd5..2e8321f27f38e54cc06df334847b4ec87495997b 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:faf230a29d7c5746f640a9b189af232ed164e806cb1accaefe12c42979cc1673 +oid sha256:eede4373b2454c24f7d226a16a1efa44391995aa3e7e7cbc8b4af8aec85bf412 size 900724 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.neff index f8c74c7c17b62eacfd5b43a3732e6406835bf44d..fde37c42837586b74e95787e6ddd852c98b72c7d 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcf9688803fac8be3bc6+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c8988d792d050311cca8b32114e026df9b6bc8cfdb6c0bfe28ab8d2572da1744 +oid sha256:e8cbe181602df06148ab18da3141ae57a33c8fc4c36717b3f59637b742783ba2 size 5817344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb53ce53583cfe21339b4bed39f5fa1a679cddd1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b64a1697759c5c559a7c1e9109cdfbd2e0dc8b76 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fbd912d9b5ddd548a60cd6f06caf6fab6c360df519845d87f637cb6c1b6e724 +size 9670898 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fe9e2b8fe8d013fca177a18e9957a33365fcf259 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_dd67c7d76a4a3b7bc5ff+253d6470/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb3918c4f75e7e4dd978ff5a82d00e9547358f20ac608a6fd40853297acca6a +size 17439744 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/decoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/decoder/model.neuron index eba3f1b9a08a81bd5109cb023b2403751a01d3cd..d4611733bffacfd496a35fad9e4bea0f87864843 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/decoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/decoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eef6db75fc46e7de94c915df2478eb1903e5bfcef82375a6efd61d9e832cec39 -size 1191764 +oid sha256:b80c82c106b87f1642adf055d6ccb3cdd86256f548428faafa86034794404dde +size 1191828 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/encoder/model.neuron b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/encoder/model.neuron index b58f03b66612b5e8263420b251f9eef61a2990bb..93f48730f12ba941c75da88ec403650bb31b6a67 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/encoder/model.neuron +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/encoder/model.neuron @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:67a159b1dff08a90c7d68e4183bc8e88c58e9c125d0f5310908f0b218529c3b4 -size 350900 +oid sha256:2e3fcf5d6788278c0da76de1c0ccb5d7c3ddd39af9404094ba07cd213c650772 +size 350964 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..cb53ce53583cfe21339b4bed39f5fa1a679cddd1 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..fb2a94b3c2839ae00c8cc1432100570c2a7c7324 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771da6a5c18eebc304cca5c020b4d530eb3efee0760e3f5fa09bb7450e1d7f59 +size 9621086 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5fe0f8cb744752d9379efc35ae86ca3f4ea02cf7 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5e262df0f4573dfd367+253d6470/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd1427362c7fca5fb5fc50a45d02bf2906ae40b0d9c9e428954efdc17841b89 +size 17409024 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fd50cd3da7de1eb5e77056dc4c1acab7b7a6a90d --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--auto-cast=none", "--model-type=transformer", "-O1", "--logfile=/tmp/nxdi_test_a2a3faca-a868-42aa-9426-1c8d236b46dc/compiler_workdir/NeuronRMSNorm/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6a2752c25c9f7e1092e2b55c010694e168610ce3 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c774c6626fc91684e924b843c1fe807dadbbac6d8a8e19443663b43c13eac35 +size 1165 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ecb3d6aa6430d0a29ec49760036a192027e67486 Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/model.neff differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..2dcf8fe239901e50b1d1c294186ebc26334195bc Binary files /dev/null and b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_ee6d087df2e1cce2446e+62cf4c7d/wrapped_neff.hlo differ diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..93354bd42abb66b9b6e56b127441174baa403534 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--enable-saturate-infinity", "--enable-mixed-precision-accumulation", "--model-type", "transformer", "-O1", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2", "--auto-cast=none", "--internal-enable-dge-levels", "vector_dynamic_offsets", "--internal-hlo2tensorizer-options=--verify-hlo=true", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..791a7b8a582f433cd6e5ffd08589614fd9b25f93 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632ebdbb83a6e8aeca497132602314bf9294c422f665e1cb531ef57d0a392070 +size 8944812 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8064d2995067b255360ab5726f53b714b6c7cdb2 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a168d7bce50b39b9770ed7519cba29a18cc644e2ef0c6ad535b822402bbe8bba +size 1977344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..38c7bb883e4004909c2a0df8d8f5965f24f49278 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_efa7fe965caa79aca41c+cd3419b6/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0d939811c2a42c6c897da50cd46b7e5fe12620f9127c184da98311cf280908 +size 2249687 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.hlo_module.pb index 9f21b06d3e3a6a9b5ec4b90cc3e83077053e68ab..b2ab452d9ddbe7e941b15dea1c5143d6f2f8b1c2 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.hlo_module.pb +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3f348d7b362916cd5c9ae844f1512726d3a96dbc7698bcd652a48f7cd317ac87 +oid sha256:30865aac066f620329c25ae3bcc4ab61140ae94beefd253a370139c970315bc2 size 1036280 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.neff index 30cc1bdc64a51cf2d1ee41e78ebd1f35c6d89f77..73c854522789ef93794cd120cf94f0b88ae729a1 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_f9ed5e3ab30730f18597+ed72d204/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d92b43193ac64c59582f565c4aec7d1ed451e489a00f042d015bbd0e8c67cef +oid sha256:7ade42c669c083ac77bd9e757120cf37c07e06032242b4ea18ba5431311c8549 size 10681344 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/model.neff index c60c7ed4c59b48d77794f82525223ffcfaa98f1f..a383382713e6222f7f183ad91c13c67fa021d7bc 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/model.neff +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:965e436898344a1794a7485a6d22c9270a361cc0d1708fc79a009622a4f1024f +oid sha256:ad861842425dc2da9f200172d770c01d1923969a81a8fdedfc5c6d8b33e33d5e size 2612224 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/wrapped_neff.hlo index 881790075f7406b5325cde84193ff6c94f84d907..1f3df519f62ae22342cf1831077f84c377555e70 100644 --- a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/wrapped_neff.hlo +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fdd3c2470676e1b82f01+a9d440f5/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:89b05680539419dadecda1725b6115918e24721e06b15bd7a0cef2d8306d1d09 +oid sha256:d26aedd259a8a6b35eadcfff9de2d3eecc696164f2238500c3d74b7c8cebf535 size 2742657 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/compile_flags.json b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.done b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.hlo_module.pb b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3d6ef694608ef9e66aa33f476a2fe1b1a666273a --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a35631f789d0639ee704f5b00fbb1c39d2bd32c4ab5f5f596df76e21e56c27 +size 102398391 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.neff b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..60240658d973b1e6418699c3eff08aa5d5cf33fd --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33caeaadbc10c0e8acc791ab1ed93f764257d306e8dcae087a51ae90b0167e21 +size 4752384 diff --git a/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..5a96412e117fb9a415941de9ed37587dd0437727 --- /dev/null +++ b/neuronxcc-2.19.8089.0+8ab9f450/MODULE_fecd93fec248a64a0b00+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34ec63b3c6bcc2baba525bf2e36008c165a77b92ceddac688246667d1c5f5b1 +size 5069544