diff --git a/.gitattributes b/.gitattributes index c5faf2a401f1821e0612e27c2b74c82b61481e84..bb527f228fd12fdded44554dfe5c151ecc22f383 100644 --- a/.gitattributes +++ b/.gitattributes @@ -5466,3 +5466,22 @@ neuronxcc-2.21.18209.0+043b1bf7/MODULE_b3156313afcf6f9c1c2b+24129607/model.neff neuronxcc-2.21.18209.0+043b1bf7/MODULE_ea6d0b2d03e12e6e6709+24129607/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_f668e8059b4ad00c098b+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_f668e8059b4ad00c098b+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.neff filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-0.6B/11315149f2fec5f9b1e3.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-0.6B/11315149f2fec5f9b1e3.json new file mode 100644 index 0000000000000000000000000000000000000000..d4b983f1e437991d05a261ab0d5a5d6c38e9666d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-0.6B/11315149f2fec5f9b1e3.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-0.6B", + "checkpoint_revision": "c1899de289a04d12100db370d81485cdf75e47ca", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/040b1e23663eba2981b3.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/040b1e23663eba2981b3.json new file mode 100644 index 0000000000000000000000000000000000000000..c6b9445e7e04fce43b67255375101dda336bf9d7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/040b1e23663eba2981b3.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-Embedding-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 6, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-Embedding-0.6B", + "checkpoint_revision": "c54f2e6e80b2d7b7de06f51cec4959f6b3e03418", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 24, + "max_batch_size": 6, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 24 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151669 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/6f5f2cf26c21b525ca82.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/6f5f2cf26c21b525ca82.json new file mode 100644 index 0000000000000000000000000000000000000000..75b8ef70669d0bf8af668dd9dbc67da47647e4dc --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/6f5f2cf26c21b525ca82.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-Embedding-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-Embedding-0.6B", + "checkpoint_revision": "c54f2e6e80b2d7b7de06f51cec4959f6b3e03418", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 1, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 1 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151669 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/8f2f6fc022fb92a08835.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/8f2f6fc022fb92a08835.json new file mode 100644 index 0000000000000000000000000000000000000000..e20956915930705e090d84a283ad74cf2951b4c3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/8f2f6fc022fb92a08835.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-Embedding-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-Embedding-0.6B", + "checkpoint_revision": "c54f2e6e80b2d7b7de06f51cec4959f6b3e03418", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 24, + "max_batch_size": 4, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 24 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151669 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/922b8f110b9e3fdaa766.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/922b8f110b9e3fdaa766.json new file mode 100644 index 0000000000000000000000000000000000000000..a52aa077e4128f03e4957bec8ed436194e993498 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-0.6B/922b8f110b9e3fdaa766.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-Embedding-0.6B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 1024, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-Embedding-0.6B", + "checkpoint_revision": "c54f2e6e80b2d7b7de06f51cec4959f6b3e03418", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 24, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 24 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151669 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-8B/3c013915c647bb8e6712.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-8B/3c013915c647bb8e6712.json new file mode 100644 index 0000000000000000000000000000000000000000..fc9257bf47a2673fcfa1b8741d8a42eb0bb31ad0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-8B/3c013915c647bb8e6712.json @@ -0,0 +1,95 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-Embedding-8B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 12288, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 36, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-Embedding-8B", + "checkpoint_revision": "1d8ad4ca9b3dd8059ad90a75d4983776a23d44af", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 36, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151665 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-8B/b60a4e37d9a2dbabe961.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-8B/b60a4e37d9a2dbabe961.json new file mode 100644 index 0000000000000000000000000000000000000000..7b717ebe5f9bf604f9b98b02a7f8928d1c5e02d9 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.2.dev0/qwen3/Qwen/Qwen3-Embedding-8B/b60a4e37d9a2dbabe961.json @@ -0,0 +1,95 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-Embedding-8B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 12288, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 36, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 16, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-Embedding-8B", + "checkpoint_revision": "1d8ad4ca9b3dd8059ad90a75d4983776a23d44af", + "continuous_batching": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 16, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": false, + "optimum_neuron_version": "0.4.2.dev0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 36, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": false, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151665 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..b4384cef07218b1c31307e7b1f0d88e15f052dce --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7607df5f2c7c5132d87730619aa3366ddb2035e223a239aa5a14a1c9d7469d57 +size 848773 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..53ebea2910a249a3a5cc978a22d9b51771f9d7e8 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_06cc3d220bd81f31483c+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d799faaff5e25a7531d12f187cea88faf79b29e045c2b88d2c3ea0b8bd94cab +size 5786624 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.hlo_module.pb index 7c6b4dac34e345ad3a19aaf4aa5aa86472ebd841..b6d58bfddea9fff9d33e332a71aa7e3df064e510 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00ef644e5979852b4384b292b9654db3d05671a18e7c2997041f8228841c496b +oid sha256:ceb0a23b716925f843a16e15f9f0385f067950c8f9f55cd7b3db583ba03b1a7e size 84807 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.neff index 5fd5aff27192a38627879cc594591326dce07c8d..65c3e0dc513174a5405638385f4e4fd1b6fb4ca4 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_0e5b82b136a38372d842+6e4949b4/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d8c78397b4802378ef5aed6265b491f7d9f2c88d33d42c672b8394aa40fbad78 +oid sha256:0f26bc2e40e6e21bffa40348dd28785a0c5ba6ae26126553c85435559849af5d size 646144 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff index 40cfc065101a6b409f4e796118fb9f9feaa93345..6ff7e2c0315aeb33b1e8ee2fe5b817ff3f76d8a4 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:be0a2ca1ec6303e7c7f1f96a0c58635b22fcc2c5566988781cf2876a2f11f9d6 +oid sha256:690971e38e78e6e8e2e0b2249904244dbe845f18a1d36cb2b763deac5fe550f3 size 277504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo index 5e12641446323d9aff26b02389b7d96199c78db6..0605fedfaecfe63a3d5054643fbef3013bda8c52 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_306829ff9e3811933fe7+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1941f77c35018b572d2296e153bda0c1a82b578f3486e690f2e095e5936a2009 +oid sha256:937aba417c7465954a0bf71e8d536e6ce2db41d44b477deb724f8f6154f76e19 size 285854 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d2c16ff4a7ab3bdb7b6f0d5f1c453b7e5df4a200 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949343b64aaeb75ac893058b4181a58759ab30c14ab879041244bb9af4356695 +size 850786 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/model.log b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/model.log new file mode 100644 index 0000000000000000000000000000000000000000..fc2f64a853b59fb1145e8759972e18fe8b3014d3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_315d9491c827c077575a+fb4cc044/model.log @@ -0,0 +1,3 @@ +Failed compilation with ['neuronx-cc', 'compile', '--framework=XLA', '/tmp/nxd_model/encoding/_tp0_bk0/model.MODULE_315d9491c827c077575a+fb4cc044.hlo_module.pb', '--output', '/tmp/nxd_model/encoding/_tp0_bk0/model.MODULE_315d9491c827c077575a+fb4cc044.neff', '--target=trn1', '--auto-cast=none', '--model-type=transformer', '--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ', '-O2', '--lnc=1', '--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt', '--verbose=35']: [XCG815] Estimated peak HBM usage (19.257GB) exceeds 16GB. Neff might be unable to load on chip. If you believe this estimation to be inaccurate, you can disable the check using: `--internal-backend-options=' --disable-hbm-usage-check '` - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. +2025-11-07T14:10:10Z Non-signal exit. Backend exited with code 1 and stderr: [XCG815] Estimated peak HBM usage (19.257GB) exceeds 16GB. Neff might be unable to load on chip. If you believe this estimation to be inaccurate, you can disable the check using: `--internal-backend-options=' --disable-hbm-usage-check '` - Please open a support ticket at https://github.com/aws-neuron/aws-neuron-sdk/issues/new. You may also be able to obtain more information using the 'XLA_IR_DEBUG' and 'XLA_HLO_DEBUG' environment variables. + diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..fed7f25cf4b93c6a441366dc54cf68d43881264e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e6c39ae5aaa2365e0018b111269da40c42b131faed18711a8810bedd68a436 +size 429397 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c6eab1f1de4334b96862689fb30572e9dee901dd --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3321b4e97123c041192d+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0135e8fa145738be49848914c2dbb2c52c3854a2403644f1842244e432ed0fe +size 1352704 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/model.neff index b9cedba1fcfe7f44361be7e06d8c6f20ee9f17eb..394c147992a80dc61c65cfb271c654d1852c968c 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d03c6300c55f1b499d9c5d804143ff8484a494001339977d2f2296b1ce816fce +oid sha256:adc574992e72adfe26c916de4e344ec745c5f0367620c1183437c3127f9fef15 size 246784 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/wrapped_neff.hlo index f14318dc32b3d83e087710ff2dce7b7b0ce7a26e..c81f0318b71b9bbc335a042b83a9e87ff72482ad 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_34362baee2ad4784108e+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2bdbe143e93e40a8157c3303918d7b4ab8d3c4603949e1cf14e9bcf86f43e8aa +oid sha256:6e3995a13290761f8f6f89854871f6a5da48002e637efad7b67cec72e826cc1e size 255104 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3279f1a5cdfeb71eca5b03cfcca5ced0696022eb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a36ee034700342382b6da2932f74a5d63b34f8b66d47da8dcd5b0cf42842dd7 +size 428915 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..af5eda3c5dc6d1cd509028962965b8a8a8c6e383 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_394461f5b793e1c6ddbd+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2978f644a5df5278f76096838837e039d1d5a3dc2cf4e9c2a6cae1784f9bec0 +size 4199424 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/model.neff index 6d2973d0b215591901792c6ee1343b83508c6640..71a3bdfe44c2c40ddc76a23f4e943654c9c4ca28 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3d4458ffd347738badcf0b23d0d413a4d36cf853e122a45c2206886aebff211 +oid sha256:40684a5208697e733fd92b531e426c9a49e2e2f3dce8fdc81afe434818f265f2 size 216064 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/wrapped_neff.hlo index 41c2ec13331cf4f2100ab30005776e38d9311a86..e878da9fb5ba13604b80452f8837abbf73e8bde8 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3e3c9e9db5ebafa6c488+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0fe259afa434f354cd2ea4cbfa55677adfcd4de255474e7d13f3ee086220a609 +oid sha256:e490cb2df34ae3582e58811ed1a9ea678ca780e9525b51113490839860539904 size 224412 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..04c1b8097ceff1583e5730189770e7b7e79e8aab --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f01851ab7ef0b0809a16c7e907029400056497364b603f59ab2c9f38e6cfc9d +size 427538 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0a28a6108e524e6aa8bcb7501179110d0b35f10e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_45c1a0c25eab451751df+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d530cd99cdeac86375ed3d4ee421b5db73c2cc8ec537732e3f811d227f4c1e +size 4158464 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.hlo_module.pb index b947beb7eb660412168aeb31c31cd8358fc861ec..062611a49b7db4bec1f9381c667ddac63fccac4c 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b830e756a066effbee9464b2f0ee872654f088ddd85afe47df42d75321a6961b +oid sha256:87c27fc5e9a14dd0d728587d4b5e633e65e6902974129e23c485ea65109a7a63 size 1061093 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.neff index 03bd51b926c290f114b9d54e4d4fed7516f2cb69..d7aa08d1d2553d9e1872ec1ccfa5f68b218d7d00 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_574e9a764503b48fbba9+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f3d938502148f35e5dcbd5ffabf9a05f9faf681ad9f9e99b65cf52a927b8cce +oid sha256:13ca12a9af7e210d81d5d48764b74bea3ad2c8dee1d5f6ec04b511070e5aa4ca size 9473024 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ebb9e007a6c5445dfbde4f94a2ec1f094ad203e3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6b6bf0feffa5e590b798a1c60710db88bec1cb49364a0829ce08a05370a91d +size 435194 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c6718c327efefad931a41f4e9c641a143705f64f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5988b4b9e2fe27c7105c+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f32b334d4b29c0442354fbb4970d0103862810dbab9dd6e1d90f2943d2fad5 +size 4731904 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/model.neff index 8e151344555bffd003e00f0b6af11b6d925c28d0..2916b3c791c6e86e6519d9605dcbc80ec5f2f009 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4108281a03ea281002e10678a110e666893df5d987032383a0e7ad4e096dbeaa +oid sha256:c0d1a66ec4620a7bbd95ddcd3f0b8563e7b9fd48c9167bbb83e09de5ea8f2045 size 369664 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/wrapped_neff.hlo index 4a73c40c358ca15ba83bf5fd924fe2d95cb6f676..00f1bf5626daa38aadee5cdaaeaf15232e382a9c 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5b1c456704a89716d745+2dde74c7/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90c34fd1fb81a015236d8dc844fa950ab15b39579c066d78a8bec47f68c41d2c +oid sha256:6d780e7908fb2043598326a014149c1adc7cf79ede14eaac7e57a0efd5aaaf1f size 379362 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.hlo_module.pb index f37c00bc38fad42678ca91a321988bcaf8fb6643..82b6d63ef07e8b99f982e5b2a216f4fb928ab10b 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f1fe38c017b84f73b7d3ea59c6211db2ed9d5c219e724f7fa46268df0122085b +oid sha256:4b57a81178b87e2fa8d72c53f158790060e6f323a7ea625353c0c2ecec75b33d size 694128 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.neff index 10ddbcec63fac37567195ea00183f89939688213..076477cfd754342b7fb936e67752c55b6434393d 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5f6f4f62aba29e11d946+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1e4c997fc85f924fab368f5e7c1be4735d973e2370b8619493ad63aa1e5acbf +oid sha256:b94b84c6a5ac7142334a119a16754827bff07c49ce7dd2d1b9f71d6c2d29a755 size 625664 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f1105808fa0097ad3d66f3f2bccc9b12bc39f10e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec5e1a252b77227b0d8bf55d0ad8984aaaf05d34c12fbff567fc48bf7f1f98e +size 431779 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..54d7db4509903e9a8b66923e70feb5174a92a3e1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_616029436a1201c3f014+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15884b84559dd7029720a5a83714e250e569eee383b805015a1b0a990e58ebc +size 4158464 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..dfff463578c0ede0890c1f13293129fdc22290ed --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af2b03849ed64587b463db5b9e3970e996aacffcf09d636fc06eda4d05a031f +size 428976 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1526b27eea5d148e8095b871f1c65d09d5f4e604 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6b37881de0fe95bd8128+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820f5db477d8e1b241e0e47bc41dd45acdd9b86fe4fe58e6391e6f3879f8370e +size 4199424 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0bc18f8dc18a593e9507320160b098df0f2d7d3c --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9abda4bd7989f2749cf9583868302f42ca315a2e3de1183197eb1aa8d33ac28b +size 428915 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9cabce9bd8aa6b1f4485daa16c8cfdd49b05b198 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_823cb759235f53a8fe88+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ccdd6902a5acc60bbf9dea8744c143fbcef71b442b84b18a2ce2d7acd752b5 +size 6237184 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.hlo_module.pb index 1631f2c09a8ae63fbac2ac1fb9fd3915b7804545..acf3f511b6ffaff7078cc0c892c0083f21e7e91b 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:94f9be6da7e1e991f75a43c98ec4a38bf5f21367b15621e701b9e470690ece07 +oid sha256:8a22b54d714b2e6fd73a96a878615820fd25ebb97a5970c04db7084ddf50b4b0 size 83504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.neff index 5a0e4733cd293a9678ae673618618fcfa1438746..b1e1ed26daed4964edcf7abbaceb23ed14c61d94 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9e174a0ad6384712cfa5+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c0957164ef9c782ed0ea789e4c015073913b3083d31b50835c5548b4563f76f +oid sha256:a60ade2cbe5d1ecb7cf752a53cdb2fb8394d10759cceaba09809d3851485a793 size 328704 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2bdf94343deafea1a7dffee349a18f1ea4860829 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11caf63cab9ec2a78c7116e6e762873e1e1f1b3a6a165b692abb1923676d1796 +size 587842 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ece78e2ff471d162cab2be1e33eee356b6e7c336 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9400060f63d2a3dd20719706b468bb1b0dfc0f605a96b1dcaa82143d7470b1ff +size 809984 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..4c2121746f92b747a527e0710c50fef3fcba5e8b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a0387fe4d05bf37e345a+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b23f902646a683f981d4529dc0f2c868f485a7730be1c7b355a33c07c6579df +size 944468 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff index f95a257630a3f17d1e22fd46921eaf4253c92efb..9eaf5a55d4cdad22266bbe4e70ab16ea0e142332 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0ae1ee399d4f73930898b73b379c0c264aebc9b2135e44514f9fbe3b18ba3e69 +oid sha256:5063b2ccd377fc1a01a8d3214378204d42f443cf95ded9b30e6dcf73c5ab1de4 size 6769664 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo index 0f01d856c945be32449c32deb0bf569f9336ca68..ebf3458a52a22aee4d1881f990d2f936fcddf47b 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_a38bf2241a80d200aa33+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:be11b98fc9a04aa64c3b8b26a87bde95f41a1a4e161a4233b3d1f59e81358438 +oid sha256:3d7c13e30d0f05134864003d0128a911eb9ff555ba8e13054cd0fe96717f77b2 size 6936331 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a702af93114f0c784c5a74feba6807609697b4e8 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79593901669a6a26dd4d0391b98b300b7064110aa994f0e322515227f8c944b +size 433643 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f09f342baa1fce2c605e4d3534661baba1de0748 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_af5ca2287a6b0d70aac7+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21a6684c188efe851de16007f05def2751732fd9943f28c1aa2075b28e9cfb8 +size 4015104 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/model.neff index b2b61999fa1306b4dcfa5dab93fe7dc7bb61502f..b0102cdf1927883fe3234477be913799074c3dbb 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77c268abe58721fde4656e58cf77358f5a3db717006feb4749e43756ce82a864 +oid sha256:76eeed1f996721edd4d90e040c8ba23e123b944dd2e18633add5e9705083e6d5 size 277504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/wrapped_neff.hlo index de092099b4840cac445b798b5eac30e485b46812..4b52f9010eea2d4081ad81c5c71223fb8c786cb2 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_b559f9b8396895d936b0+80d05c3f/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b65b7f2f986cb16230bbdeae1b0d7caad7b95a4c5fa160573f243790963ac8f +oid sha256:05b92ec0c7f07df4aa9454f74cd4630602acfef75330bdfb6ed20fc99fcc27b9 size 289571 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8938038613a8390b96437286c40a69070b6bee4e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8400d9b46cf0f503ba7e4251ae60b1ff81a266ae21d0e312c5cfde66828bfcb9 +size 617833 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8dbbb1ec68cf06f7a2cee8a4d1e509826551af5e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd3408e2c963ac7da056+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6673718aa1e2786568db5d56ee245a5bcc6892a1c108054aa1f69c5c75c9005 +size 69643264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..0bc18f8dc18a593e9507320160b098df0f2d7d3c --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9abda4bd7989f2749cf9583868302f42ca315a2e3de1183197eb1aa8d33ac28b +size 428915 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d43d65df74c2c0ca3a1bd54df6a1c73805903960 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c345ba838e8c529a43e2+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e60ed421b4699c3e623f16a134714d00334237d986474b9171632864df0258 +size 6237184 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.hlo_module.pb index e8c3a9d908b5faa927d3a719c98f3a8a5380e67c..736f69c82c1268401ffca3bfbad76251974b5f45 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:921efe2b7b69521922a222c2b7a01152b9a2e4a17adad6f6bd6fe5745feca043 +oid sha256:f167244b4e5955198c7c0ca61b3c87ab0806098bb2885eefc0395531c74cbda7 size 97794 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.neff index 8bc141bf3c5550b0bd29abe6c99f42f268a97b3b..b6a59d8f8fb67662b40b9c852e67e53a30c1c67c 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_c58e0a47eb485c62b0cd+283df001/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90286015630bce0b6036ab12023599c20307aab9c5011c73ecd45c36ff82437a +oid sha256:902855d7c01e956cebd4ee97d606374819e3d1772628fc92189bd7a1e9c61f78 size 410624 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cc2cc54570148e0c14230ecbd8c75282712e85a5 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493e092fd95afacc57041181604c2e81b2ad3acb7e044553bb6499c1c7074a46 +size 429684 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..d5ef03cc7302d0c426b071ddea750452fd8b8438 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cb4d848c61c58d4a5351+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e99d916b563747619fe45f56dfcdb74d5c21b1820ca5e4cc419ac08abb0c7838 +size 4158464 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..7469a9bb5988ead48edbd119f934486cd88d4f06 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a46b94530dd2e9f257ee044a402b122ad73ae7c96bcd4ef5ecdf7e100e2b55 +size 850786 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e06de99205f7d2375c50fa2896910e87418f9fe6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_ce7eb4c5ef357b61cc09+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3389b5091ce04a415c4b6677ba5a31c43d8b7aa1e44672df129e2ae134af123c +size 82637824 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/model.neff index b31c7b907c0ef71237574acd20bc929fb440f380..be005290c62f5dd8c3ac7cd53a782b00f0987b59 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e712ba52a94ca2b5cc3225662cd66ca081c6ac9980ee4eb31bd2529e327d7144 +oid sha256:bec5dfc6b85bd28401f2ae9ab0c8ec90e2a88bd02dd3c576d6deba9f2537c5f5 size 543744 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/wrapped_neff.hlo index 91ceffe8c6b0f82d68fc2d4a7211550b8d1e56a1..85d9b04936b7744ae5cc0ccb97e8b0596cd86f91 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_cedace9d3d693aab8d35+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b9e56298ad4c45efcef81b609665300a7e0204a23c75e5e1a7f949c82bbf0d75 +oid sha256:c61a3b4c4dba6212222c9cad3593be877e5466393fd035ad5f8cf131926c2c57 size 563380 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.hlo_module.pb index 588a268d1e30b6bac8f2dcd7c5f829ec0638baf6..a87347e585e555545a4c675cb4ee611f7a685b0b 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6690d38e167b9190706bcf1c2af5e45fb65b4a170e48fb7be054fb0036fbff87 +oid sha256:07d09f90f30891e710663ebed6df45c1a6f95b261a9e7bc53dd0bf8fb37cab9d size 82772 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.neff index d54dd498e1c8a1db01828bbeeb398e2548794794..3d30f59e0104a26d36d46bb78be39af3726702a7 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_d8cfc8fee2dcbc7833f8+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3a6f133cca407bb037f07ec040d523f1cf7ba622a30eb5c42f37b94656a2c766 +oid sha256:04f04de137a9197b2e345c6e043d111f01bf2b2d5a54fe7ecdcce559bed09d1a size 267264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3279f1a5cdfeb71eca5b03cfcca5ced0696022eb --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a36ee034700342382b6da2932f74a5d63b34f8b66d47da8dcd5b0cf42842dd7 +size 428915 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1891ba4405f29ba86f01091c8bd6fc9e2af7b929 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_da126386d4d4d4a5bf4f+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc597f6cd2a406443f6c3521267e9b1a415ffc3ef09be331d9970f369bf82986 +size 4199424 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c6c36bcec75732900885291c9c29ad9273d911c0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd02cc415a9ec23bae8b8c33f608759c1acdb1c1b1d00c2395f02013619bdb55 +size 558318 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..dde1c5632fa6ca476710981cc6d7f967e247f748 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_dd4aa1e96fd3b31b162d+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb726625781c2508bd21976895f5dbf613a064b512daaf299d84ac18963e1c1 +size 4588544 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..07bdc1045dd850da0b9d66d697f3755e9be37aca --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..6aea211899f1e1bf517714fe32ae73054c23fc0a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2a9d81b45439b73d61796a2819b130dfe5588da28743c6dab28e51b8d6b7b92 +size 445260 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..048cd243ce0a708aa8d6dea85e098883f86b94b5 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_de1482f217f05f48d1dd+fb4cc044/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f02ae0cc9a2c14db262999a7fb54bd7a3345350b4866654843e6a5e17b2c5197 +size 4127744 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.hlo_module.pb index 470d8aab33acebb7218508a382560c16f29728e7..bf00ca0b127128e16e4289e4fb5c4a4b3d0feca3 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a71bf93ec8cbabd656baa51969aa29f648cf5493adae23aac0aeb883f112107b +oid sha256:c9cb3b1a05b77d5bb908b7d9a5344001bec8bc04360d230f2d8ba908ed19896a size 81516 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.neff index a7510e862e61b4359655beefb03ce74dd2e47e25..36e2fd2e7228867478301e210ccc4b5d287fbfe7 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_e12a32198da9ddff7d98+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0716a4b4317f1746db567f030fc286fc5b2cf6c6cc59c670f4511a598be2c79e +oid sha256:e3ca4a3cc0e9dc7be863a8fd62530378476d4a3010fd01500b88bcf19c02ed78 size 267264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/model.neff index cca408b8cf52aac171449c82b3dadc3a9309c1f7..e85f5bf4d6c2fab180a804e703433d283dbe9551 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12927161e0de57acf95f140ba37a30a13cb088c211ec00646e21b545a67947ab +oid sha256:4c9a7d9b1ec1b1e241247ec4c7d5a966b709fd0cf6a419d7ac3c6501561efee4 size 277504 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/wrapped_neff.hlo index 0ae860dbcec4d20eba240e608673b4b21d7408a0..aed0aebfd9079d2a7921fbb1ee00ac31cd9f7d1f 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_eaa781288c2e1d7ed527+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7aaeb376a31ae1cf03ae550fa5a4669642f672e9440238963edad1a5af7e193 +oid sha256:9e1b44dc49d450390d788fee69a2e3b4b61b3e79956d4efe89ed6fef696940bb size 289031 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..83719a3bcb5b94c8f07cc9b7416b52508aab2a87 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b537aa9235ac17ac4afc50f42657b98f27013072bb50aab578243173ac38203 +size 482166 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ccb4390e799039b0be36424d668044de8c5878fa --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_f4bed0e6c1426c4b9bc7+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b9ce48f4cb562ec2c3dc68c3a904aad2dbb1c0703ebbadd6eeb6d0f5c771fc +size 4199424 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.hlo_module.pb index 7d89ddc8cc0511a553734b846edb6c8743662b33..0a534b6f9b9b13756a0c296de4f4491ce2cb4115 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6db3cfd3e359c57972d807aee60d37c9d97b89aac1b65d0fad01abfa10eff659 +oid sha256:84cc69f930e3e2d6aac7b2581033933d9d5372ffc238b94f014e0901070af434 size 90382 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.neff index 4ed572e254cf13a7acf43855fe69b5811e49f3f8..34ac8d11ea71b6492fb8ddca287dd614b02b1f88 100644 --- a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.neff +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_fd32caf35dc9cdf42fac+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:736e0da356f57525c1947cbb05343f851427d302728ba47ca80b9a1c8b91820d +oid sha256:8e96e22e545fc320f415061f613201ac019eb714022311d84a90adab4f261c1e size 359424