diff --git a/.gitattributes b/.gitattributes index f3df26b1b72ca61017ae4adf580d4b759e21b4e1..f2f196c5499b2f3f05ed0e1cf55c1eb7c9fefb7a 100644 --- a/.gitattributes +++ b/.gitattributes @@ -7180,3 +7180,8 @@ neuronxcc-2.21.33363.0+82129205/MODULE_17bab0cf99484f23e361+b02446f6/model.neff neuronxcc-2.21.33363.0+82129205/MODULE_17bab0cf99484f23e361+b02446f6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.33363.0+82129205/MODULE_04c64527506049d877d9+b02446f6/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.33363.0+82129205/MODULE_04c64527506049d877d9+b02446f6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.neff filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/0a461d42d71b4005fa9e.json b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/0a461d42d71b4005fa9e.json new file mode 100644 index 0000000000000000000000000000000000000000..6607fdc8329ac33a3d4606cd0f7c3efebf0d8910 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/0_REGISTRY/0.4.6.dev3/cf6b9a360dcf294104671106bae2adbd9fd291823bb60a351883163684073231/0a461d42d71b4005fa9e.json @@ -0,0 +1,64 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "unsloth/Llama-3.2-1B-Instruct", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 4, + "capacity_factor": null, + "checkpoint_id": "unsloth/Llama-3.2-1B-Instruct", + "checkpoint_revision": "5a8abab4a5d6f164389b1079fb721cfab8d7126c", + "continuous_batching": true, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 4, + "max_context_length": 4096, + "max_topk": 256, + "n_active_tokens": 4096, + "neuronxcc_version": "2.21.33363.0+82129205", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.6.dev3", + "output_logits": false, + "pp_degree": 1, + "prefill_chunk_size": 1024, + "sequence_length": 4096, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn1", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "unsloth_fixed": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..836724f44545ce0dedda1521fd4c623a6ea8ec72 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..3fde4b8afd225f8f29e912dbb88051c0c8b08a89 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a4fed93c6cd483257d5a1298d72791181c38dd8ce7f0ab1f36bebbd1a4cc93 +size 64986 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..fffab253e823de199677276053fd5725ae00633c --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_0acfe8e118f5645dfe28+24129607/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9727bacce9dd2dc9c9936e8edc953101889431256f23ef17f4ae326b84f257f9 +size 226304 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.hlo_module.pb index 7e17bd0deef25864ee8c64da9e5f7cf173b76f3e..a203527e641f9a3ff46b69eedb1f181abedfd41c 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5405ee9c8f41348d0bd893b5e48ec19122bb8043738550e95ffb2f5449876a4d +oid sha256:8a13429dac9136350dbd707ba487f7744ba8b55d66f6bf4c949684d1a51bfd91 size 866871 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.neff index 6935257eceeb0b33304b254bdf5ea279fddcd8df..c544d67df48d0b51b7067df75ad77e8bde884515 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_137d2b1e9d185656d517+6170d8e1/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e8bae57e4f136528379d6d32bc9abb7a9db46a13c031d168a46da79d7fc674e +oid sha256:22e26720e026c218975f34e9519d975734c61ab531f4258ffbe8eb09cdb821a5 size 29758464 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..3766f4b13e3c48c89718978c6d8a6066c2c96536 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/chunked_encoding/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e1a089ed5d71da740a66db88c13a7cf608ab7170 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc06654f0d8c129836e4af09e2cf287e7ee40b8d3ea206bcaa236cbb85cf092 +size 918002 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ffb67bea6a129b89af4a544328626854b4e20cf9 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_14f2cb90587f7f6f0f5a+6c043b9a/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a22f1bca8e55d93344621b11327191cfcd203e8cf2180fcffabb3f86d493884 +size 40172544 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.hlo_module.pb index 33a2342c9d24f4e4f30ebf8e15aed8e686e0c90a..f4e7c70d0dd1eafa5cbf8beeb663c219dc7562a0 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10aec6163a2220dc0eaf386dbf1178e07df1a712fd50b018fe14148cd7e532bc +oid sha256:87ce4944faa2f3d7fa0bfbf935506670db5c41d6a0c08af5194b6449f4388987 size 593552 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.neff index 2a6cee160931a299bf997dbf6e0c99262152da0b..ce556079033f66c2dcff0e33525409c420afa561 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_18044ed346a94d78250a+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7812a21744e91c1f6fb470437568f2cdaf1dce297e0bd82152e22bc757b1c52c +oid sha256:96aa276b19e37c3ae902d12d5da78e1052a74baef69baa558f27155a0faafe1c size 3769344 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/model.neff index 355fef2efc72c35c30cd1acdcc924bc40e19d95d..1bf53ee8ba4438a914c8260b4527ccebd46666d1 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cd628eec1476064a8204ca007ff40fbed4cc23f378e02ecfc6227569a072e88c +oid sha256:3088284cdea76febed35d14d9ed0ee138b44830bfce57a5749bb49afab1bfa01 size 1240064 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/wrapped_neff.hlo index 55cd842377b6008459dbd38c4e97ea2705d18893..b46f1cce72da4a818628abec09b47e86a6907d2d 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_47bbfc2252c9a9fd3c68+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ec7eb8e831982ef037ec0b1ac31e6a7ebad00c4984d69d380c768ba8c01a0075 +oid sha256:6cd8604614fd4d76064135fdb546788ab0de0e460ed5b46c253d38bdcd569e93 size 1362453 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.hlo_module.pb index 0013bd4ca7ed4936088fc1057d8a721660f39e04..f73614f39c62bb2c2bf0e535a64a63b6afadb47b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77aa6e56466f63a602dedff46d9989619913f612654147b3c637f7d3de61f7bb +oid sha256:ba0dce0602506ec104796b8fd8725dee074d29c0e88ce5ce7f4b4f681250622b size 1050679 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.neff index 72698f757401d8f6d57f26f552be3771235f57df..6a008b6dd31950ff9dad95d9dd00be5d15d85038 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_4ff804c2533da46e613e+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e50869a02ea30d26e9508066369d2c0e30c2ea31d9a4a49d44bb0826fda5bdd0 +oid sha256:fb95dbd8cc3cab5b05fe9e7717acda2130bde6a0d8ac99b0a2fca725115f9ddf size 14050304 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5620f0d58954f88c2890+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5620f0d58954f88c2890+24129607/model.neff index b4d020eb6da2d99c5496d5219b07d43fed5de8ec..572a12cafe2fa69f35af8f9b788c6a66ab36bb99 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5620f0d58954f88c2890+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5620f0d58954f88c2890+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1cac46ef4ae79281922f276f2620982a3742e6e3c1b7872ddcd81422d481a155 +oid sha256:19221977512f263ecb24051e3ac3b2c979ca21ea4524c714789563faa271365f size 1905664 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.hlo_module.pb index 505eb26862644a3def09c975941c55e279a2498c..596f3b9ef84bd67849bbf56ed685f3ee3e28f28b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7c2a0e27aea45eec39afceeccd973f758e74d7f2b39164586a4bd50817a82017 +oid sha256:b5e7fcdf9f65af1b99f353b41bfb54288571325ca47b98d54e3e989a576ff880 size 1117688 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.neff index 041e50d455cf3fa5b377c19671e17953683557bc..a3bc8482bae577394976655312d36b718586b5f5 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c86d6438f711a1112f00061385844a65b878de8c4ec8f31a56f86600544b2cc5 +oid sha256:12483685f9f33f8d93d63a0fd97933ff8dd168697144d649461cd3b5aca95c98 size 5387264 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/wrapped_neff.hlo index 22b4e265b9d03957d9dabb33eac7bbe65474846c..8d4ebeb0b6ca6f484fcd24a80c3a04a3fc0bbee9 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_5742ef8f5910f4e17377+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ccaae03e61bacf189b7472ce831c13c89fd2850d9775d076386bc4d3e1c65e86 +oid sha256:bd7c6b14f10695fed21a2043ca93c89feabc56c16c28f11ec89dc8b0c95cd73e size 5571457 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.hlo_module.pb index 86a02e8a6b52d65d970eeaf3e0e50da02304de6a..47bcf7648165a9c5f3757d10a0e7e963e4d9967f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e51fdfdae7127466be2ec79701008b720297fad35905d1ca7fe02a528931a44f +oid sha256:0eb3378b5d8896763319549ed5b812719fb401cdbc17e7f8ea868f219300074a size 412170 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.neff index 05f31aacc47cf367c46349facb8dd75c9c9ec41f..213e01c034d8fb998d4511d8442df8255375366f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_691f0ef9fca273527dbe+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:264d323f483f1b288c66424b9648e9fd7f37c4ff2febad67ae2d0ccfa4526ed7 +oid sha256:6878879817939ab8dc763af00c5a43aa20016ef65d44b5d6d006e30c2749be81 size 5868544 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.hlo_module.pb index eaed824e127a6bef5f2308aef3e2ff73696166e9..0ae982c19e2000faa356dd8444ea3750cfd7a3d2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:631e2888f6ee71acf1c9eb784246d591937aa8de79993a6850177196c2bc8fa2 +oid sha256:37173b87f2098da51055199893cf6d6b5bc3702f5fca629ddb79f66ed168542f size 1207180 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.neff index a31627a5135a6b8129ed724fb378b163a8494383..5ec0808a3b977d7dbb13ed1315036168f0237706 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_71833bfb10ff3967bd3d+6170d8e1/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ec3da1c0626101d789222ba962ee1f2b30e606a10b59ead008350d5bc0a19e62 +oid sha256:fc29783475d7b499deb17d2c9a2d968020b799a38164f302e863a2871045e619 size 58307584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.hlo_module.pb index af1a1f48a5ef3f69669a415d275780e8bae3db4f..7abae44a2482157ce3494c29fd25be0092c7b214 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12bcc80b2ad2cb1e12abbca61cd3f324f6f4f564cf78d121d0f5fcd01305c683 +oid sha256:b364b15f88cdba27d3ac4973f7dcfb2cbc49da9abd971bc1f0c52315364d55dc size 451319 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.neff index a2fab63b246f77f2b81d64bd3aee76b01e3c995e..4690636950b1615801ceb4cf45015cb94597fff5 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bdf04a70eb8bda2f7f4e49bedb2c346136c7e9b0dec32fa7421ea72474563fbe +oid sha256:f173e6c1f419b379767e720c82df3bec9c7942c49ca6ce29905fdea0ee240610 size 2509824 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/wrapped_neff.hlo index 23e1a4ca305899ccce17e373419202f11f100017..136aff59a149d5d7b88632d5f20bf7c40f54fb61 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_95b9072f246645f24461+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c84f3a91584fb71a18f3ba16dd9c1cde9917ff28ab72e432ab03a61ad722f8dc +oid sha256:5cde9a5e1a781062038054f87a06889f4898ef6a5b5a50ae52638bd62e04342a size 2583911 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.hlo_module.pb index 4f3dd325b4bf515de91ad979b06f56f9afd8afd5..0be6f402b1091a5ac2106aaac1e5abd993d5ae84 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:36ddabd0c90ed641a0ad314822231050850400aa553214d5529473bf4ff0a305 +oid sha256:4fc327b5aedfef4f958b55f2111e6023173d2189cdea1916de9b55b87b7ae397 size 437679 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.neff index 89c229b1b1058bdcb2a2fb270c20a65af1ccb51d..222c96907724b66ca3aa7b82801a951d3eec261f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c11b69acff75055f0546f43508dcdbd542ee3eaff6195b6c57a3af7edf77dc6f +oid sha256:35c4d9af9f5e635518ad5a32a994a12900817c494228366cb017a5921a8a0289 size 2438144 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/wrapped_neff.hlo index cfc412486de729dfb647d90574d4f6ddc623fc33..dcb4711dd3a45b73ba8720449b8168b06bbc7d9b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_a3c6a617f4311e09ad49+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b57cd0d9c32e1bb6bce78c9222799e7c01e0b73129fbb8e01387a02910df1030 +oid sha256:b9d9efa9457d5d2d58b8295197380c09b00f5279aa45c44a964a0c4d4a9ffdea size 2512245 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.hlo_module.pb index 6aca56152be2b63949b8e7e51c4ab3fd05b96a6e..9c8775f9060b3eb3e4aa65d18783777944cf6e99 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:679ce8c5ef949ac06470210b35e4adee33fe05ef0fa91cce2bd5b47cfb6388c9 +oid sha256:47b99d5d3bb1aee834dab4fc1af971d3939c94fc2e1f9e3de69e78097abd2256 size 559974 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.neff index 51d39e33165e3898a8841721f54d4c0990b1e4fe..22716f3a7e965e6464667ecb5b7738d4923d8f67 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ab293424ba3cf7b684c0+6170d8e1/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6cd865120e98300df7ed41b6a6657309ee50589d33e8f1aaeb76adb5aad9fac5 +oid sha256:143ccfdb271dbeb652a8aa54d1263612081ab93cf1848c435fddc6a03f301791 size 44893184 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.hlo_module.pb index ac3e6b48e8dba764cc288ca883c0f597c620535d..8d39a4a411336ed5e6df11f942b7f1805702d756 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:503f2ba00e01ec69dbbab68e814ed2bb73f646b48b6892b515292a585e9dfe2d +oid sha256:990cedcdabb6c3f81555756a62bf720aa67bcf902b798c5bc0ecb2cb1ec99630 size 839610 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.neff index a8bb898d682d24a5f13acdcec6e2c7ea242e613d..496dfdc14fd7152229853623f01252dc9f6f208e 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c68ed9d0d3211fb37165+24129607/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ac9d8573bdda4cd25a8b90976246d32cdd841ea5e0890eb3aa6f7ee6a972eb94 +oid sha256:b1fde40d64ad7a1680d0f7140de088850a187367b1d9d807c4a6cce6049608d9 size 12626944 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.hlo_module.pb index 59a076083253d9de16cfd51e1ee597ae9e8d3b14..8cd95de5df78c2d142b4d504f28394664266cb01 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:726697ae6d69106a35fc6caab871c35bccbf129873b887f75986cfbdd687e625 +oid sha256:19abd02589b7e770cc7d22a41832a1d7c1b18e5db1cdbd0f57e95939951b2311 size 588724 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.neff index 0c16d5ebde5b7936f39a7e05d141a8d45373657b..8a86e392782a0e17219dcf0fd792c3f56b0c1ad5 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7c258ba5a15e6c435b0719ac65ac7aed62119f5d3d3dc497bc8557452b5afc7 +oid sha256:9e9a16db24435f3344d68819315ac43e7ec035fdf41c68ba517491e1cc7db394 size 1659904 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/wrapped_neff.hlo index fe11e2ff3fdd06413ccf6d281331049dc701a936..2ae85b1e76a78757ae849161d937252b26a08f00 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_c69743a3b026cb8c0f9e+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fd30f302fc03f3e2cbf90294931da3ae0f5faa5a5f0cf021340988ef20175088 +oid sha256:ee0ea35ca5a7f2dda442d215bb13c572d23bc55b448a956b0f57522e111c3d11 size 1782293 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.hlo_module.pb index 35918cf272a3b2b57c280dfab5292a07cb621c1b..59c047a60c10e69df9ea3f3efb2336de7700c1df 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:78e69b77e5c34297018c01769fa5cb3dc76d5a1edeadcfa530419c770b4bc0bd +oid sha256:e883165574aed0354166f6d95aca4f607724646d2e006e98dba0278cf6ccbda4 size 616389 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.neff index e09ba1e54270ae1f5121b2488e3be9a946af0519..7a8c90718d9e9bb8621bcfa8346b7f0bd6a2466f 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:440dff8141899e1feee0b232802eb84646ca15db0fdfedf5c6ac261952a33027 +oid sha256:e7d565671b559335ebd689af245b937c3963e13d9c03e7386b1cdc468337e980 size 1793024 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/wrapped_neff.hlo index d377cdf6bfb78ce7e5db0cebe2747f25dcfc4bd0..0ba5d4a935b68b6eeea6f42cd47c73bec8df569b 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_cafe5e1cc124bf1d35e0+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7e7c6096a78d91c83b5aa8a9e9a48f876e3782f8b163f6a69ea89dde69e9e22 +oid sha256:1e0ded5f6ec49b752d33c658d09c59eb423a5d28f1aeedd89b066fe5bbcae935 size 1949215 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.hlo_module.pb index c0b701e4164fd2a5e57ab18c5b330e8849286a18..2be42d01f8c9635ae40dda54c81d1492e95953fc 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df3122b05453bf9f572786aa49b7e5df0168024a8f52330ce2671cc7e157cd81 +oid sha256:179bdac81143630f9d441635b2b26fa7932ed558003eca339746b0003a725b51 size 904767 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.neff index b17d55caa1b58e299dee600e47ddd7acc15f59fe..df2021c67dbf73a1bee8200a8b91d77ef129f6ef 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6283f00665e3747e029a916a314a7185c78798b530296350881c6422ec1cad72 +oid sha256:a37fc84e549c108bc966313a5725202957b82812292828925d342489eb7729b4 size 5827584 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/wrapped_neff.hlo index c51d74f1722e036a88f7b7580dcaf479cf3d039d..9579b00f0362321fcdc8283eeab34f80267bc3e2 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/wrapped_neff.hlo +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_d50f09930f3886ac4b66+a02c3a36/wrapped_neff.hlo @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f36761cca5a82603e8d8cb052c52a7b98c82217d90b6c06f094e68d980b82636 +oid sha256:7fef7123c53ed6ad89406099987d3e6d38e26878221cb72cd5cedfb1903467a0 size 5994108 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.hlo_module.pb index efcaab2c12bed35b75bda2df9c71132dc3a407f8..e1104868a009ec48ecee42207eb0ef654b6bbcdf 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.hlo_module.pb +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.hlo_module.pb @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8039f37cf8f74df32eb6821df951e715cb9be5a7b6c9374dafd414d5ed8545bd +oid sha256:6d205571fe7e17384578352c7c49dc0c2d095ae2bdb745edb1db783c94df73fc size 1538064 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.neff index 6b17c7a094f3eed6d7c1501f0916bc4fc22b29b9..437c05b7653d062022a1933cd90f1c870ad57d50 100644 --- a/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.neff +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_da7543b73fbd9c77b695+6170d8e1/model.neff @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d1d31257822d52e37e1fc1b5d7630208f8c8b75bbff6ad6594c32a1335526791 +oid sha256:98d1b4384f2a614ccd9b9a1bd6dfc1ee06f0277e6dd173cf6795f23e60fc3fb3 size 111862784 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..5726abc7d1d8c52fa95bc7919439a23a23fe3b9a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c3b444a061ff6cb628610bfe5e8dc6ced9d75794 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045b4161134cc33f193bdc9814c10fa16d6580268459ce1e9f8b2420b90e2687 +size 63730 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a73372f6912ea7efa020f0324f4b496a8e478e2a --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03ea89708cbc600861ff5d0317bb9cd78dbd197ab4b901e4e29a2203c64640d +size 205824 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/wrapped_neff.hlo b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..8ef8bee18ba16a946f37e2d07617fe351f5dc955 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_eb72db24aed4f48d28a3+a02c3a36/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ca963a5e5396123ea678f7c8db629fc8a493a9b51a7174b7153011755791e3 +size 211973 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/compile_flags.json b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..9c277888420f00defd99fc3c102007a98b09199d --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/chunked_prefill/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.done b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.hlo_module.pb b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a5b8d890a4324ce274af387700cd37f5223f2016 --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd64107d28e01165c8ab88ef41786247a405b11ee1ef036aec04441574e3ab4 +size 577272 diff --git a/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.neff b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..42ae96f62b594d6c99bb67d306439c7f4b7ce3ad --- /dev/null +++ b/neuronxcc-2.21.33363.0+82129205/MODULE_ff6e0ad0581f507d369c+6170d8e1/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621aa5ade9b49c81ebeaec4c0d0525e99babff80a721576e36c59a1d3c1c7d66 +size 27526144