diff --git a/.gitattributes b/.gitattributes index 9973172379135fd6c0459a712dba784629351df8..31669fa3bc4fecb02568de5c373d8eb65c829a0f 100644 --- a/.gitattributes +++ b/.gitattributes @@ -11846,3 +11846,16 @@ neuronxcc-2.21.18209.0+043b1bf7/MODULE_7585b7b81ecc283af772+a9d440f5/model.neff neuronxcc-2.21.18209.0+043b1bf7/MODULE_7585b7b81ecc283af772+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_bae931052fc7117dae12+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_bae931052fc7117dae12+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.neff filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.0/qwen3/Qwen/Qwen3-1.7B/b585d22c18c97a77d096.json b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.0/qwen3/Qwen/Qwen3-1.7B/b585d22c18c97a77d096.json new file mode 100644 index 0000000000000000000000000000000000000000..0313e982d16ad7e05f874eed319d7d98ffeda933 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/0_REGISTRY/0.4.0/qwen3/Qwen/Qwen3-1.7B/b585d22c18c97a77d096.json @@ -0,0 +1,87 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen3-1.7B", + "_task": "text-generation", + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 6144, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 28, + "model_type": "qwen3", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "batch_size": 1, + "capacity_factor": null, + "checkpoint_id": "Qwen/Qwen3-1.7B", + "checkpoint_revision": "70d244cc86ccca08cf5af4e1e306ecf908b1ad5e", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "fused_qkv": true, + "glu_mlp": true, + "local_ranks_size": 2, + "max_batch_size": 1, + "max_context_length": 1024, + "max_topk": 256, + "n_active_tokens": 1024, + "neuronxcc_version": "2.21.18209.0+043b1bf7", + "on_device_sampling": true, + "optimum_neuron_version": "0.4.0", + "output_logits": false, + "pp_degree": 1, + "sequence_length": 1024, + "speculation_length": 0, + "start_rank_id": 0, + "target": "trn2", + "torch_dtype": "bfloat16", + "tp_degree": 2 + }, + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..4c38858d1b0cd3b024059d9b15733d59c838ad1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07174650ed082f05343a1a0c22304432637b32de422464f64e36dea97f029d9d +size 2521699 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9224d89f2c9d06c99935dbde904667b6487ef5c3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_10817282954366970288+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d0c9498543cb73b93023034b26d64a0b737e90818e36ccaafce638fee60d43 +size 22918144 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..9f032d4117a3ac1b0eab1a687361cc480367026a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dfc1f574b376498bd4e195b60167f1c8023101ff924536a4c6b4e47c887a59a +size 2443379 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..458591837a695beeb14fa48b14730e8f4b80786d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11100513296980391091+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95eb2db32f69df655725730f969c7af6468e81b8b8bfabc5336712d6ad2b6874 +size 22457344 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..21a822dfb7e75a6b0f0219fc4cd8a6dbe9602028 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f5f0278402f49bed4e4d3ffa3e216e4ef13575b8b64092ffa81ab9841bf4b5 +size 2521579 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..4549666e70afbee7028b8ce905a5777569cf90d1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11829150976780473518+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4a46d9afd8d647ace6916aa71ddde6c330bba7cdf0a29a55a903c6e661316e +size 22918144 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5a83f317e5e75d3e8c73da92135bc1f32a5f8d02 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45403b54475b0cb139b2dbba9afdbcbedc544de8feaa0f6080aaf28c4f51504 +size 2444070 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..865fd4aca707485fe7d2c862ae7eb10ced9f5861 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_126401019188484947+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a94126a878f4aafc1bb889b789438a7ace15d69cb2270213f789f07483484d0 +size 22457344 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..598d57f2bc7b71439f778ad85eb5351e4d535916 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934d38fdefe53a4af49f8852c3e627c320721a6fde85269c0f4a1a826f340613 +size 2444194 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c3eb81d3a76b64082c48003bc67bf3a742833628 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_12706500199947902857+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff87237d4d2ed6c14ac2e7f14d4909cd55b059890cd841acb725760255e2da8 +size 22498304 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..be2f7dd47fbf3879a9cba1869de6be3251ecb4af --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34a957e105066af033ea058fe161dcb4e89d43bd0f5b10c1fbb54fcd40a79cd +size 1312413 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1a0ac2ad5ee3f56ae6913add470dbc9a57a7d63d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_14723768718767503596+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f982317fbdbf4f4802c25a6fafc0091569293c3f0004c3363d6e1843bae446 +size 3871744 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8c4ff937ece29aaf50873506b5ed42c0714b79ea --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84cdaec48dec521acf57d467d37567782b9e4e146ddae93ba75b1fde167fae2d +size 2444074 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..948e95700f96c1a7956ffd633d445852af0c15a5 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_1517159787117774618+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4854866cb4f8f324dbe2f710c2135831b8c5376431a50957455984a01eb5012c +size 22498304 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..8b4a77108953b5e669277746b78116fbec211bb3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5415e070fef2b0f82ab8dc83a1b7235ee56907766147007335809b59d549572 +size 1810 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..e4ce16234fe9be502f8b8f4deb6188ee6b1cdbed Binary files /dev/null and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15786686745870740384+bad9cf09/model.neff differ diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..2a4fe1e15641dd0c2d5e4f5e6e62f90d4e5a2993 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed0b10113b065f9981de47571651f2ef421e5b6c355d83a034a5803d07ea61ff +size 346 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ae0e16ad3708151df3e61b26680a4875d3df6b6d Binary files /dev/null and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15804984955746879243+bad9cf09/model.neff differ diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..8da50ffdebbe4b136d67d64bb87ac42d154163d7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=2", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..312ae3d3c2102acd346fee0a5de155fb14d6ada1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21183781ec82e4446778469cd7bada09e0ac4f1745c4b3aea2d7c34f63d9454 +size 1989136 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..90874c22dd57985ef20305f7312e85c950fea1ff --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563983466664c40d4fc21fe8849dc3e121bfc0b2385cab79d445d5d96008effa +size 3687424 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/wrapped_neff.hlo b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..7b87798f2c0eae663cf2b3a16bd131a710d82a35 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_2a171560988b9ff4796c+747527b0/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b071395cef8730962a25537669c31ff152815487c77421e439a177fb7d1ba3ec +size 3825515 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..d0727cfeb5cb9134e6f6af0542945f538eb08e96 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ccea92314c735d4f60af13dfb9c65c8d98759d4b397f9e6e04c99939a22bf0 +size 2520884 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..13da27e1590cc985b861abb31c5d6aa88c017f2c --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_3432504749543175755+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71260077fd6c31ba0d9175141d3559c2fd109bc27b8b83195dc48fd5515a2c6c +size 22846464 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..a1b318938bfcc70b261cd86785d13559dc12bef6 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1efde08019c2a149cd0013bc813c6feeb2f62239ee1e97bf902e91af117e056b +size 1028 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5608e9a246db3a81311cb0c7c1d8e8ae1bcfda53 Binary files /dev/null and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_5922683378015269857+bad9cf09/model.neff differ diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..774625225b22739279ec95af891678cf58f21554 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c1abe59f3f84ba4624d3024ef8f3d4c157bb76d13332eb8df7c9fb2a074f3bf +size 2521575 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..87b215c293226c039a2494a074a8bf066ae923db --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_6009855936990338611+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea099508846fbfdec9d10c6af94636f229d02d03046f0d135d994282fd73bb58 +size 22856704 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..eb5e1b634149a270654878b6978943bf4c50af1b --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..138e7963a7b6538b966abe60e84c3b6d7f9030b9 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f516f524713616a92c64c17a4911587790c4b94c7813f640fcd04c6a5b12d144 +size 1175351 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..9afb6e782852e26ac7eab40d81f62189c255cb69 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8781809999900598498+bad9cf09/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52bde2cca7f76daaaf696deee14b412d44911320fba52a37280b74791d8c320a +size 3124224 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fc27c67e0f3bd30aba010defcc6c2d0646e87b83 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn2", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=2", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..dbe64d7551c33e3c78e7a9e7efa874a6c1ff2edf --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c764646a387504e073b9894b2e7079cf9ca659e2f6ff9b8630f0cfb37fc98e73 +size 2198633 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..663e429ba4d6838891028d47ce869bebfd175d09 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_bd89854370a2ef01c9c4+877608f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c9d2e3c1af79348a199fafc7af5aa758c249dac5fa6630434695bd74a77297 +size 9739264