diff --git a/.gitattributes b/.gitattributes index 2e3fc92e367ae5bcb9ab5e82e1501a2851b5e94c..c8a97229c5ebbc35b879709c7dcbad61fa76836f 100644 --- a/.gitattributes +++ b/.gitattributes @@ -11867,3 +11867,25 @@ neuronxcc-2.21.18209.0+043b1bf7/MODULE_14611821751025129524+bad9cf09/model.neff neuronxcc-2.21.18209.0+043b1bf7/MODULE_1798959443618413102+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_393045707851385331+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text neuronxcc-2.21.18209.0+043b1bf7/MODULE_4395987120667329067+bad9cf09/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.neff filter=lfs diff=lfs merge=lfs -text +neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.neff filter=lfs diff=lfs merge=lfs -text diff --git a/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/llama/meta-llama/Llama-3.2-1B/59041c9140e83957fcc2.json b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/llama/meta-llama/Llama-3.2-1B/59041c9140e83957fcc2.json new file mode 100644 index 0000000000000000000000000000000000000000..06f894bf8eb660de0451daac2b0d82de94221a6b --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/llama/meta-llama/Llama-3.2-1B/59041c9140e83957fcc2.json @@ -0,0 +1,77 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.2-1B", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 1, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "meta-llama/Llama-3.2-1B", + "checkpoint_revision": "4e20de362430cd3b72f300e6b0f18e50e7166e08", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 2, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 2048, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 2048, + "neuronxcc_version": "2.20.9961.0+0acef03a", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 2048, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 2, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/llama/meta-llama/Llama-3.2-1B/96440af3992c61db1915.json b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/llama/meta-llama/Llama-3.2-1B/96440af3992c61db1915.json new file mode 100644 index 0000000000000000000000000000000000000000..88bb07eb7b9a17cef17367a873dffdff5e2ce72b --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/llama/meta-llama/Llama-3.2-1B/96440af3992c61db1915.json @@ -0,0 +1,77 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "meta-llama/Llama-3.2-1B", + "_task": "text-generation", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 1, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "meta-llama/Llama-3.2-1B", + "checkpoint_revision": "4e20de362430cd3b72f300e6b0f18e50e7166e08", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": true, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 1, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 2048, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 2048, + "neuronxcc_version": "2.20.9961.0+0acef03a", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 2048, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 1, + "vocab_parallel": false + }, + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "use_cache": true, + "vocab_size": 128256 +} \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/qwen2/Qwen/Qwen2.5-7B/6fc75d9e400329069010.json b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/qwen2/Qwen/Qwen2.5-7B/6fc75d9e400329069010.json new file mode 100644 index 0000000000000000000000000000000000000000..43358af2228dfdd537be096d3475c7317a2b0f60 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/qwen2/Qwen/Qwen2.5-7B/6fc75d9e400329069010.json @@ -0,0 +1,71 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "Qwen/Qwen2.5-7B", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "hidden_act": "silu", + "hidden_size": 3584, + "initializer_range": 0.02, + "intermediate_size": 18944, + "max_position_embeddings": 131072, + "max_window_layers": 28, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 1, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "Qwen/Qwen2.5-7B", + "checkpoint_revision": "d149729398750b98c0af14eb82c78cfe92750796", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": false, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 2, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 2048, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 2048, + "neuronxcc_version": "2.20.9961.0+0acef03a", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 2048, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 2, + "vocab_parallel": false + }, + "num_attention_heads": 28, + "num_hidden_layers": 28, + "num_key_value_heads": 4, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": 131072, + "tie_word_embeddings": false, + "use_cache": true, + "use_mrope": false, + "use_sliding_window": false, + "vocab_size": 152064 +} \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/qwen2/arcee-ai/arcee-lite/aaad74b827582e109166.json b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/qwen2/arcee-ai/arcee-lite/aaad74b827582e109166.json new file mode 100644 index 0000000000000000000000000000000000000000..45ab71a4cf62bde325e5a8dfab099cef7055cae4 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/0_REGISTRY/0.3.0/qwen2/arcee-ai/arcee-lite/aaad74b827582e109166.json @@ -0,0 +1,70 @@ +{ + "_entry_class": "SingleModelCacheEntry", + "_model_id": "arcee-ai/arcee-lite", + "_task": "text-generation", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "hidden_act": "silu", + "hidden_size": 1536, + "initializer_range": 0.02, + "intermediate_size": 8960, + "max_position_embeddings": 32768, + "max_window_layers": 28, + "model_type": "qwen2", + "neuron": { + "_serialized_key": "NxDNeuronConfig", + "async_mode": false, + "attn_kernel_enabled": false, + "batch_size": 1, + "capacity_factor": null, + "cc_pipeline_tiling_factor": 2, + "checkpoint_id": "arcee-ai/arcee-lite", + "checkpoint_revision": "c5cb9c38be16b64757f785f0df36dca87f76d5e2", + "continuous_batching": false, + "enable_bucketing": false, + "ep_degree": 1, + "flash_decoding_enabled": false, + "fused_qkv": false, + "glu_mlp": true, + "is_chunked_prefill": false, + "local_ranks_size": 2, + "logical_nc_config": 1, + "max_batch_size": 1, + "max_context_length": 2048, + "max_topk": 256, + "mlp_kernel_enabled": false, + "mlp_kernel_fuse_residual_add": false, + "n_active_tokens": 2048, + "neuronxcc_version": "2.20.9961.0+0acef03a", + "num_cores_per_group": 1, + "on_device_sampling": true, + "optimum_neuron_version": "0.3.0", + "output_logits": false, + "padding_side": "right", + "pp_degree": 1, + "qk_layernorm": false, + "qkv_kernel_enabled": false, + "rpl_reduce_dtype": "bfloat16", + "sequence_length": 2048, + "sequence_parallel_enabled": false, + "speculation_length": 0, + "start_rank_id": 0, + "target": null, + "torch_dtype": "bfloat16", + "tp_degree": 2, + "vocab_parallel": false + }, + "num_attention_heads": 12, + "num_hidden_layers": 28, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": true, + "use_cache": true, + "use_sliding_window": false, + "vocab_size": 151936 +} \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..07b8a0cd343ef055a376342f97e8f789dad4ebaa --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e97945c7aa39207e4c0573a12e7c0daf41de18887466041dae687748e11602 +size 679803 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..8fd9b97793843b58c04515266ddfd5721dfbc672 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_0a113de31eae6e0cd5ea+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8755b3ca0b48f0875b7ef368ce891da56963170f4f8b46e352718100990ee252 +size 3636224 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..ca52456a698c2220393d65f5a4fec5280750a90b --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db744394a0c423f4f3bd9aeed587f1626c4bd8c310867545e7cf7ccc6a912860 +size 371739 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a1c104db1c0557eb9ac70869f7b6659ce2e108ee --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_21fb9cbd6bc31f93ffc7+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd98bac47a28a2d1126fcfca9ad2579a775033448ce80b1c0350e5702f5100c +size 9657344 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..124660c894564636321ba0275c88bd305143af44 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a74c0049d74cb0cc9d967d1d7ea350ba916c89acfbfe54e18c0f36696e0c719 +size 660175 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..061e54edabea95e8d9beca58432582918094b71b --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_244d0637c526ac81b414+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e891ff7e08be3d14ee7a833ea2d46a1de88887f6e44c7d103a45b6af959964f +size 10732544 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..f995bcd349338e79ffde287fa464f048d7588f18 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:950d4b81fcbc51f2ee05e4b54ec72c34ed6a614a09777678ab8256ccadf4c25a +size 740840 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..232b50fc9427c7b65adb5c03c5b5f928b13a2c43 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe618c73e74cdd8db0825b2bc1429797edc127378610f6efc354a4275dc62f1 +size 6145024 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..6c7d00aa254b0193481f82a5bded2069c1eecd9c --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_3634540e2564ed96b5da+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160f04d4186c56abdcafb441db29b46e6a05932c324492e3b7e8f82c35db298a +size 6339591 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..47e3824b45a6783ad56f2c375fac6d875e2beea0 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d391b1d7dbf4f034f49282f26255219468054f0a8333e9e7b2990521de02e2a0 +size 388806 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..47864ec3c6cc9aa5665d7e537e0077e37970a1ac --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da7c1e95569880d633b22e37a0a3595d9d7b5512a76703ee264afc7a406f047 +size 2335744 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..815366cbe9c7297907d4ef0bb5c4c95a109ade7e --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_48e1dbda70c7b45843ee+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106b77e6679e9a0a7723043bf22964feffa0545658a41eccf5953697cb730d34 +size 2407399 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..724769fc90ef6314ff1aa48b9a44659535acf902 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options='--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --verify-hlo=false' --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e6c1545d481136586c6679b53694a4c72257de1c --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03509621db932b2ad273e9eb6035e68292df17c21e9eb99d8f09d22c5cc22926 +size 69007 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..a91863b55eb4f4a374e85e6e9120ba8943ff36bf --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_52f62927e2aef61c8a2a+ae6a382b/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f595fde6155be56d50d6da408103d6a443f33bc13593725934a650d1f79c547 +size 1352704 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..724769fc90ef6314ff1aa48b9a44659535acf902 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options='--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --verify-hlo=false' --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..899aa0646f7cd5ea0a93e6dbe8588885af138381 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a026f3c0afa9452f8e28cdfbad2e7e345e697bb30fd481c536111993679da0 +size 201977 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b8e7c824b52c7e40e818a4cfcf7deb6dafd3dd76 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_7e3a1a26312c81c65e8f+ae6a382b/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e92eb3fef01485419a56e993bff077ed797984730707b5730e493864719624 +size 6554624 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..1569eac18fc7f34b3fe66166f2d7a4a59dbc5aa4 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/context_encoding_model/_tp0_bk0/log-neuron-cc.txt"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..187b04375b42bc61b80893da0378d09e732cfd96 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08b3c5395792211a3272bef80039b605b36847cd4a86941f65c417d19b17a1b4 +size 343143 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5643abf52bc1ce8a250b798c3e0f2c9ec82960a4 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_a7bb15d22b2a18c55870+ed72d204/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5776d9905351a073af4bfce4191a08faa6247cece91a4368db3e10ab67929cd2 +size 20204544 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..724769fc90ef6314ff1aa48b9a44659535acf902 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options='--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --verify-hlo=false' --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..93803b8e91733b63c9b75075e3fd05148d289130 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3df471f965045c386c6e8db1b96baa6e68fd5adbc463b3ff4ee9e534efee4e +size 71540 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..5355656493748f1ab6a9a68abd05780f0da5867f --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_b42ea471c6d81a15b0b3+ae6a382b/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d54349cbc656b3fae72730ffaeadb9a4d2ed25de24bb152402b20385fd1dd0 +size 2663424 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..724769fc90ef6314ff1aa48b9a44659535acf902 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/compile_flags.json @@ -0,0 +1 @@ +"--model-type=transformer -O1 --lnc=1 --internal-hlo2tensorizer-options='--experimental-unsafe-fp8e4m3fn-as-fp8e4m3 --verify-hlo=false' --logfile=/tmp/nxd_model/layout_opt/log-neuron-cc.txt" \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..58c70ec53346cf6218e89c574540b9625ad1613d --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c27fc08e1e4d7a8468ed18e98af82fedc774d2582c19d7152128f4ce8b8e3d2b +size 177861 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..0addb1eb99b40403c839310abbb79069f84527a8 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d22c269383bdc0775b95+ae6a382b/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bd9e2f6f0168634b093fec4cfc765432ecb8c69add8da6f44065ee3f22cdf4 +size 1557504 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..39b7341e4c54b6ff6c26093b8445f9e830410478 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e82cf9e4b37a6d040b934497f5bd95de4d2bc09d8d1fd9321190908082ef08 +size 417093 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..19ea551f8e993f43a2742f76a3e0322fd33f9603 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff6fb536f5311aa204272fdf28bcbdba3d2d2c1a6fe5216ec353631fe404fb0 +size 1475584 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..15af5fc84d128103122016360defd3d7442185c7 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_d48baee12d51947bcd73+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db0533e3c4f8af4b36bb3d8fb01894facf40b63567bf572a2b0900eece71096 +size 1545293 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/compile_flags.json b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..34675115220079309bfad2d45680c478c378a3c0 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--auto-cast=none", "--model-type=transformer", "--tensorizer-options=--enable-ccop-compute-overlap --cc-pipeline-tiling-factor=2 --vectorize-strided-dma ", "-O2", "--lnc=1", "--logfile=/tmp/nxd_model/token_generation_model/_tp0_bk0/log-neuron-cc.txt", "--enable-internal-neff-wrapper"] \ No newline at end of file diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.done b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.hlo_module.pb b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..64aeb4a550622fa8a91ae9a1ad38e32a4bbc97de --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8cc2bbd8c94a38a2ead5f56dd679499592383f765fd0ee2bd7360a1e6b5ae59 +size 722078 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.neff b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..12de4959c745e734dfd8b514bc2dbd05a2a4fd5e --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d95adf4dfb6fd313bef5f81d47f4572eeab38e26eb586fdd4e6b952987fcbced +size 2028544 diff --git a/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/wrapped_neff.hlo b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/wrapped_neff.hlo new file mode 100644 index 0000000000000000000000000000000000000000..8a3ecd75ecb9fe6f7eec3ed9f1d66554d4d38f11 --- /dev/null +++ b/neuronxcc-2.20.9961.0+0acef03a/MODULE_e5fef74c2bea22a04c7c+a9d440f5/wrapped_neff.hlo @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee3a7460146bce927178756058d46a5c47e457edf21ba3d5c6a2388ef98f9ca +size 2200239 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..5c225d20574c52bb6515b5d96f001e6c59bb1eb4 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3091aeeb1f5e4708c1ad59508c67a1fedd3a516df0e0afac4e15f9bfb2d6f30 +size 344 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..ca68285d4b482f0041f75691a7d55901d29ac55e Binary files /dev/null and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_11196433285822111861+f7f529f3/model.neff differ diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..e2a80f4f231b9e95a497ed57c51fb007f56389b0 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3afd51e170457584f3451175cbc74fc3081a18bd541e5bea42623940e01f6cb6 +size 727356 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..1e9299ce71fc9ec21a247c8aecabdc1164affb77 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_15640073450153027801+f7f529f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308b62a50b370427d7a5e19bb71b97807941c2e6c2408269b143db0b60ef69fa +size 56843264 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..966843d3426174da4fbe5439771db802958cce49 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a2a59793ee743e4e6791a93826e9d8b659e75fe53fc156eec64c9cb2e3a08b +size 697784 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..f020f639bca22e702f02184de6c171ab7531074e --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17272134439322064525+f7f529f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f7e95e4544a67219b0bbf85115cf11732a6ec5cf408c790a9b5539cdb87c74 +size 55512064 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..381e98366b358fdf5bf6d890924eb36032f66d14 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68b99d4bdd342d3bf6014ee4f11bb29cbed8851ce637bf9dd0464717458ae1a9 +size 488888 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..402c8ac2605aafefd8f7a753c1896955061a5df7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_17799376403849510564+f7f529f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5061358abf9178383d71951a2d2d1d380bda848693df618c3555640fe6e3b820 +size 7640064 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..c3f5c8cb0e5b3c615dc5be15c41959bd0be4ce7a --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82d729126a1be7d93a829cf3b65f215a18e3f290dcc0e934e81cd507e15ca662 +size 427539 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..2a660331ae679cf423ff4c51470ab4d88b2b6ba1 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_18274421132528031246+f7f529f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330d9392c8b0df5e572f22aac02ca60a4b328d3624fbececc9ca22fa3fb1a05b +size 2786304 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..cdd842742a654d32cfed3c9be74f8c6ba76f27c7 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09094ad9afcbdcc0061526a1abbbdf0a441608c11b2441f810748a6233be5585 +size 1808 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..c015aa0800ce9aa4a6ba8b72546e82068f9b8087 Binary files /dev/null and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_478170247348345721+f7f529f3/model.neff differ diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..606f315f8390b7e9f597c725a929b53e82425f33 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2757f834875524a6874480afa91f38795ae2d85db0c8e41c843b415ffc59cfd6 +size 727846 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..624db649f1781cb003d3871f4327939f872263bf --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_7645671890323173873+f7f529f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b264aac60717de3e809cc8a82dabb5cbba2ce2dfd36402b03360dfe903dbb2dd +size 56802304 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..217ce72b44b450aa802e7fd8a0b8ff4d56418c3f --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:187249b0558d1d9b3cf76d2cc0a566a57172f074f16ce7a86cb13cd25770464c +size 1016 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..6e18b238613f5b89cd73aab173187171497dc61d Binary files /dev/null and b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_8351548107491623024+f7f529f3/model.neff differ diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/compile_flags.json b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/compile_flags.json new file mode 100644 index 0000000000000000000000000000000000000000..fcbf3eee4b2662df595c4faa9e131d744f5ad30d --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/compile_flags.json @@ -0,0 +1 @@ +["--target=trn1", "--model-type", "transformer"] \ No newline at end of file diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.done b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.done new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.hlo_module.pb b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.hlo_module.pb new file mode 100644 index 0000000000000000000000000000000000000000..efe3ca56170028a68a86289fc319b9620f174ac9 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.hlo_module.pb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d07a4f6a08a44df8baaf6c500106614b18c8ac3798c810df72494eb8697904 +size 698278 diff --git a/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.neff b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.neff new file mode 100644 index 0000000000000000000000000000000000000000..b4cb73463e2dcba1a3805362413002ee3e6f26d3 --- /dev/null +++ b/neuronxcc-2.21.18209.0+043b1bf7/MODULE_9669004554499106932+f7f529f3/model.neff @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dad13313644c22e05dccf5865296c9974a6fd47ce6863182cdeb5e484433645 +size 55471104