Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +34 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/9699616599829b48b4a5.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/db1d9051ff5698e52393.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/2a30c91813b1e7196f95.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/6434dcc45c7c9439f30f.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/7e91caedb706bd96bd3a.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/f22f49b5301c6c906c34.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/fd9b28c3749a3bbd30c5.json +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1fef5a5f1f14da33eb81+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1fef5a5f1f14da33eb81+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_1fef5a5f1f14da33eb81+2c2d707e/model.hlo_module.pb.lock +0 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/model.neff +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/model.neff +3 -0
.gitattributes
CHANGED
@@ -3386,3 +3386,37 @@ neuronxcc-2.14.227.0+2d4f85be/MODULE_3ee79106ae9bfc013100+2c2d707e/model.neff fi
|
|
3386 |
neuronxcc-2.14.227.0+2d4f85be/MODULE_7651246321963ddd5906+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3387 |
neuronxcc-2.14.227.0+2d4f85be/MODULE_ade80a2b19e816657dab+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3388 |
neuronxcc-2.14.227.0+2d4f85be/MODULE_e1e4cdeee8e8e42ef9b0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3386 |
neuronxcc-2.14.227.0+2d4f85be/MODULE_7651246321963ddd5906+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3387 |
neuronxcc-2.14.227.0+2d4f85be/MODULE_ade80a2b19e816657dab+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3388 |
neuronxcc-2.14.227.0+2d4f85be/MODULE_e1e4cdeee8e8e42ef9b0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3389 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3390 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3391 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3392 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3393 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3394 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3395 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3396 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3397 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3398 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3399 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3400 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3401 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3402 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_5ddb9c233d7c07c4b83e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3403 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_606e1ed5209ba86b600f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3404 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_64e06093d33a080bb222+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3405 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_667659b5880c8aa3c228+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3406 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_6c1d37c6bbfb3ba83465+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3407 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_712f16088b92ce1552a7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3408 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_7a376947f78404875f58+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3409 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_862db2bb1f4da5e95e09+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3410 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_8ae58871e7bd6db4281f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3411 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_941adcb49c0b0f9430a7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3412 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_a16cad38f886c688ecef+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3413 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_b79befd674e052c44c9f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3414 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_ce4004e47d7f9259e48d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3415 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_cebc0d79dffdb4b073d7+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3416 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_cf27c4eb2bcac29fb7ec+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3417 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_ddff37e03914d1e4cc1a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3418 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_e5482971f7e49838a230+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3419 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_e774925ef02cac9260be+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3420 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_eae40350bbf4ea1569ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3421 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_ec7ce1cb59fb29fdc73b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
3422 |
+
neuronxcc-2.14.227.0+2d4f85be/MODULE_f8a00a8cdaa177ccee23+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/9699616599829b48b4a5.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/db1d9051ff5698e52393.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 12, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/2a30c91813b1e7196f95.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/6434dcc45c7c9439f30f.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/7e91caedb706bd96bd3a.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/f22f49b5301c6c906c34.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.227.0+2d4f85be/0_REGISTRY/0.0.24.dev0/inference/llama/meta-llama/Meta-Llama-3-8B/fd9b28c3749a3bbd30c5.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "max_position_embeddings": 8192, "mlp_bias": false, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "meta-llama/Meta-Llama-3-8B", "checkpoint_revision": "62bd457b6fe961a42a631306577e622c83876cb6", "compiler_type": "neuronx-cc", "compiler_version": "2.14.227.0+2d4f85be", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "use_cache": true, "vocab_size": 128256}
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff95035e476d55cb19ab6f04831b676160715c7ba56816bef2dd715f62de978d
|
3 |
+
size 337090
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_0129170172f364916548+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d17fee8b81f0b1a9ee6c71dabc3552b6616c5a395b34b97db4a14f61c93e9aa
|
3 |
+
size 3513344
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78bda1c787c58a7c91b56f5c7bc8cffba94e94affe25ed93afd5e75f1b41e5ef
|
3 |
+
size 263042
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_0157f35eb303445e190f+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7db5f4e4ff0fb41ea2c0aa51f9da32b038d998b8eb0635fbcab0a8370a38aa75
|
3 |
+
size 2950144
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1f9c7e6febf4b6937cf831c6ec7659ef5b065859fc687e36653a12472a9a257
|
3 |
+
size 360581
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_01cc804175cc5fb0e309+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dadd8d705ed9d61451880279b44436fb5abd9d041d6b90e9618a9147f590f63
|
3 |
+
size 3963904
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a21b4e04683b0ecb3052baa6c2f05c1f684e2f40d95a167aa502e0e442500f03
|
3 |
+
size 254881
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_09f9384fda97faade242+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c53bac818c03b3c793c41613d5b40308c20d165c3f100ab9df66af5bcdd1b8ea
|
3 |
+
size 2182144
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85f62f3312bb3b755f884a1668727749d3edb7c62f5590aa3b004172869bc5b6
|
3 |
+
size 310896
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_17fbd51961c885174794+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b267ba5da88500b41b89df63e92abe854e50731e0dcb566710114839f4705c37
|
3 |
+
size 1803264
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75ddd0fa36baa1ffccb172c1a5e0c2af3a9aec90cf1a79ecbef7a9e747040e4a
|
3 |
+
size 333872
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1d5c76706b604a934e43+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d81d1a2b6c9128f1f9f3c909c8dff0d0c6f7d839c6f023d57fbe47f009fd2bd
|
3 |
+
size 2386944
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24b359f3a640fad8eb963b7fe1d12dbe1380b0bfd3a56e3ac07119c4d217d779
|
3 |
+
size 310896
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fc52214ed4eaafa2af7+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a937ee53b82284d3ed7aff05236e716e7b45577b1030731bbb2cf685e480ac2
|
3 |
+
size 1854464
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fef5a5f1f14da33eb81+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fef5a5f1f14da33eb81+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1df1d44f0b7301fccee5b1311bb42c246185f9b33739c0de9d3fbc82dbb0f23e
|
3 |
+
size 337090
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_1fef5a5f1f14da33eb81+2c2d707e/model.hlo_module.pb.lock
ADDED
File without changes
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c13b522ad45166c5df2d2864c1eb75df2e240879c6db4533b22fec098ee634cf
|
3 |
+
size 266465
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_21e3dcaee19883fe287e+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46d2bbf3ced346caeca9b387944857cc266b88dfb8fc2c6ca2c875bbcf2beae2
|
3 |
+
size 13579264
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66452bc80c6804461bfe9ed58e8d59ba7106d79887919d1139972e51d33fd28f
|
3 |
+
size 254881
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_24c094e5b8a7b8e26a59+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:248d8d76e4a30688a0c48ab115764c4f66071105dd48582da7ab9567a3ffe428
|
3 |
+
size 3021824
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79f9714a849abc7a81c860cd24be5de76ad7c037cc74d9c2a225804e0c55e069
|
3 |
+
size 266465
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_33719efab65aba8971de+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:460463feb4e313823bb824da26e2566be4085337a55419a65ec4974c8ace19b3
|
3 |
+
size 3830784
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7caf33af677e610fa453612d92d55000aafccd9b14c1bd123db271075d9e50d5
|
3 |
+
size 254881
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_3448a997dcf7ffa8ce06+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ec3576b030b6fb48ec55178a1056c3af50cd58313a1fdb5a91bf202862db943
|
3 |
+
size 2530304
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd139da3e58ca2056b373f09ffbf8e773c93a76e58f75c55cbd26628da9d07f5
|
3 |
+
size 445757
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_51b8528780dc9259618f+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:948f59aa59d651441150d47d706482cf1e8021cd4daad8056fda4408ef915bd6
|
3 |
+
size 31960064
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86bc5dc29eeab6253e1b53adab0036033b35cf8a282f7eb9d965252cb13b244e
|
3 |
+
size 445757
|
neuronxcc-2.14.227.0+2d4f85be/MODULE_51fa2c5a5f3058eea401+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:573f29e5cd81f542c64ce5854cdeb79386e8fd9ea5fe13f8cfa2f10b81d52982
|
3 |
+
size 31960064
|