Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +34 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/5d4688c06ca1eea9cd2d.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/642817569926cd4530c8.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/c29571197f94c8546e45.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/d9b1eaeab430d169db57.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/57d08ed2158d3bc4efd8.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/be28f38f27aeb510e1c8.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/c9527c01253d9424170a.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/d6a72bcc14cde1f0364f.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/f6a3964311a50e56da2e.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22/inference/llama/defog/sqlcoder-7b-2/08b79e703c61b2f851cc.json +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_142005b3d93076706472+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_312cb57ef1e4a82c10e2+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_31bd89a484b00253cd84+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_522ed20ba0b487552ad5+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/compile_flags.txt +1 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/model.hlo_module.pb +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/model.neff +3 -0
- neuronxcc-2.13.66.0+6dfecc895/MODULE_5ab5b6d9ff18b8896d5a+2c2d707e/compile_flags.txt +1 -0
.gitattributes
CHANGED
@@ -2654,3 +2654,37 @@ neuronxcc-2.13.66.0+6dfecc895/MODULE_5f931e8bf304c87202cd+2c2d707e/model.neff fi
|
|
2654 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_a4fe1c700a9abdb20641+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2655 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b54a08c18ad776940cd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2656 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b59ff3b7e545f85152c8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2654 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_a4fe1c700a9abdb20641+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2655 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b54a08c18ad776940cd0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2656 |
neuronxcc-2.13.66.0+6dfecc895/MODULE_b59ff3b7e545f85152c8+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2657 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2658 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2659 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2660 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2661 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2662 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2663 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2664 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2665 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2666 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2667 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2668 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2669 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_5ab5b6d9ff18b8896d5a+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2670 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_62cafa382ec618cff287+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2671 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_639cfa0c302f955a704e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2672 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_64d9d7ab844b064ddcff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2673 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_72f780796470e2d45102+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2674 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7943455ee983f978e58c+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2675 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_7c67afcb8bd12bae0123+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2676 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_85a47887d4fc41e26097+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2677 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_8f8b48a08a0c68320dbf+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2678 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_98b888cee6ab04043987+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2679 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_9db2a3438f041d4e467e+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2680 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a29e3f3cc47445e1c231+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2681 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_a97de47fb0d0f47ea4c0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2682 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_b7517ea4b617cd73f3ad+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2683 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_cda75e05b1d55681d8eb+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2684 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d4cc88cd9d2d907c99f6+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2685 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_d66f5802e5ad890e3919+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2686 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_e334ed8a755e5380cbbd+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2687 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ea017e5effcd92c4e6ff+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2688 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_ee55eab3eac6b30f23a0+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2689 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_f2145a17aa8d689f7038+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
2690 |
+
neuronxcc-2.13.66.0+6dfecc895/MODULE_f74f07a635721468c2ae+2c2d707e/model.neff filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/5d4688c06ca1eea9cd2d.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/642817569926cd4530c8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/c29571197f94c8546e45.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-13b-chat-hf/d9b1eaeab430d169db57.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 5120, "initializer_range": 0.02, "intermediate_size": 13824, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "meta-llama/Llama-2-13b-chat-hf", "checkpoint_revision": "a2cb7a712bb6e5e736ca7f8cd98167f81a0b5bd8", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 24, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 40, "num_hidden_layers": 40, "num_key_value_heads": 40, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/57d08ed2158d3bc4efd8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 16, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/be28f38f27aeb510e1c8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/c9527c01253d9424170a.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/d6a72bcc14cde1f0364f.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 32, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22.dev0/inference/llama/meta-llama/Llama-2-7b-chat-hf/f6a3964311a50e56da2e.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 4096, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 8, "checkpoint_id": "meta-llama/Llama-2-7b-chat-hf", "checkpoint_revision": "f5db02db724555f92da89c216ac04704f23d4590", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 8, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 10000.0, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32000}
|
neuronxcc-2.13.66.0+6dfecc895/0_REGISTRY/0.0.22/inference/llama/defog/sqlcoder-7b-2/08b79e703c61b2f851cc.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 11008, "max_position_embeddings": 16384, "model_type": "llama", "neuron": {"auto_cast_type": "fp16", "batch_size": 1, "checkpoint_id": "defog/sqlcoder-7b-2", "checkpoint_revision": "7e5b6f7981c0aa7d143f6bec6fa26625bdfcbe66", "compiler_type": "neuronx-cc", "compiler_version": "2.13.66.0+6dfecc895", "num_cores": 2, "sequence_length": 4096, "task": "text-generation"}, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 32, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 1000000, "tie_word_embeddings": false, "torch_dtype": "float16", "use_cache": true, "vocab_size": 32016}
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9651ac6a82101e2da0eaa54eeb71671927d1cd35f7031e1118c9c8e3ce902b75
|
3 |
+
size 292188
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_01fe42b103324d50dd0f+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aae69ecb4a3764efc750d860ab1879542a56e8aafd867b24207fadd57030ee8
|
3 |
+
size 8244224
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_142005b3d93076706472+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2816b10dcc5107592b5bd8fbb9b828cef19ae6a6dc281edfce5c134ea8620073
|
3 |
+
size 301369
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26525b90f7655fdf8a1366ab186317f8ef87a940102130a131edd3b776c64afa
|
3 |
+
size 299610
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_21b1b0223e4fb6f5af41+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:647d4971554b115074a5d1efb73a71b547215bc89bc5ac3af9683f91af042454
|
3 |
+
size 2161664
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1a4e9a556d295e43b93fa54987cb08b21f05a761fa322beaf0d839587b5dc0f
|
3 |
+
size 299610
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_3020655465d2e0990c19+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13f64c745785649059fd2bf9f760387b9aa29ed2a436e808878ac9dcc8190b53
|
3 |
+
size 2427904
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_312cb57ef1e4a82c10e2+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:069bc855215002ad4f29ae20d3c0cd082bbcda7d16f8c8ec12634a88a46afba7
|
3 |
+
size 298010
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_31bd89a484b00253cd84+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fffb92a5dc964361ba99f5becaf80f146e749dc2982eb1fc859f504258bd6807
|
3 |
+
size 337486
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f92f7c0539766a36e06f93be6b5b8c26736837fbb84bef8e733e5c120d68248
|
3 |
+
size 420713
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_4051477874156d7450fe+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faadd4e50cafb354ca4100bda46e5f0d49ad82431050ed22da69790a3d1088e7
|
3 |
+
size 30024704
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a39002c742b526c1d25080f085d4404e696f5067844da317a4403bdba477a12
|
3 |
+
size 295835
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_410c6d6a0c764608be0d+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7c9a4d8ad38fcaf1fa8e44ac96793d75451f4867d4565c278d4d087246fb207
|
3 |
+
size 8909824
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54fa5b9b20bbb94ac7dd18e82683af038f246e41bfb3288999d178cb3344e384
|
3 |
+
size 296219
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_426cd9312d26b5e0bf95+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f087f3482370f029c3910b2ebce46016ca33dec12fa2b2b11dbfab59ba8acb3
|
3 |
+
size 2960384
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_443c7de81db84f0f078c+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2710534bde9e62b9aa96153376baf77e2ef7e50d21728ab651f5b97c616c836a
|
3 |
+
size 30024704
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a2f181f04beaac9d096d3aebf89aa6ea883d5c6db15fe4a428cf5cffbdd5df7
|
3 |
+
size 299610
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_44563e64a3dddda1db4d+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04731055ba71bc04552825fc869ee2fc20dea0efe8e56b5ce5aac95584ec347a
|
3 |
+
size 2212864
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74fd95bec34f2c116fa9bca9f99add961a4c24981b58125584a6ac5b1043c244
|
3 |
+
size 299610
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_47eae16823191f315893+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:036d173fe684811ba65e05a405f930106563744240bfaf8d18160825adc5d652
|
3 |
+
size 2274304
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0fde127dfb0a3f1949f1d87211ddacd4c9d874cb52202b18fd3018b93864c91
|
3 |
+
size 299226
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_4d18af62746967c79d82+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab29489f59000a5075367e42c5edd166c342f5cd6a8abb3f879482db038fffe6
|
3 |
+
size 7619584
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_522ed20ba0b487552ad5+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b41ed0c1d8390f2103dc0517b13b748bc779e5644c02efab33444c5f81b76640
|
3 |
+
size 382458
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f22e2dbe61f23faa7225930e9ede6e502e603385b8e6ad00802b87ec9013f2cc
|
3 |
+
size 476771
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_539309b68144a4afde0b+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ba405706383c6fcafbf7a0879e2579e7b558e76e216b5a6ee6524b8cc0b0f14
|
3 |
+
size 14285824
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be6313039d8693ed78d1a25acff373312bf0b3c837edff815caec3f70d2bfabd
|
3 |
+
size 299226
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_53f35b4110e7bebbcc45+2c2d707e/model.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23af3682bd096103b870f32821c8aaea0a03a2fe3c3554f8cb76014c6516d21c
|
3 |
+
size 8182784
|
neuronxcc-2.13.66.0+6dfecc895/MODULE_5ab5b6d9ff18b8896d5a+2c2d707e/compile_flags.txt
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
--model-type=transformer --auto-cast=none
|