optimum-internal-testing-user
commited on
Synchronizing local compiler cache.
Browse files- neuronxcc-2.16.345.0+69131dd3/0_REGISTRY/0.0.28.dev0/inference/gpt2/gpt2/3892f63e7f690f4188da.json +1 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/compile_flags.json +1 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/model.done +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/model.hlo_module.pb +3 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/model.neff +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/compile_flags.json +1 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/model.done +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/model.hlo_module.pb +3 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/model.neff +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/compile_flags.json +1 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/model.done +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/model.hlo_module.pb +3 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/model.neff +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/compile_flags.json +1 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/model.done +0 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/model.hlo_module.pb +3 -0
- neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/model.neff +0 -0
neuronxcc-2.16.345.0+69131dd3/0_REGISTRY/0.0.28.dev0/inference/gpt2/gpt2/3892f63e7f690f4188da.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"activation_function": "gelu_new", "architectures": ["GPT2LMHeadModel"], "attn_pdrop": 0.1, "bos_token_id": 50256, "embd_pdrop": 0.1, "eos_token_id": 50256, "initializer_range": 0.02, "layer_norm_epsilon": 1e-05, "model_type": "gpt2", "n_ctx": 1024, "n_embd": 768, "n_head": 12, "n_inner": null, "n_layer": 12, "n_positions": 1024, "neuron": {"auto_cast_type": "fp16", "batch_size": 4, "checkpoint_id": "gpt2", "checkpoint_revision": "607a30d783dfa663caf39e06633721c8d4cfcd7e", "compiler_type": "neuronx-cc", "compiler_version": "2.16.345.0+69131dd3", "num_cores": 2, "sequence_length": 1024, "task": "text-generation"}, "reorder_and_upcast_attn": false, "resid_pdrop": 0.1, "scale_attn_by_inverse_layer_idx": false, "scale_attn_weights": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "summary_type": "cls_index", "summary_use_proj": true, "task_specific_params": {"text-generation": {"do_sample": true, "max_length": 50}}, "use_cache": true, "vocab_size": 50257}
|
neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/model.done
ADDED
File without changes
|
neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88b60f37cc5529ee3ea81f418c235ea87ba7b7721a249c48cefe87093fdb03ea
|
3 |
+
size 131152
|
neuronxcc-2.16.345.0+69131dd3/MODULE_1090c91454701eac92a9+613edded/model.neff
ADDED
Binary file (615 kB). View file
|
|
neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/model.done
ADDED
File without changes
|
neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0623b16d94dcdf5b110f5d7b0ba30e14c32c070a7443e5a6a2cc54b3746db38c
|
3 |
+
size 131152
|
neuronxcc-2.16.345.0+69131dd3/MODULE_5a9cc28c7336fd9ea3ab+613edded/model.neff
ADDED
Binary file (482 kB). View file
|
|
neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/model.done
ADDED
File without changes
|
neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04503cb2afec625d94e1bc349c1f98e53e0240f290913c89855c64ed0cbcc6ba
|
3 |
+
size 131152
|
neuronxcc-2.16.345.0+69131dd3/MODULE_ab8029e291c37141655e+613edded/model.neff
ADDED
Binary file (462 kB). View file
|
|
neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/compile_flags.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
["--target=trn1", "--model-type=transformer", "--auto-cast=none", "--execute-repetition=1"]
|
neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/model.done
ADDED
File without changes
|
neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/model.hlo_module.pb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f705944710984a8e878af5918f6d9c61b50ed20958fc08747d379761088ea407
|
3 |
+
size 131152
|
neuronxcc-2.16.345.0+69131dd3/MODULE_aeecac19cd61e7fb1951+613edded/model.neff
ADDED
Binary file (534 kB). View file
|
|