Upload folder using huggingface_hub

Browse files

Files changed (6) hide show

README.md +23 -0
assets/tokenizer/vocabulary.spm +0 -0
config.json +121 -0
metadata.json +6 -0
model.weights.h5 +3 -0
tokenizer.json +12 -0

README.md ADDED Viewed

	@@ -0,0 +1,23 @@

+---
+library_name: keras-nlp
+---
+This is a [`Phi3` model](https://keras.io/api/keras_nlp/models/phi3) uploaded using the KerasNLP library. It can be used with the JAX, TensorFlow, and PyTorch backends.
+Model config:
+* **name:** phi3_backbone_1
+* **trainable:** True
+* **vocabulary_size:** 32064
+* **num_layers:** 32
+* **num_query_heads:** 32
+* **hidden_dim:** 3072
+* **intermediate_dim:** 8192
+* **num_key_value_heads:** 32
+* **layer_norm_epsilon:** 1e-05
+* **dropout:** 0.0
+* **max_sequence_length:** 131072
+* **original_max_sequence_length:** 4096
+* **rope_max_wavelength:** 10000.0
+* **rope_scaling_type:** su
+* **rope_scaling_short_factor:** [1.05, 1.05, 1.05, 1.1, 1.1, 1.1500000000000001, 1.2000000000000002, 1.2500000000000002, 1.3000000000000003, 1.3500000000000003, 1.5000000000000004, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.000000000000001, 2.0500000000000007, 2.0500000000000007, 2.0500000000000007, 2.1000000000000005, 2.1000000000000005, 2.1000000000000005, 2.1500000000000004, 2.1500000000000004, 2.3499999999999996, 2.549999999999999, 2.5999999999999988, 2.5999999999999988, 2.7499999999999982, 2.849999999999998, 2.849999999999998, 2.9499999999999975]
+* **rope_scaling_long_factor:** [1.0299999713897705, 1.0499999523162842, 1.0499999523162842, 1.0799999237060547, 1.2299998998641968, 1.2299998998641968, 1.2999999523162842, 1.4499999284744263, 1.5999999046325684, 1.6499998569488525, 1.8999998569488525, 2.859999895095825, 3.68999981880188, 5.419999599456787, 5.489999771118164, 5.489999771118164, 9.09000015258789, 11.579999923706055, 15.65999984741211, 15.769999504089355, 15.789999961853027, 18.360000610351562, 21.989999771118164, 23.079999923706055, 30.009998321533203, 32.35000228881836, 32.590003967285156, 35.56000518798828, 39.95000457763672, 53.840003967285156, 56.20000457763672, 57.95000457763672, 59.29000473022461, 59.77000427246094, 59.920005798339844, 61.190006256103516, 61.96000671386719, 62.50000762939453, 63.3700065612793, 63.48000717163086, 63.48000717163086, 63.66000747680664, 63.850006103515625, 64.08000946044922, 64.760009765625, 64.80001068115234, 64.81001281738281, 64.81001281738281]
+This model card has been generated automatically and should be completed by the model author. See [Model Cards documentation](https://huggingface.co/docs/hub/model-cards) for more information.

assets/tokenizer/vocabulary.spm ADDED Viewed

Binary file (500 kB). View file

config.json ADDED Viewed

	@@ -0,0 +1,121 @@

+{
+    "module": "keras_nlp.src.models.phi3.phi3_backbone",
+    "class_name": "Phi3Backbone",
+    "config": {
+        "name": "phi3_backbone_1",
+        "trainable": true,
+        "vocabulary_size": 32064,
+        "num_layers": 32,
+        "num_query_heads": 32,
+        "hidden_dim": 3072,
+        "intermediate_dim": 8192,
+        "num_key_value_heads": 32,
+        "layer_norm_epsilon": 1e-05,
+        "dropout": 0.0,
+        "max_sequence_length": 131072,
+        "original_max_sequence_length": 4096,
+        "rope_max_wavelength": 10000.0,
+        "rope_scaling_type": "su",
+        "rope_scaling_short_factor": [
+            1.05,
+            1.05,
+            1.05,
+            1.1,
+            1.1,
+            1.1500000000000001,
+            1.2000000000000002,
+            1.2500000000000002,
+            1.3000000000000003,
+            1.3500000000000003,
+            1.5000000000000004,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.000000000000001,
+            2.0500000000000007,
+            2.0500000000000007,
+            2.0500000000000007,
+            2.1000000000000005,
+            2.1000000000000005,
+            2.1000000000000005,
+            2.1500000000000004,
+            2.1500000000000004,
+            2.3499999999999996,
+            2.549999999999999,
+            2.5999999999999988,
+            2.5999999999999988,
+            2.7499999999999982,
+            2.849999999999998,
+            2.849999999999998,
+            2.9499999999999975
+        ],
+        "rope_scaling_long_factor": [
+            1.0299999713897705,
+            1.0499999523162842,
+            1.0499999523162842,
+            1.0799999237060547,
+            1.2299998998641968,
+            1.2299998998641968,
+            1.2999999523162842,
+            1.4499999284744263,
+            1.5999999046325684,
+            1.6499998569488525,
+            1.8999998569488525,
+            2.859999895095825,
+            3.68999981880188,
+            5.419999599456787,
+            5.489999771118164,
+            5.489999771118164,
+            9.09000015258789,
+            11.579999923706055,
+            15.65999984741211,
+            15.769999504089355,
+            15.789999961853027,
+            18.360000610351562,
+            21.989999771118164,
+            23.079999923706055,
+            30.009998321533203,
+            32.35000228881836,
+            32.590003967285156,
+            35.56000518798828,
+            39.95000457763672,
+            53.840003967285156,
+            56.20000457763672,
+            57.95000457763672,
+            59.29000473022461,
+            59.77000427246094,
+            59.920005798339844,
+            61.190006256103516,
+            61.96000671386719,
+            62.50000762939453,
+            63.3700065612793,
+            63.48000717163086,
+            63.48000717163086,
+            63.66000747680664,
+            63.850006103515625,
+            64.08000946044922,
+            64.760009765625,
+            64.80001068115234,
+            64.81001281738281,
+            64.81001281738281
+        ]
+    },
+    "registered_name": "keras_nlp>Phi3Backbone"
+}

metadata.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+    "keras_version": "3.3.3",
+    "keras_nlp_version": "0.10.0",
+    "parameter_count": 3821079552,
+    "date_saved": "2024-05-06@23:42:02"
+}

model.weights.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7c2d6ff5183500e9167a354765ed755ab633417e989acf9e8c4aa07a2ea9e60
+size 7643265592

tokenizer.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+    "module": "keras_nlp.src.models.phi3.phi3_tokenizer",
+    "class_name": "Phi3Tokenizer",
+    "config": {
+        "name": "phi3_tokenizer",
+        "trainable": true,
+        "dtype": "int32",
+        "proto": null,
+        "sequence_length": null
+    },
+    "registered_name": "keras_nlp>Phi3Tokenizer"
+}