diff --git a/mlc-chat-config.json b/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..4a0d4acd410f6e24fae9652b0d402193dd13a405
--- /dev/null
+++ b/mlc-chat-config.json
@@ -0,0 +1,16 @@
+{
+ "model_lib": "Llama-2-13b-chat-omniquant-w2a16g128asym",
+ "local_id": "Llama-2-13b-chat-omniquant-w2a16g128asym",
+ "conv_template": "llama-2",
+ "temperature": 0.7,
+ "repetition_penalty": 1.0,
+ "top_p": 0.95,
+ "mean_gen_len": 128,
+ "max_gen_len": 512,
+ "shift_fill_factor": 0.3,
+ "tokenizer_files": [
+ "tokenizer.model"
+ ],
+ "model_category": "llama",
+ "model_name": "Llama-2-13b-chat-omniquant"
+}
\ No newline at end of file
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..fa13f8c0dd3e0567f5d873e3e705c93c3d124bf2
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,6995 @@
+{
+ "metadata": {
+ "ParamSize": 565
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 327680000,
+ "records": [
+ {
+ "name": "param_0",
+ "shape": [
+ 32000,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 327680000,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_7",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 31703040,
+ "records": [
+ {
+ "name": "param_1",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_2",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 19660800
+ },
+ {
+ "name": "param_3",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20889600
+ },
+ {
+ "name": "param_4",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_5",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 28672000
+ },
+ {
+ "name": "param_6",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29081600
+ },
+ {
+ "name": "param_8",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 29491200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_15",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_21",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_9",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_10",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_11",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_12",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_13",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_14",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_16",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_17",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_18",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_19",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_20",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_29",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_22",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_23",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_24",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_25",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_26",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_27",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_28",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_30",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_31",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_32",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_35",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_43",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_33",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_34",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_36",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_37",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_38",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_39",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_40",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_41",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_42",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_44",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_45",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_49",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_57",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_46",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_47",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_48",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_50",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_51",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_52",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_53",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_54",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_55",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_56",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_58",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 31723520
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_63",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_71",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_59",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_60",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_61",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 7782400
+ },
+ {
+ "name": "param_62",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_64",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 8601600
+ },
+ {
+ "name": "param_65",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 10813440
+ },
+ {
+ "name": "param_66",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 13025280
+ },
+ {
+ "name": "param_67",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30720000
+ },
+ {
+ "name": "param_68",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31825920
+ },
+ {
+ "name": "param_69",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32931840
+ },
+ {
+ "name": "param_70",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32942080
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_77",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 33054720,
+ "records": [
+ {
+ "name": "param_72",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_73",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_74",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_75",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9011200
+ },
+ {
+ "name": "param_76",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9420800
+ },
+ {
+ "name": "param_78",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_79",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 12042240
+ },
+ {
+ "name": "param_80",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 14254080
+ },
+ {
+ "name": "param_81",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31948800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_91",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 32829440,
+ "records": [
+ {
+ "name": "param_82",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_83",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1105920
+ },
+ {
+ "name": "param_84",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1116160
+ },
+ {
+ "name": "param_85",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 1126400
+ },
+ {
+ "name": "param_86",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20787200
+ },
+ {
+ "name": "param_87",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22016000
+ },
+ {
+ "name": "param_88",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 23244800
+ },
+ {
+ "name": "param_89",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29798400
+ },
+ {
+ "name": "param_90",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 30208000
+ },
+ {
+ "name": "param_92",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 30617600
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_99",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_105",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_93",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_94",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_95",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_96",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_97",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_98",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_100",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_101",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_102",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_103",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_104",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_113",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_106",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_107",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_108",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_109",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_110",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_111",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_112",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_114",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_115",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_116",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_119",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_127",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_117",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_118",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_120",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_121",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_122",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_123",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_124",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_125",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_126",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_128",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_129",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_133",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_141",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_130",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_131",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_132",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_134",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_135",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_136",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_137",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_138",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_139",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_140",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_142",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 31723520
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_147",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_155",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_143",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_144",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_145",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 7782400
+ },
+ {
+ "name": "param_146",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_148",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 8601600
+ },
+ {
+ "name": "param_149",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 10813440
+ },
+ {
+ "name": "param_150",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 13025280
+ },
+ {
+ "name": "param_151",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30720000
+ },
+ {
+ "name": "param_152",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31825920
+ },
+ {
+ "name": "param_153",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32931840
+ },
+ {
+ "name": "param_154",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32942080
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_161",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 33054720,
+ "records": [
+ {
+ "name": "param_156",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_157",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_158",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_159",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9011200
+ },
+ {
+ "name": "param_160",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9420800
+ },
+ {
+ "name": "param_162",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_163",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 12042240
+ },
+ {
+ "name": "param_164",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 14254080
+ },
+ {
+ "name": "param_165",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31948800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_175",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 32829440,
+ "records": [
+ {
+ "name": "param_166",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_167",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1105920
+ },
+ {
+ "name": "param_168",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1116160
+ },
+ {
+ "name": "param_169",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 1126400
+ },
+ {
+ "name": "param_170",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20787200
+ },
+ {
+ "name": "param_171",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22016000
+ },
+ {
+ "name": "param_172",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 23244800
+ },
+ {
+ "name": "param_173",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29798400
+ },
+ {
+ "name": "param_174",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 30208000
+ },
+ {
+ "name": "param_176",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 30617600
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_183",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_189",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_177",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_178",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_179",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_180",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_181",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_182",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_184",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_185",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_186",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_187",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_188",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_197",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_190",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_191",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_192",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_193",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_194",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_195",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_196",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_198",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_199",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_200",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_203",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_211",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_201",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_202",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_204",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_205",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_206",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_207",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_208",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_209",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_210",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_212",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_213",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_217",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_225",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_214",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_215",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_216",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_218",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_219",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_220",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_221",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_222",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_223",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_224",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_226",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 31723520
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_231",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_239",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_227",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_228",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_229",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 7782400
+ },
+ {
+ "name": "param_230",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_232",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 8601600
+ },
+ {
+ "name": "param_233",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 10813440
+ },
+ {
+ "name": "param_234",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 13025280
+ },
+ {
+ "name": "param_235",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30720000
+ },
+ {
+ "name": "param_236",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31825920
+ },
+ {
+ "name": "param_237",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32931840
+ },
+ {
+ "name": "param_238",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32942080
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_245",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 33054720,
+ "records": [
+ {
+ "name": "param_240",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_241",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_242",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_243",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9011200
+ },
+ {
+ "name": "param_244",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9420800
+ },
+ {
+ "name": "param_246",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_247",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 12042240
+ },
+ {
+ "name": "param_248",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 14254080
+ },
+ {
+ "name": "param_249",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31948800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_259",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 32829440,
+ "records": [
+ {
+ "name": "param_250",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_251",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1105920
+ },
+ {
+ "name": "param_252",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1116160
+ },
+ {
+ "name": "param_253",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 1126400
+ },
+ {
+ "name": "param_254",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20787200
+ },
+ {
+ "name": "param_255",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22016000
+ },
+ {
+ "name": "param_256",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 23244800
+ },
+ {
+ "name": "param_257",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29798400
+ },
+ {
+ "name": "param_258",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 30208000
+ },
+ {
+ "name": "param_260",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 30617600
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_267",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_273",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_261",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_262",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_263",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_264",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_265",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_266",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_268",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_269",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_270",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_271",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_272",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_281",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_274",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_275",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_276",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_277",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_278",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_279",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_280",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_282",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_283",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_284",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_287",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_295",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_285",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_286",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_288",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_289",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_290",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_291",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_292",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_293",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_294",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_296",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_297",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_301",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_309",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_298",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_299",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_300",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_302",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_303",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_304",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_305",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_306",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_307",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_308",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_310",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 31723520
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_315",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_323",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_311",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_312",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_313",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 7782400
+ },
+ {
+ "name": "param_314",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_316",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 8601600
+ },
+ {
+ "name": "param_317",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 10813440
+ },
+ {
+ "name": "param_318",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 13025280
+ },
+ {
+ "name": "param_319",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30720000
+ },
+ {
+ "name": "param_320",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31825920
+ },
+ {
+ "name": "param_321",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32931840
+ },
+ {
+ "name": "param_322",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32942080
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_329",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 33054720,
+ "records": [
+ {
+ "name": "param_324",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_325",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_326",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_327",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9011200
+ },
+ {
+ "name": "param_328",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9420800
+ },
+ {
+ "name": "param_330",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_331",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 12042240
+ },
+ {
+ "name": "param_332",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 14254080
+ },
+ {
+ "name": "param_333",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31948800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_343",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 32829440,
+ "records": [
+ {
+ "name": "param_334",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_335",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1105920
+ },
+ {
+ "name": "param_336",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1116160
+ },
+ {
+ "name": "param_337",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 1126400
+ },
+ {
+ "name": "param_338",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20787200
+ },
+ {
+ "name": "param_339",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22016000
+ },
+ {
+ "name": "param_340",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 23244800
+ },
+ {
+ "name": "param_341",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29798400
+ },
+ {
+ "name": "param_342",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 30208000
+ },
+ {
+ "name": "param_344",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 30617600
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_351",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_357",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_345",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_346",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_347",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_348",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_349",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_350",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_352",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_353",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_354",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_355",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_356",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_365",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_358",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_359",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_360",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_361",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_362",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_363",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_364",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_366",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_367",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_368",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_371",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_379",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_369",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_370",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_372",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_373",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_374",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_375",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_376",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_377",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_378",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_380",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_381",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_385",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_393",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_382",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_383",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_384",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_386",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_387",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_388",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_389",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_390",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_391",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_392",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_394",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 31723520
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_399",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_407",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_395",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_396",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_397",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 7782400
+ },
+ {
+ "name": "param_398",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_400",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 8601600
+ },
+ {
+ "name": "param_401",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 10813440
+ },
+ {
+ "name": "param_402",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 13025280
+ },
+ {
+ "name": "param_403",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30720000
+ },
+ {
+ "name": "param_404",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31825920
+ },
+ {
+ "name": "param_405",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32931840
+ },
+ {
+ "name": "param_406",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32942080
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_413",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 33054720,
+ "records": [
+ {
+ "name": "param_408",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_409",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_410",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_411",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9011200
+ },
+ {
+ "name": "param_412",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9420800
+ },
+ {
+ "name": "param_414",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_415",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 12042240
+ },
+ {
+ "name": "param_416",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 14254080
+ },
+ {
+ "name": "param_417",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31948800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_427",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 32829440,
+ "records": [
+ {
+ "name": "param_418",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_419",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1105920
+ },
+ {
+ "name": "param_420",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1116160
+ },
+ {
+ "name": "param_421",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 1126400
+ },
+ {
+ "name": "param_422",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20787200
+ },
+ {
+ "name": "param_423",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22016000
+ },
+ {
+ "name": "param_424",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 23244800
+ },
+ {
+ "name": "param_425",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29798400
+ },
+ {
+ "name": "param_426",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 30208000
+ },
+ {
+ "name": "param_428",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 30617600
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_435",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_441",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_429",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_430",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_431",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_432",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_433",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_434",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_436",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_437",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_438",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_439",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_440",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_449",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_442",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_443",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_444",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_445",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_446",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_447",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_448",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_450",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_451",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_452",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_455",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_463",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_453",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_454",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_456",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_457",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_458",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_459",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_460",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_461",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_462",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_464",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_465",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_469",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_477",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_466",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_467",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_468",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_470",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_471",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_472",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_473",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_474",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_475",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_476",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_478",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 31723520
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_483",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_491",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 32952320,
+ "records": [
+ {
+ "name": "param_479",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_480",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_481",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 7782400
+ },
+ {
+ "name": "param_482",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 8192000
+ },
+ {
+ "name": "param_484",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 8601600
+ },
+ {
+ "name": "param_485",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 10813440
+ },
+ {
+ "name": "param_486",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 13025280
+ },
+ {
+ "name": "param_487",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30720000
+ },
+ {
+ "name": "param_488",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31825920
+ },
+ {
+ "name": "param_489",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32931840
+ },
+ {
+ "name": "param_490",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 32942080
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_497",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 33054720,
+ "records": [
+ {
+ "name": "param_492",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_493",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_494",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_495",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9011200
+ },
+ {
+ "name": "param_496",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 9420800
+ },
+ {
+ "name": "param_498",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9830400
+ },
+ {
+ "name": "param_499",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 12042240
+ },
+ {
+ "name": "param_500",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 14254080
+ },
+ {
+ "name": "param_501",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 31948800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_511",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 32829440,
+ "records": [
+ {
+ "name": "param_502",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_503",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1105920
+ },
+ {
+ "name": "param_504",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 1116160
+ },
+ {
+ "name": "param_505",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 1126400
+ },
+ {
+ "name": "param_506",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20787200
+ },
+ {
+ "name": "param_507",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22016000
+ },
+ {
+ "name": "param_508",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 23244800
+ },
+ {
+ "name": "param_509",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 29798400
+ },
+ {
+ "name": "param_510",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 30208000
+ },
+ {
+ "name": "param_512",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 30617600
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_519",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_525",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 31969280,
+ "records": [
+ {
+ "name": "param_513",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_514",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_515",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19906560
+ },
+ {
+ "name": "param_516",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21012480
+ },
+ {
+ "name": "param_517",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_518",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 22128640
+ },
+ {
+ "name": "param_520",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 22138880
+ },
+ {
+ "name": "param_521",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23367680
+ },
+ {
+ "name": "param_522",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 24596480
+ },
+ {
+ "name": "param_523",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31150080
+ },
+ {
+ "name": "param_524",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 31559680
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_533",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 33361920,
+ "records": [
+ {
+ "name": "param_526",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_527",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 2211840
+ },
+ {
+ "name": "param_528",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 4423680
+ },
+ {
+ "name": "param_529",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22118400
+ },
+ {
+ "name": "param_530",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 23224320
+ },
+ {
+ "name": "param_531",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24330240
+ },
+ {
+ "name": "param_532",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 24340480
+ },
+ {
+ "name": "param_534",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24350720
+ },
+ {
+ "name": "param_535",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25579520
+ },
+ {
+ "name": "param_536",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 26808320
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_539",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 19660800,
+ "records": [
+ {
+ "name": "param_547",
+ "shape": [
+ 15360,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 19660800,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 27627520,
+ "records": [
+ {
+ "name": "param_537",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_538",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 409600
+ },
+ {
+ "name": "param_540",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 819200
+ },
+ {
+ "name": "param_541",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 3031040
+ },
+ {
+ "name": "param_542",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 5242880
+ },
+ {
+ "name": "param_543",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 22937600
+ },
+ {
+ "name": "param_544",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 24043520
+ },
+ {
+ "name": "param_545",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25149440
+ },
+ {
+ "name": "param_546",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 25159680
+ },
+ {
+ "name": "param_548",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 25169920
+ },
+ {
+ "name": "param_549",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 26398720
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_553",
+ "shape": [
+ 27648,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 327680000,
+ "records": [
+ {
+ "name": "param_562",
+ "shape": [
+ 32000,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 327680000,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 32782336,
+ "records": [
+ {
+ "name": "param_550",
+ "shape": [
+ 5120,
+ 320
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 6553600,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_551",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6553600
+ },
+ {
+ "name": "param_552",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 6963200
+ },
+ {
+ "name": "param_554",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 7372800
+ },
+ {
+ "name": "param_555",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 9584640
+ },
+ {
+ "name": "param_556",
+ "shape": [
+ 5120,
+ 864
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 17694720,
+ "byteOffset": 11796480
+ },
+ {
+ "name": "param_557",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 29491200
+ },
+ {
+ "name": "param_558",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 30597120
+ },
+ {
+ "name": "param_559",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31703040
+ },
+ {
+ "name": "param_560",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31713280
+ },
+ {
+ "name": "param_561",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 31723520
+ },
+ {
+ "name": "param_563",
+ "shape": [
+ 2048,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 524288,
+ "byteOffset": 31733760
+ },
+ {
+ "name": "param_564",
+ "shape": [
+ 2048,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 524288,
+ "byteOffset": 32258048
+ }
+ ]
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5c88e85e65bad524119bfa0f2fae156b044dc45d
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eeb8c2d8a4ba799831bc7f2feed6bac6fb242a6d26632fa2502a091e83596e44
+size 327680000
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..439a84d04a8d7f2266a97a6d822902a30d2d5f6d
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ac8c327c61e3d94e00043992ae989a7ef8f59be7d96a85049193bd34cbb56b4
+size 35389440
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..986ff9913eb98153f87fa6a29eb7c27617c1a45a
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:db89f9eee3e37020a4611f2d43c1ed1f3ae460c358b86a8e29236cb5882e7adc
+size 27627520
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c6754d6640b6c7ecf5abb028dd1faa87105ccc4
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a98d18f9c731d2fac3d7faf12393365e375612b123fefae1254f1c54e190e9d
+size 27627520
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1bda6bfc2ed2ad93ce30e486427c4ea4574297a5
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b95cd9b54285e79ecda038fc53e544ddcf1909228dc0172689a133e23436d615
+size 35389440
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..194ecda1c13a04e94589384a4e86394671a5941c
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:413279fe8f15743a1a5e422940b7fcb9db4c6e13b097a7e5f8813d45b6b2a961
+size 19660800
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..17ddaa67fa38b5d435f79e2277980b1777d8879a
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a145b719098199bab55ee35810a8d033d210e491a6be359cece622f2ace2bef4
+size 32952320
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a674ce911c433ef8f842d926b92279feea46c5d1
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38d643aba418fe452bc2edd9eefdd82b95b81fea9d9d0dff9f9d1b8c6bfceae8
+size 35389440
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2df8caf8077b259acabef8c16a64fb5a330a597a
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e621849b9e6af299206a3345d0c63c1e40ace2b0c545a7874be3325d335a0daf
+size 19660800
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7381638719a5b70eb65f52fd62b997a6c0a85dc7
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1575233467df54e91274a46273a15d7d6e5f422c3d14b87c77553d8539f4e5fd
+size 32952320
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..676815c7859687845aba6ddccbcd168ffcd4a678
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79aa1a2c8fb2230dd3b4a12d1503a9f53d43a5b2596aa82a70a781cc0793a7af
+size 35389440
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af5d00769f247dbcf9016e92e6ac2c88141266de
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5a35f7cf31b5fabbfc55d4782990caa43d79d8a75746b17d77319b497df4a76
+size 33054720
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..07c74c5d0a68d44d10cb27f36f694f0988d9b9e0
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a160a4e496d851bbb053c6272529fcb37a03fa4d5ca7792aa8205b274a1635b7
+size 35389440
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..79bdbe8b0710f90bb4902746b8ede919f183d780
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02d1ba3f2a1f36bf890f44ab1aa1e3e66d0b22a15c6cb2114c32a6396d9666bb
+size 35389440
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0479d2edc8b58517f773e0844487cc75dc83871b
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:349abcaa9364f868d983a0f1d9c551bd58f1ebd08859ee3746b7966bcaa44506
+size 32829440
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a39912b5797c97db9d748a5bb75effc16296d718
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af251bd824ba072897c4dee30476f7f01e37ddf46b06f2e0f9ad165089b018c4
+size 19660800
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a813d719f06eca1b7394e521bd942e312af4f7f
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3f92e9f9676fd161522f4909417b7f75ee3d8da0f845048924a37219fcd84b9
+size 35389440
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06dacddbe21859cbc4dcc65f192fb4bec528eaa0
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cdb5c679e9574a51f2946fce92992dc86aef0c395f3ecdb10d3c33403a21a58a
+size 31969280
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7946f899927dd908a104aac29418952fc2ad5759
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e78253c9b9e62725b8f5a9da67390e3da859642fbb9cd85f40b86d31cde01f6
+size 19660800
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8d35ba0054c14a81191fd0664e6b66dec58911cc
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da42af6430e48a1d851a2c415d4e75a7c18fc1fa33eef61a80afb633ff1a8c36
+size 33361920
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6246e5ef5313b4fad35ea7da104aae03270988a5
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59a7df6e22ad1a16c9b929a64842bc95f6fc76cf4165376fecc28956f5b1cb92
+size 35389440
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d9e3e02b3a3e22e462905d48109846fb12f4818
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f9a5ba28f751defcfeba086d224e894d8e50f1f5657db284fe8141a9f3bfe85
+size 19660800
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..41e69b254449f510c661d6b4f2bf047cf53e4b40
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:24de112da564e66d4941555d8de617dec61ae3e5cd2a2e59b2b2271212bd1e85
+size 27627520
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d27ea628b33f1455b898387d4827e084f597e2b
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9330c7e823446d7bbfec8ec8bf2b5edd6ef13c83b81e467dbd48fb954bca9f48
+size 35389440
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0afe1f9f2a4b2b609f30f6b85321ce5a84b962a0
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6c7b937ef4dc7df8a8a1796951972fe994b5b8798f9dccac0444f02829a7ef67
+size 19660800
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9aa5e1fa75b01bbfad295e607e70f1a7597ba12e
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fccdfe5f59afdb742bc2a8fba7155f0578ecf599ad9018ae27b806ac73cfadc
+size 327680000
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da4eeb082b07c8ae67f65f6f5bad800308928b95
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25366520631d9263b1ebc0d729662006865328c779c340d27cb58b0da856a045
+size 32782336
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d62678a091753f1e0a747ca7950d03c443b1fc52
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:502e1d666207b2491fa413bb1208dd9a4fe95bba0328d38c0c842fd8cd6dea53
+size 32952320
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..132f386de2cd60ab239d674a6ca249e29b8c218b
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f181886a4fb52b833d137cf2848c25601e3c90373b499cb38c30f5510bb459d0
+size 35389440
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..21733ea975c1cb13682c7658c053feb18f8547e9
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2ee05bbe9093001b50cd3d364ef97918c68c176bc02d981d77ad26b84a454957
+size 19660800
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..535e4de40a46a53f3dd67435475aaa7815586e80
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aa03113ad71233c9766b2a4f3678ffbb180596dbd3570e7403c754eb9e33958f
+size 32952320
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..645367cc48cd2bb9440b07fa3489c36346e867cf
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48a6d9f56b191966691dda22a097a6eb912c7a3ec0b8df1d04af02ee71666c66
+size 35389440
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ea31754e8c05a9d35d867dec83cd996ccccd131d
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd4daed8b62c77af401bc843be2115e7e749e2d441f06e2a0a438669723f516e
+size 33054720
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..65230547ac36945bc9817296d4f24ea96d30fd17
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:868f9a6da81a37b2949c3598a3ce86fadc758c6d8041676bf8745361a26a57c6
+size 35389440
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d01f5bb2a2474982f5481d78aebfb56fbe6f528
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2f9f7d043fee7af88e324e93278fdb7f9da11daf5528749fd643ea82e3c07bd
+size 31703040
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c8bcf113468a677a4059dc88fe50bb0f399a5246
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b99f4d106a985463b476c82dd6c8c2f00c9221ced85f4bf79ee5184c4dfefcf5
+size 32829440
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e6ee3ae6906e039690252d272808d6c7f9ac66e6
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1dacc0b3974573913bf3b1615858345448e05fb8c239f862a71b66898c7920d4
+size 19660800
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..056d3b53b348a0b0fc760783feddd7b0ee686727
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e2f1cf79397b7b1ade4b0b12b41ffa7d4b629f0c4f49c38f9aaddb30062f5cd
+size 35389440
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7f6cc6ae626cab9db4a0d801ed3879f33ab1eb24
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b995fed61c185bfe7ed0a8e833236915b7eea20e690b9467f26ace1fe25da65
+size 31969280
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..02f14be23efbceb0cb26b2844b2366c7ab317f9d
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1c237c11d522f14930280a4104124348100873296c334c43f8e4d78665affd1
+size 19660800
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c52060ae1c6f5ed228ec38e89a6cfce2d6d19d6a
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c00168f50d7c83e538cbdb20ac18cb41cbdabb4cea1a2ed415e147a09dcd8460
+size 33361920
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3086d55fad3485c6f77ee2be165c46a8ab03943d
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cedefcbb94226f7c46e74cfff311882ff5b8f859c86b1f51745ad8e9185cbef1
+size 35389440
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..11d184ae277fc208321f62f48ed0f081634b8bd6
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7fdf1c3645eafa41c961f60ee201ae90d5d0a849991735416abc3bce3318d12d
+size 19660800
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1fcfe5a0244c3cbfcba63ad65cb51e01a804295a
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5853ff1490c25b863d01d0e1a3783c98b10b9a54e6e4f82c968bcae61b485ba5
+size 27627520
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3cb0f073f341728840c3a6a47718f52594169980
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fcdc51ae053e6722b9fe5e0b1da42f2b184bad3983af411b3b0ab02a7448f530
+size 35389440
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..86c171eba792ce077f225cbe22aa8449ca7f92bd
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1b3ee827e25005820f62a2b96ee5a67bacae92aa7e3cdec92fbe800de75374e
+size 19660800
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b173f785367f0e6b0d4862ccdce92a6956966692
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a95887328ef643f843da5f44248ca62ec2469c650fa3a44f7f59101b095a9f4
+size 19660800
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8cc4b38c574d2317eac685318d27e1f86eb5b14d
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:10ca6a69d14e9c7c992966aa125f6b219e588bfdd2c12673d2269558c45a3521
+size 32952320
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bc685236ae25e74fa3805e593549ce45b39d785
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc135640ebf2cf0cb124be70d5d9713a6a8dd5049c9680ab0cb8b0843e8a090c
+size 35389440
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cdec5cae6e2641aa8071a1290e5e1217d3090b78
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c46bb7f775296430aee65878abd140781efdda85d03b7c42b1dd6c7de0474b66
+size 19660800
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ce19595f4b1d493a689a2aca47f52839ab291786
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:84db2953c7510b045e629ad8545fc590390f8dedffd57a571bf62654a1cdf481
+size 32952320
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a51b3e7124b3a9a4ecff5120ace82e4613b83fad
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f552c36a607b83f5ef7a0f034eea6f9420600d92c7d6ae9eed4ce3403aee7ac1
+size 35389440
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3197a62e6f912af3d48daa4c1f457c2b95ea3372
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:34a8ed64804eea58f2c8291f639a33abe24bcd78065fc958d6856d888d5b4ce5
+size 33054720
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c950cc4aee742cdd026b8e8f82388e63d0dc1ff
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d1db73ae64509eb549c962b9bc1adfc5b32a6e3ff5a647d4bb20a5b3a2e0558
+size 35389440
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c5f9aaa7550295bfbd3c9d68525515739d7dbc00
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6530ffd7fb55e991eb62d8695f6308afd63a7950eb6e3bb7fc7316fea5205151
+size 32829440
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eac0a1c9699297fe21f3b4b900fce846b65a7cf3
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33026b8bbaa5318683bc3a1595fed474868fcc9d4bf289ed73520ab2f884759d
+size 19660800
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c208bd517d299adb402c8eb3e34c08415598b23c
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d500302656dfe904c1489509289111a7a5840409c62439a5dfe5075b52ed9ede
+size 35389440
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0e0f26b966f267f96124310756d54dc78a541c0f
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f183c24120bccef14176cf41e5bd5b91ccfd5b519d776adb4252d3856cf699a
+size 35389440
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6ad4a82fecb06cb9523c5bb0dd08c97da5d986d
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7eb60a545fa02f95fff6d0692b268525b6805f98ce7b414353ff9b0e9f818ef2
+size 31969280
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a7bd570aa1db3698f2b946dbb1366ec01b412ab1
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6568fcd74deefccf8fd5ae049b5dc531eecf4476407b0966af2f6592ba39674d
+size 19660800
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..64d2b173c55ac9dbc00ca1ffc9a8a275398debbe
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7ebd222ad260589702ab9843a5ef0866c730e0e36c30ad36aaa9ee9d3c168f9e
+size 33361920
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..46cc4f685e9f33fa5ed0dc213c98d86012f63984
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2225db773d767da886e0dbd6c3d7f681b9dc64aea92dfd7a907ce77f7ab25236
+size 35389440
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3ffa010464c252831ecd81c367af4bf06100deff
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:975b9694d7d4f70986388f3355dae34cddd9a8c70163634412346419e1c4729c
+size 19660800
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e36bb1b6e16db0061cfc2ba0da8f884e6782dd1d
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4e63e0683ab8b75a70c7bcf572ca2de7038d543e3b38ba594fa484bbca4e0b0b
+size 27627520
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..491f913dc135240002b1afe8ab97d64e01a7558d
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:663083f6ce9912a3997b259ccf541a8b21a1caadf61d723594711caae92b83ab
+size 35389440
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6bd7011a588d22fe8034656e84a08ca53fc5935e
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ba2dedf013f21cec82f2cb962964a9d7c0f4f5424b603d4ac52d3c24dab98e22
+size 19660800
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8097e994e9b592f5d2d4d949d56841986f9a036d
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bc539b5b021ab940a65b3eb9c8fca6fcd472f81ac2557828a4d0690f2c85767a
+size 32952320
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e3d864072798abfd7438f113d0db0900f3d8aa33
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:060aec9e7bba5efe97fd753cfa6fcc5a18ee4fe50b1da4717fe1517ba350a604
+size 31969280
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef6c59108962186dca84ed8d43b73ab44e11208a
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5306fb3377985fa19aaf25b97bbb6868f0849cdf6f282dc1e032b7510e20efc2
+size 35389440
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c0301b34b0c8505ccb6b1c99aebe3b4ed917b730
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0c5c20519e48356a1bd8c4ebe8f07aade79f4e81273301a30d91cd8be5f73cdd
+size 19660800
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..24627c2754592974575f5abef52c051b01dce5b4
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f7e230a693d5148871d68d2b6e91570fcc28022472589754c76a45f55c16c04
+size 32952320
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cc82e442c00cf7ff2c3d289bcf0d0d7e19ae41e6
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0dfa245bc85528045d59cacee4f40f90b6655ccf54e7bd61975bb2078dfc81f
+size 35389440
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..680fb3bbb3c392279771f04ea197a03d27ae19b6
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:894a62caec46b1a0e6e10d5a890dbb66e0bf38d2c62da304a4bd2d36fa8dbb86
+size 33054720
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e85643ffcaa910b7ccd35e02ffb5590894f28c9a
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ada895550592ba1d08bbca7702ec18441b4dfc5493249a7671205cd50f138e6e
+size 35389440
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1ad59833c8a54473c4de91f3442267e2d3069eed
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3161339e7108560deaddc41accc681d4ef3d5956c4801cb0217958061e422034
+size 32829440
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..23812ebe90e4a81bea961315442e1b288a04a116
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07301ded33b03a1b5d18c18f895565c350577d560c5b474bb391fd7518391ef0
+size 19660800
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00c901457b1c0d1c1995f38581959656449b4bde
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:03ed24b97286bdbe7dd810aed7582ab8b0c3f65dfdb5f411ec3d38beb7a437b5
+size 35389440
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0035deb820e9b3f6bab0d2459abf3c4ab44028df
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7770ab69427d876012d107ad8153b3cfa53e8e6f9bfd552f9af2ecd5485d47d
+size 31969280
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a2d792373b97cf1d4c38427542637abe0d377dc2
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6175668fad52e7599ffb4ba7dd1dda527559e295d5314879551bbd446603165a
+size 19660800
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1eb87940cb327349ccc5be3fa0498e1846503e9d
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3ece0d74d39401e5fc372dd6ad3897f7fb14565bcacced4d02f5586b466ceffb
+size 19660800
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..37c5846b6ff4b96060875adfe2aa7b2a4e988f49
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c43965ac785a406e0abec2b34a10f469e03bdf4940874ff32549b4d4567cc8d9
+size 33361920
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0365b560898626fa5775dc95b224cb71b871bcd4
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c79fecebebf0147c0c584b3912009ee4c17231d5aada551cf184a5edfde8293e
+size 35389440
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eae7caddbcb112e5684be5bf0f9f1f0a1da09670
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:47db701c14bf1a8f91645757f346a60256711769723daa9c1f527e8737889161
+size 19660800
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..23d02e45eaed7a04e8d5c631da70c82362b0930c
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69399b5eb62897140af8bcf00d971dec4f538bb6d939458979b5de530755fc8e
+size 27627520
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bbf9f58fefd7d5ebb760130fdac9dfba42930b8b
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c2aafb5e86ed481e139513d46eec48f0e388dea1801139cf44cac212920b035
+size 35389440
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1218e15a5bbf8e7b491ac87609bf05ac7829e3eb
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74fe21fd65e91b4d3a62860161f260d0e0ce9518ffc93883245a34699bd7146b
+size 19660800
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a52bf8b9ab389c1b8dced4aa02e8ddda736bac8
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:974b48c11508df106e1a05b388e58434604dea219312722d66fd89bae3fa0c8d
+size 32952320
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..29dd667abd6a71fef563f58d2062a7934981d399
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf3f79d9551ae7788cfb3ecad27d34dcfd64b4de55ee4d00c25bc8634491a359
+size 35389440
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c4b212a52850e8b4b35156d54843b7fffef270b2
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e576119b3bb373e0116c66e8d3f9007a4396821bead18db7ada9c5556aa9d6cb
+size 19660800
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b61bb211981b2d4d736dd9c6c9faecad8d4e0ed3
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dba2e252759bd762491c6cdf3efac6e1a8bb5e47135c75db55d4bc252e678eea
+size 33361920
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..76fda9de79745613778886174ac3e21fefdc8055
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cc5f54fdcfc35d3dac2cea016b7f1986a77d0d96735ba961f25558ea37cd3d86
+size 32952320
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..24f93fe7310f313c233e8a14dca5c5a0af3b005b
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aa2ac7e28aab73ab2db8aa044f1e34710617ca43f29378fe69816ba4e0895b1d
+size 35389440
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9cb70e1973219e74d042979a8504621d010d530a
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3a07eabf64e4c3a009c537b586a1724ae94829c96ae17eecb6a720f6300ceeda
+size 33054720
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a67c1b616bccee25708e24fcccd60d7c274ca7d
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d909a698e8fa91993ca3e8329041e162b04f9f17a86eb8c02edac6bc4e54e9f
+size 35389440
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..117e5cacf16a55a6fd18ce9d016fe9def36678ce
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c98b5c8c8967b9dac972d3b77e6e725e0efa59657ccd0e9ee1d1a2592e24582f
+size 32829440
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2d7a03f33a6fb54b6978aa88e3d3319c61a2c1e2
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a52465ddbe176275653db2422a90f1c0522b8d5ff3a2a13938b9c99d95b5aa13
+size 19660800
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..160d2e61ee8c338471291a93836775df4aa36b61
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bfda6267ccfbcfd736b477fa7d361c0f346910a4d5be8c8abffd41dd205f5e3f
+size 35389440
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0c9deed101445a0b984d66c464afd1a74356f8e
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e13fa5a20171946914e493d137f4df612b91a1d756e43c1c35f3bce1117e366
+size 31969280
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dc4401c49f0c6bb8aff05f73b8d7f32e5d881fe8
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce0ea6fb030e2313ff9d72661226ded51e57c232d2c5d3dcb12654450f2c14ad
+size 19660800
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cffd09d40d2344cbb90979891d5f2d849ff9e96d
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff703d3cb37213f10609c1535ea8883c07c4e9f76c8f2e326cd427aa5d6e1e5e
+size 33361920
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3ae10c221b7590795e86663e3ded116878aeb3e
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:426f23a7b9a8634a28a35d8e79605afc7709b9a386df2131bdf6480529937364
+size 35389440
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..86e36f1f21a099833c6418929dc37f87df631205
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:43aebd6eaadd9470781cbdb66ee724dea69116a7b6977ba14174d1ce62ad0498
+size 35389440
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d14b9ee7f10e437004666ccb84b45d3b8500233b
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2ad4c80bf97089ca616f1d15fa23bc32b8ae6e270bc7c3de7a9dc15e1e37f644
+size 19660800
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..56698c5e7388306873cbf8eb202277b1635a30ea
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a68ef451f64a9c8809e8e4f3f65836f4537616e70d665764cf703db354304bd4
+size 27627520
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5022bfc8633845d02e45dd13308c27ec56d584aa
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bdcff590ad7439b420b5cfb7ca1f1fff7e1eeae58312f721717e545a4f95b27e
+size 35389440
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4271f8b64a4d46d26a0935171db925bd7cb238ae
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1dc2f5ca9b9dcd249a424597b9fa405c304d52fb4aba5f211af2c163e91923ea
+size 19660800
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e15cc14ff08447084709222bee9351420ed8e6af
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7b46f5650ca28c00ac04a11c184bacc9e2afd68bfcb305f789ecc5012f01619
+size 32952320
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a8cbc236764a633deb88734951d914148888e85b
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ccc8796c25ed1ecbc30f33bda74b9e00d4c9463892c7c41aac6a25dd40d22353
+size 35389440
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1bb42ae71aa042afc86aa1a44c362f3e28313c84
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c9f732c729320caf13b23e579a660cfbc394e809a47223c71d689d5aba36806f
+size 19660800
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d40609004af8710209395746db3091d2d4e28e4
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:007980a607a308ecc61a239cae3c0bae4aaa1709f33cf055e645ab1d6e5a0bea
+size 32952320
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9bf66c07a5c3e48e414c6eb24d4130af7370fa11
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c16ef9583c000837ffc6e833f326a891a29f5da87f8ad2b95b2539adf72d55fc
+size 35389440
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..de966dea7ecc6dfa1a741c55efdad63d914dfa89
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d9f026499549a56b84ef644e9fa8ccdbc222a2ae5064f87f5a6c669cb2fefee
+size 19660800
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..60a3b115fef174a24364a974f072a746360e5ad4
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e04bc26649491f3ba4dd73cfcaede5bc023136331710a94b52e44b6694738d79
+size 33054720
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0edea4c15df944bccccf7ec74f995dfbe9b6f351
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c5dd095a2e570fd635e856473494d799f0448d4a9489b05b52b5eb8317db8883
+size 35389440
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..28d44b35db66fd6beda7523030432eccf8350d41
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d72eef6b6e82e65782b5f3130c03c5aeae0432da0f563d495d6b209ebf9504d
+size 32829440
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..381314a3bf60805ec1bcdc8fbbf50d56a714466d
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d3358353304f936abe47d50e39b31de7353e32cd2e0f022dd0dd1f6c9df69db
+size 19660800
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..963703a748330e32a11efcb1e1eac2280cca4cf0
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76c3055c9b7d6b9de4660792a1eb0c986f149af994fade54983cff3a632d2639
+size 35389440
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f4db0aa8211ef741351d04ffec9cf7255c370fd6
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9730e8491c5a1a95bec0d5d6bf6e31b07df4d13afac1c1c72e82415a923193c4
+size 31969280
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a32da04247086b50760e67da3a0d88c45168c817
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:493107e8c993395cce9d37b10c1f249d98898f402870def2a8c5787d706b769e
+size 19660800
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..690d5e7dac4ef166d95faf6479baa5dd1a1624e1
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74ff467c82a17080f7af581aecb20231147a04a0561f4965960c403f4b8560c7
+size 33361920
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eb932f153909035c400029cf68f2b47b372c5d3f
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:03297f838d712998281f28ad27187198d3125700f9efd126e48e035e07403538
+size 35389440
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5b7dc7fedbe70532ce5c6d9ff0e0f79131fb911b
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f212447643d7d152ab1fae97e682d20129eaa2cfc62bc518c468114a1559c51
+size 19660800
diff --git a/tokenizer.model b/tokenizer.model
new file mode 100644
index 0000000000000000000000000000000000000000..6c00c742ce03c627d6cd5b795984876fa49fa899
--- /dev/null
+++ b/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..2ef41cbc275000b29afe157ba487f0530b8c26dc
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,35 @@
+{
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "bos_token": {
+ "__type": "AddedToken",
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "clean_up_tokenization_spaces": false,
+ "eos_token": {
+ "__type": "AddedToken",
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "legacy": false,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": null,
+ "padding_side": "right",
+ "sp_model_kwargs": {},
+ "tokenizer_class": "LlamaTokenizer",
+ "unk_token": {
+ "__type": "AddedToken",
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ }
+}