diff --git a/checkpoint_metadata.json b/checkpoint_metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..dcfff9ea170fb3f3fbef99a15c58ec9524d55010 --- /dev/null +++ b/checkpoint_metadata.json @@ -0,0 +1,9 @@ +{ + "dp": 6, + "metas": { + "consumed_train_samples": 1920000, + "last_train_step": 20000 + }, + "tp": 4, + "version": "1.2" +} \ No newline at end of file diff --git a/config.yaml b/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..941fe7295b4a4eaf11fd749f68b23b6cb8b9f0d3 --- /dev/null +++ b/config.yaml @@ -0,0 +1,150 @@ +checkpoints: + checkpoint_interval: 1000 + checkpoints_path: /fsx/phuc/new_workspace/experiments/exp57_8b_llama_1024_ctx_length_and_64_segment_length_and_100k_bs_and_global_lr_1.0e-5_and_balance_factor_lr_0.01_and_balance_factor_0_weight_decay/checkpoints + checkpoints_path_is_shared_file_system: true + resume_checkpoint_path: /fsx/phuc/new_workspace/experiments/infini_attention_8b_llama/exp57_8b_llama_1024_ctx_length_and_64_segment_length_and_100k_bs_and_global_lr_1.0e-5_and_balance_factor_lr_0.01_and_balance_factor_0_weight_decay/checkpoints + save_initial_state: false +data: + dataset: + dataloader_type: single + dataset_max_tokens: null + dataset_weights: + - 0.3 + - 0.3 + - 0.45 + - 0.15 + - 0.08 + - 0.02 + datasets: + - dtype: uint32 + filename_pattern: .*.ds + folder: s3://huggingface-llm-datasets/stack_full_v21-8k/tokenized-llama3/long/ + skip_tokens: 0 + - dtype: uint32 + filename_pattern: .*.ds + folder: s3://huggingface-llm-datasets/stack_full_v21-8k/tokenized-llama3/short/ + skip_tokens: 0 + - dtype: uint32 + filename_pattern: .*.ds + folder: s3://huggingface-llm-datasets/fineweb-v1-8k/tokenized-llama3/long/CC-MAIN-2024-10 + skip_tokens: 0 + - dtype: uint32 + filename_pattern: .*.ds + folder: s3://huggingface-llm-datasets/fineweb-v1-8k/tokenized-llama3/short/CC-MAIN-2024-10 + skip_tokens: 0 + - dtype: uint32 + filename_pattern: .*.ds + folder: s3://huggingface-llm-datasets/project-gutenberg/tokenized-llama3/ + skip_tokens: 0 + - dtype: uint32 + filename_pattern: .*.ds + folder: s3://huggingface-llm-datasets/OpenHermes-2-5/tokenized-llama3 + skip_tokens: 0 + pad_samples_to_global_batch_size: false + skip_in_stream: true + num_loading_workers: 0 + seed: 42 +data_stages: null +experiment_logger: + tensorboard_logger: + flush_secs: 30 + tensorboard_dir: /fsx/phuc/project_data/infini_attention/tb_logs + wandb_logger: + wandb_entity: null + wandb_project: infini_attention_8b_llama +general: + benchmark_csv_path: null + consumed_train_samples: 1920000 + ignore_sanity_checks: true + project: infini_attention_8b_llama + run: exp57_8b_llama_1024_ctx_length_and_64_segment_length_and_100k_bs_and_global_lr_1.0e-5_and_balance_factor_lr_0.01_and_balance_factor_0_weight_decay + seed: 42 + step: 20000 +infini_attention: + balance_act_type: orig_sigmoid + balance_factor_lr: 0.01 + balance_factor_weight_decay: 0.0 + balance_init_type: zeros + log_grad: false + log_segment_acts: false + logging: true + logging_interval: 250 + segment_length: 64 + turn_on_memory: true +kill_switch_path: null +lighteval: null +logging: + iteration_step_info_interval: 1 + log_level: info + log_level_replica: info +model: + ddp_bucket_cap_mb: 25 + dtype: bfloat16 + init_method: + path: /fsx/phuc/projects/infini-attention/llama3-ckps/haojun-8b-llama-nanotron-ckp/NanotronLlama3-8B + make_vocab_size_divisible_by: 1 + model_config: + bos_token_id: 128000 + eos_token_id: 128001 + hidden_act: silu + hidden_size: 4096 + initializer_range: 0.02 + intermediate_size: 14336 + is_llama_config: true + max_position_embeddings: 8192 + num_attention_heads: 32 + num_hidden_layers: 32 + num_key_value_heads: 8 + pad_token_id: null + pretraining_tp: 1 + rms_norm_eps: 1.0e-05 + rope_interleaved: false + rope_scaling: null + rope_theta: 500000.0 + tie_word_embeddings: false + use_cache: true + vocab_size: 128256 +optimizer: + accumulate_grad_in_fp32: false + adam_beta1: 0.9 + adam_beta2: 0.95 + adam_eps: 1.0e-08 + clip_grad: 1.0 + learning_rate_scheduler: + learning_rate: 1.0e-05 + lr_decay_starting_step: null + lr_decay_steps: 23500 + lr_decay_style: cosine + lr_warmup_steps: 1500 + lr_warmup_style: linear + min_decay_lr: 1.0e-06 + torch_adam_is_fused: true + weight_decay: 0.1 + zero_stage: 0 +parallelism: + dp: 6 + expert_parallel_size: 1 + pp: 1 + pp_engine: 1f1b + tp: 4 + tp_linear_async_communication: false + tp_mode: ALL_REDUCE +profiler: null +s3_upload: + remove_after_upload: true + s5cmd_concurrency: 5 + s5cmd_numworkers: 16 + s5cmd_path: null + upload_s3_path: s3://phuc-experiments/infini-attention/8b-llama/exp57_8b_llama_1024_ctx_length_and_64_segment_length_and_100k_bs_and_global_lr_1.0e-5_and_balance_factor_lr_0.01_and_balance_factor_0_weight_decay +tokenizer: + tokenizer_max_length: null + tokenizer_name_or_path: /fsx/haojun/lighteval_evaluation_model/NanotronLlama3-8B + tokenizer_revision: null +tokens: + batch_accumulation_per_replica: 1 + limit_test_batches: 0 + limit_val_batches: 0 + micro_batch_size: 16 + sequence_length: 1024 + train_steps: 25000 + val_check_interval: -1 diff --git a/lr_scheduler/lr_scheduler.pt b/lr_scheduler/lr_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..28be9857379f1ecbf172ab49391def9dfb71dde2 --- /dev/null +++ b/lr_scheduler/lr_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737facbe7635b84da684cbb0920e1e12cbfa59d865027e3d29946e1da7fcb6c9 +size 5812 diff --git a/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0f4d33322975f6329aea357cd052e2a5c9d06d0c --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd3cd7ea1b37e9d8245500104946a1f9beda585b582c3c6c86417f2143e62c0a +size 200 diff --git a/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2438d82e7af29571c6fc6280ca132f3bdce8b028 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ecce917758b783cf75bcfba65bb98e2598b47fa369e79e97217dac514fe7cb +size 200 diff --git a/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46c0131a31eded119960ff0c6144620555bf0b5b --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4eca6ff9837681e57b8b7359a0b1450a2a2faaa217f191343a224bcfa4bac2d +size 200 diff --git a/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9562c52493548dc205aca44ea27b0855fb3f10e9 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e26e50995d04b476cef24f25fe3b123db242b79d2b26721e958a27a94e95c3 +size 200 diff --git a/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42270cdb183a99f4e6069f73ca02c5c4a0d98b8e --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afbb7fafb264594a507fe03060a966b91335e60401aea3f3531c9036a37bdc2b +size 8388848 diff --git a/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..21517d71038c3396e320bb2c3be7e316004ef1c9 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9505ee95b8f6e228216d63826f095d1d2bd704c090a9496b0cd204b5dc3cc7 +size 8388848 diff --git a/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7977603a06e3366fed951cccd35b2c5b0dc26064 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4f77e670759e11cca92e8eb1a4ca8cb1d997cbe1a3c7ec44097d91704dec79 +size 8388848 diff --git a/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83052eb8ecbffa32c989a1110c72274ff1cfd018 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20f2977cc2ccc9df4828d9170c829143ac84e7bf1a10a17dbcff03b8e7d2b9c4 +size 8388848 diff --git a/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..28566d02ba2ade9bcd2fa914ef9503c11a67793b --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85fff5b4969a14a90d3251beea89a4f58b3476951dc4d80842fbc42859551a6 +size 12583264 diff --git a/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b05741679a5c6049f9523866da15ac57742a289 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c906c130138839577b399f263d2cd0377c684161cab8eb9db82cf4f30e178fa1 +size 12583272 diff --git a/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..313bfb785c43d772acb82a02762cdbe94438cdd0 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:691718e5119e0a7115a84454c6ed9eafd768b9b9783f747c698059db2233224e +size 12583272 diff --git a/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7c7b4696330b317d01907db8027e539b183c2084 --- /dev/null +++ b/model/model/decoder/0/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b315f2fdabb2b6e6aaa65bcbc1e77d7c307f50b20de2b3f55501e3c9e355884 +size 12583272 diff --git a/model/model/decoder/0/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/0/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0aeec9abab2b3ce6cd4b12a7bd32a53c055034d7 --- /dev/null +++ b/model/model/decoder/0/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839be36eddaad9760a68863d4618402af1893620b281a05ff0ff9e7cfe0ed802 +size 8288 diff --git a/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8cd4ec7cd8c1624d05723292e97d9644177659ec --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d638b1dbd9ab13fbfbeb47885a43ae81679b199c18c0cbaed3f202cf4c36942 +size 29360368 diff --git a/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..698f93348863e70f8f7d68771a06e1e478eb7a0c --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a030aaac659587f67dca0efc2b49aaa8b8736eed1906d2f5980529f6c7fe45c1 +size 29360368 diff --git a/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1d06f752f6440ec70fc444fe106e542142820212 --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c763bab5ae055a0f8d095329c60c4ad64f0d05a52db890ed860d003f0f14ee +size 29360368 diff --git a/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c85e614230148943443a8119edfeea28dbf0aa48 --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4001b487aa10205cc4b4a335c2df5dbcf2b6cf692a19b90e1e6346a6adb25df5 +size 29360368 diff --git a/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad82b4796057bf965656a0fdbd24b761b60f2119 --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eafbd550659acf898eea0fab8867281ce636543eff7f13c40f32f9028bda67d2 +size 58720552 diff --git a/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d2b443206a0c828b93daa44b192333bbb799d978 --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db63345724e44faf6ba407334ecc96348ba03e0192f9f60550518368e87b6ac +size 58720560 diff --git a/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..408cc45b9141dca5764c1f084891e2c51149e01f --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81385d8ec0ae77104655fbb1f5dbf799f70466a32f708c04cb47080b2d46d3e3 +size 58720560 diff --git a/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a8a0eaada7673562aafe074aedf0df9154e8d24 --- /dev/null +++ b/model/model/decoder/0/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ba738a34d22e416b1db4bded73974c726edb399b284d23eceb2ef16da5dd06 +size 58720560 diff --git a/model/model/decoder/0/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/0/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b67b4c0d1eb1321998873a5a7347719722f9bf7 --- /dev/null +++ b/model/model/decoder/0/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:835706c82a03cc5e4a4c3879f76dde2c8873efd2e11c7e6d39789798af173773 +size 8288 diff --git a/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e43fdc5000a8a614e081715e5096980023e68ba2 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10aec76847af0d3b72cbf894d8ef1629db51ddf0721f2e9a839d7294e94b25ba +size 200 diff --git a/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52430547a5532f763eddf62483588a011840fb55 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e7dc8301e6cac7b9cff6fa11dc95222e33c275101952f0fe8096d6e78927db +size 200 diff --git a/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1cb34a020c9f3095fef50c4a5f8cb889b7fbf2d --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ced99e5e02b4b2df6734a354a1bb1eee1ee32e0f7d71c00c15ba50349c520bc +size 200 diff --git a/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52f8c85e66f1e283152231210c89723ccf5fa918 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62cc82e79b26a0311182c0a0bc0e565d89e7205950536ff511a4190dfe5b4cb2 +size 200 diff --git a/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5052c30bf63e518a8f31e17d530bc8cc90fbddeb --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2fbb9870ae118de4d8225df2d0111916f337e87f6ffb171e6e99e942a6f5e84 +size 8388848 diff --git a/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..05ab8e8ef3686615be3e10a2e4bf33ea54acf549 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99382bce346eb0aa855de26305cc64d581c209306867ecfe665209e142724cd1 +size 8388848 diff --git a/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b428daf3cb03ca95afa632b01a368df58371a077 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df614829f243bc8d2c4ba3deda49e8a9bab6ced8cd2e63c46b08fdae176ab6c6 +size 8388848 diff --git a/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..557b348d834c9b1dcdbc2c5106e0d39b5f6e541d --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42aec6f5c07a392ebfc588f67c9b8713c3f1cbf1dad988c3bb7ae0ed72a4d47 +size 8388848 diff --git a/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a6f17f9b1f14de0828aa01d44e380556f893ba63 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8005058e37aa101f31327e80c1d3a2646a3303acab2e21f6e78c0f4f72f01495 +size 12583264 diff --git a/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8686b22111a63029f3a0107e7c770d555be1347d --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2b1fe9ec243434a30e0d2aef93794229ca86157146e79a8037b144494246b0 +size 12583272 diff --git a/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..176454a650f3adf7f36266861361e903a12ea9bd --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f89cc57b8db928d5dd5b2baf9422acf4a6fcb5b13d7c57a63fb6891bd68bcf +size 12583272 diff --git a/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00bf3e7dd267c7cbea0e5be947d6a5314d421689 --- /dev/null +++ b/model/model/decoder/1/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3feca5b544559386a355f31d3658237169eb8c170523fdac2047c0aec838a8b6 +size 12583272 diff --git a/model/model/decoder/1/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/1/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..85a20b500ca9a3f3656fec0a435d96f342b49f7d --- /dev/null +++ b/model/model/decoder/1/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e247f0ff9fef5db3801019d29cbab0e939f9811bc87948dbf2ffccf3c804c7 +size 8288 diff --git a/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..333453d6037055d6c6459145843f130b99a57b4a --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de65ac6d4af028cfa691029645ba2cdbd80e8717789505e5850c5978807256b +size 29360368 diff --git a/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2706f9c07a4065ea82cd8ca474ae14c7b6098487 --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d8b4af82370734fa7f9c2a99958a732b8face2142d04ddd7d0b7321eb7af71 +size 29360368 diff --git a/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..163037a329aa19abbaa32fcf948d459e588dfbdd --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c30074512f3a8e912c0f3efd0546d3049d42f2781625ee29184de6b8d2f2b55 +size 29360368 diff --git a/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ced2a273408650256ccf7b21c561611af87fa612 --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111a16b5ed3e23b81976ccee35575e1cb2d7a17f675b9f448315cf813642b157 +size 29360368 diff --git a/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f31b226cd11e32d530fa4d960c4b30f6d290a82 --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374da23673af8dde22742199fb2c504849f54ff68978d13e856b3d66f7e1233b +size 58720552 diff --git a/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f452a49c791cfeb328bcec00c052b42a4c8e0cf --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afd78bf516b96f51ead6a14a5821cec58857c46c98c6ed1bc99924ca4bf9c67b +size 58720560 diff --git a/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..093fbe8bc875b40fec072e27ba17976bcbd520fd --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e758214cc2fd7c534e5face960fe4123b37d76889d95eec0d548f3734a54ad +size 58720560 diff --git a/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38b93d48e286c953dc4e6ca79540534a9cf17ff4 --- /dev/null +++ b/model/model/decoder/1/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e5d9e4777df66e6bd1affbdb44ed554e66913b0077b83d8551c18979fd5089e +size 58720560 diff --git a/model/model/decoder/1/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/1/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc0c2b70eea17af08c5cea2d19d03ab17b37f6f4 --- /dev/null +++ b/model/model/decoder/1/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915cdab464967593881825306bb37d3565c1463d54c596606f4756d8b4f3023b +size 8288 diff --git a/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6321f6a5ee1d064acaf25755a871ce4644a94a39 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0800aeaafa9b470cde1e420ebf24a853846755269f90f9b0a54316e4c0666ef9 +size 200 diff --git a/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b468103592774cc6e6c73739db75dc6d69c8abaf --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37c0e48385b0aff19585ad996520319d194b68d8c5bef9a0255b35db6391f19 +size 200 diff --git a/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b3b6d9e193236c91e82b1b8f20d2e3ec8a535d8 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81fafc188236802bae75d2f0309ed3988f9d0c7f87a6d4689670be8b41cf8a0 +size 200 diff --git a/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..254cebc684ff8435fbbe0e3327d2eb25cc4d1245 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02973af0805fc777a8f023ce54412f65845c53f2e4811f7cd53a0d009df4e3a2 +size 200 diff --git a/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3304e7e56ba300afe9bc37ac0bcc4393db17481d --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136293342e66b19661f9116e816077e69746e0b266ad94ab4ed78baa5dd9e76e +size 8388848 diff --git a/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..add0c2e31a235b50cd190fb3da1a17a0108ffc82 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d48e933fa41a3c3fcae5f1472eb8184d16860f8995e30372ed723bd05bec0c +size 8388848 diff --git a/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84cfc4ed48deeb624393ebdddaffa940ad0589a9 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a5fadd5145277eec5ac636a56966fde47181cd430eeb09102a019e78a2b2e89 +size 8388848 diff --git a/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09cb08e75dbef13744df7e1fe4ed6459e1649c32 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a4fcb5ad39ec9e176da9498a1a27498ee305e68bc05121bd64bc897a73e3c7 +size 8388848 diff --git a/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..373647f050050bf01c81a668782851a924ec9b65 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f8f277adc4457877d276c76fb196914c791c38ec4fbbba50f6268a20fdad25 +size 12583264 diff --git a/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d21fad1c7fee530c9276355ab4c6be5b7626b4b6 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce5ca7a264414cb9053d7df7bcdb79f54f0813d492aa4ee80a749c06a54673b +size 12583272 diff --git a/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c4f8f8689f79e61854a1ab6ee3f0ffd58dc0e37 --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d46007b88078add582d7eec71faed4077cb2026995b991933c8124f4239becb +size 12583272 diff --git a/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6eae4ac7b650ac2d0a939cdad4b7e7dcf7e8dcee --- /dev/null +++ b/model/model/decoder/10/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737cc4ad29d77c26e148d142b1629b4c55bf2e5a4823a604b83105ed4febccbb +size 12583272 diff --git a/model/model/decoder/10/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/10/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99f63c82799521643f05d2ce16bab751ac3f86fe --- /dev/null +++ b/model/model/decoder/10/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5676fae834abc7dfc36a899b844e261c5f22fe2418140f68eb60deb991cc1e92 +size 8288 diff --git a/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dcde1958351732d3925bb386e72cc8f048db738d --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e9531616fee24311d669f03f55635fd5456249bd9dcdcc3d17df132725e169 +size 29360368 diff --git a/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1d7e2b2bd4b97e163be98442ccd571a69abbcf51 --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1b75f658fb6890ceace47afe559b321fb3d4a6a54b5f9cb86b303acb447d1b +size 29360368 diff --git a/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..192ba232389d217b7abfaa26495ddc19eb0e360e --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b731e52d883274f30e63db5e1d93f14e23683acf1d59bf306a897d6bae523d +size 29360368 diff --git a/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8deaa93a976cf0713b118b06c06d0516526a412 --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5457a19c6bd3e0b74d71ac47997cc12bb97520c15b64642f1a404f662a965e68 +size 29360368 diff --git a/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f51102141194a95593cb0e08e7d4eaebd8ea4a62 --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d926618001008959bf00b43223a3e6fc980672d2380a1b2acd8f8caa827987f4 +size 58720552 diff --git a/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76bebc23f5c5d08159e3c3f792034b7634955648 --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea36fac53d5d3d8b0f8c5ae9a299ab441ffb7bc6c065da32b775fbb7d883a00d +size 58720560 diff --git a/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ab581e4338db4e99d6312b36729fdbada16d15c --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d0b637080616dfc10bf577724fb53ba2e805e75d6b87674224ab11f5082d87 +size 58720560 diff --git a/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c172f379869b7fe4db70d7831e74facb94080103 --- /dev/null +++ b/model/model/decoder/10/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67fd72041b2ed47a98063193405737658cc826329459664d086b871a6f5bb70a +size 58720560 diff --git a/model/model/decoder/10/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/10/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3dbbe71a0aa2412b96e3070ba606f7cc191f9a94 --- /dev/null +++ b/model/model/decoder/10/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4976b831ec6dafa83f610665d894bf8533a336592b09ed624ae93f9e070ed2 +size 8288 diff --git a/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0bbcd60033cd93dad04d7a0f4584e15d8929e6fc --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5919dd1b14a3f819c11677253a5a003f5ab5234914dbd7b8e131e42bec18496 +size 200 diff --git a/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df5682e36e56921c817dda9560f56155717dcb99 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd97d252f1667a8d7cd6018cf15bbcf4cd4c4dc95eb0b98b4e86f628788d4c99 +size 200 diff --git a/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d9e244d8a511f16642f2b24adc83fc7909e7c38 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf1692f91c0a383316e3ba5ba2020182b1e746278901a342c629a0c8d213cfe +size 200 diff --git a/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e95ca9762b2df6b9e49f8bca2d08d06d43002732 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd136aee1d281b0477fafd319045bb687275bbf164226c0336b5aa68571d4512 +size 200 diff --git a/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39b42bb36598aba9c88039675de7931a748da1e2 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326c4d96d74d113f8f20d5180ca8ffd4f7a4d5c20717662529dd96df695b54a6 +size 8388848 diff --git a/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d7af325260e1eda785e1451057846493203eaf8 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b6b29f9b3d902d1641f8f02916523450478f401b826d74a7d88630c8eb3cfc +size 8388848 diff --git a/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dba28efc1eb73ab9d765017c74b487ed9d63fc1 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f85d876ff0aa7609d814e77c37f14a9eb99af52df37d73d5d23c03eff791e2 +size 8388848 diff --git a/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb19d7ead0e65df3955e7d7e9964e981ddd9f51d --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c38119d2f8023ecc1e52d34a963637664bfa73fdc3e8164ee8bc7ee8ce6fbb +size 8388848 diff --git a/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1d77d9ec24e34da653abe0b5f7bd2d69473c4788 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e89053cfd87a541e627fd6bffdc1a11ac6da5f0f3fdfbfdbfb01397023c7a596 +size 12583264 diff --git a/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c59334cdb71f68df6b0ce7249a29c4251f1dcd23 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852290d901405c6c0ed3d33507bd8d093774c4da38265fea8d2c7771cdeb4806 +size 12583272 diff --git a/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63cf2b8859c66bf5ff7011a9f31f7b721cc85016 --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dafacb23479129c83670f93487e4682e1c2b8387b23b5d6440c942b5f3ec8fa2 +size 12583272 diff --git a/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cbf2b62bb3e2dad371ef66ca7e02ed9d2c75f06b --- /dev/null +++ b/model/model/decoder/11/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef6073c0f57e6cc1a3954a08c68987ff3b6072b65b39bb1c1e348bcf9fd84c2 +size 12583272 diff --git a/model/model/decoder/11/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/11/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7cf89577edf1c2b4eb8ba23aaec42749d1bacfda --- /dev/null +++ b/model/model/decoder/11/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d908b6381703c4a9f9e7c028053525be60a3a27fd9d8a5bbdab8464e8fab50 +size 8288 diff --git a/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f2ce53e6f9f17e0bd2778960767a0cd81ebdeabe --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6d9194581a6918bf045dfbf0f84d2ade9c548109cd70147eebe133b627a1b7 +size 29360368 diff --git a/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd6006b684d428736f3960b5867a40ec3cacce10 --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85740ba9986864f0bba5812cb1fd4e2d5cf3d2ef4f52beb04de2b4bf570c5f35 +size 29360368 diff --git a/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6f0a7affb74ad25860e0f163890767341901c71 --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76668aefc7e44c5a13f5dc35be97c99c009cd755b04e15e57f66726ca5d30ee5 +size 29360368 diff --git a/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1eaa3a905918a8908fb2f03f2e562b4beae3f79 --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:886ea4a0955b24d4ee5aa079fc2906f972042967b114379c553c76b3d0c458e2 +size 29360368 diff --git a/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0cff81935cfa0128bfe9a49b15ab873809ec8a51 --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c14bfaed6adf167c0626013fc917968fb866502115dd273e9b46569fa95b6df +size 58720552 diff --git a/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..89358456cad89d7c00bb4eb12f588515e88875cc --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974eb7e5ad6286092c68b77c804691c86a6d2ffd2b23530d72959c93d44e5a14 +size 58720560 diff --git a/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b46866e2e377b53220e85a539ef44e062107f5c6 --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff26ed20d2b2e06165af7c1b33443613e44b83a7401d17b76b226b2474fe1cd7 +size 58720560 diff --git a/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d8d30621dd73adb1b2b4d699ad989627468b898 --- /dev/null +++ b/model/model/decoder/11/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f688105e8bde5273e10cab108670d56ae1e6b1f8061485ac494da398220f3093 +size 58720560 diff --git a/model/model/decoder/11/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/11/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bffc1dc00ce374edde7c3120862a9c45bc94af17 --- /dev/null +++ b/model/model/decoder/11/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a407842e3bca620805aaf262394b8b1fb02a5c0c6b32c419f0a8c09d1fcf57d5 +size 8288 diff --git a/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..428a1222ae8a7f6f21abefdc033e93536d18c9ab --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf155fb961830d15c267d8755b3839df9d10eca064423941096ce0c9f60a8dd +size 200 diff --git a/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c334ad4335b90525e93d7ffb99a5b6d06c5eaa59 --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88456e493a54f2624372e640762249a2e3775737861ac60d90e2a02b03637914 +size 200 diff --git a/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..556f5ef68242c15adf3a731f1e5ba11d1a9a214d --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2730b7353ec01f832756156195b3a1b742656f168cada65381bef1edc7efc48a +size 200 diff --git a/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2bc05ac1869a721de81b7eee3a6c2f1df31458d1 --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:451db2418243a21b70ca1de062a7e5dd3aceb5b86bb86e5b5db3b06e749b7bdb +size 200 diff --git a/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cd772dc4a38c821a1ee7e6d1a57bd98db6e8c80 --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd1fa64e843515665ed07fa6ebc0f550000b0fb3cc526e13bfb093be5f9814f8 +size 8388848 diff --git a/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..da958142fe3bc490000ad9659db4c1a1edf06587 --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda71516e797b6a735d9bbb394917029439e82d1675ba8d3ea0c193f11c81691 +size 8388848 diff --git a/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d36a0ec5014f1686628ea7dfc2d9c661727d2fc --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4258b940753f220ae59e8b4469909ff3a5d55239e1826c1483184939c54a9b7 +size 8388848 diff --git a/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8af1ca953ec441290320283b27d7c660075181dc --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ffc118300a66faad9f8dd407092c4e03203b6617ef9dee6bae0166dcd5983a1 +size 8388848 diff --git a/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7c2966023dfd210d0fbee2813319b260ac677bdf --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6a69c92edc306c29ad1963e7687d8c8e01ea3478d7d7bf2164397615d557d9 +size 12583264 diff --git a/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6f3af25dc0e9bc6711e9c6726267806b49e39b35 --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949af56236bd2b1cdb5dd899e4167fa6f8b3224e7e87a901623e00b88d452d91 +size 12583272 diff --git a/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c1763b2fe4aedf8098f146a7400173af74f3d67 --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52fe832237b0831da4473173c3036f86b2f46ea9be454165175b84fd852fe5f +size 12583272 diff --git a/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a8b149e9f602d7a8d584e468653526086ee63b8d --- /dev/null +++ b/model/model/decoder/12/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd77e4f4ff265f1a32ff3f519ebcc2dadd1fdba3fb0b444ef4111cd5ed644bc8 +size 12583272 diff --git a/model/model/decoder/12/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/12/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6881baa8100c7085ce9b9ca4063d21ab3274f1d3 --- /dev/null +++ b/model/model/decoder/12/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2766ab4df2e4b58da4c47d7a780290e50131bdf77739acead60021ce79d23fc8 +size 8288 diff --git a/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83eaed9f3d84266718120eb5f83abeaaa3185d91 --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2337337031118bc44a85a1f7a4ebd7e05852bdd57857f6dab490d5ee826b98b +size 29360368 diff --git a/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0b023a6a115a1b43d7cb451a0c281a5be0a0fbb --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c06c85f99c516d7426eac6f25c96d8bc70e19f4ef37d18de2347fa6a84da1b +size 29360368 diff --git a/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..babaa0111871c827fc4241bcb947cb567bb17776 --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc8e24c5ad9ae5b6491ba041b7a2647ff66bf4e1ab71b498228687f1c886136 +size 29360368 diff --git a/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6393576a42b6e5023ae6781b297b143dea8a4ba --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73d68885056f76608b7487f161693196f06f4a0c7e5d7743edbc9a286648113 +size 29360368 diff --git a/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7935010ee6fdd13c8f65ef4a13749144369e1dc --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09416949322ae93004aab26c7eb0e73ba47d0dc945aa56b54ebd0fc16441db1a +size 58720552 diff --git a/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60666b4469fb9cd87946e3ee883a6b0eb1f031ad --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46a70df99c0a446a49672e547aaa324b3d7ab6fd17c42dd8601c11e2169213c +size 58720560 diff --git a/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a97d793cbdb70fd0be38eedf2858eaf4204f94a4 --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:906291e409b1d87ad1339a32ef57d282518ae0c10a25cfdfdd58b6736546681f +size 58720560 diff --git a/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f4e19eb79a26797050aea244598edd30c950309 --- /dev/null +++ b/model/model/decoder/12/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8212f01a4e097f4211fc8414e57aa6b307c3ec46b234bcbfc5a90fe9bfb6a98c +size 58720560 diff --git a/model/model/decoder/12/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/12/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b4e6965a8938cb2ddbe6958be9cfe7cdf6308f6d --- /dev/null +++ b/model/model/decoder/12/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3aac97367f9f248e43222f662bd481071576c22ec7ca3d91c53bc3b12e45586 +size 8288 diff --git a/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0d6f9315ab3c89fa9ea10dd28a2052eeff6a5ac9 --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74bf689f66940f0c790d990938e3460cdc40b460ed6d9f8f36e45a3640c9a6b4 +size 200 diff --git a/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c099260c6bfe39a5db070ed116d81e257147630a --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b2da9e7b27c4940a97a7602af092c3f30f232db69970c22ddea513873f38c0 +size 200 diff --git a/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3d2a1c56758976867457d032de217dfdc274c6a --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b4599c224d02e60280cf723f2391b77f5cc400156a9c46685704d6df871ffbe +size 200 diff --git a/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e7540d7fe34cd9310d21d724032bd133d1652ae --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec5f427559486898835bbfc93a6042cba386d9cada0fd3d57fcbd2c574899724 +size 200 diff --git a/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..74933a7e9cf6dfbb71ebaa69f7c11dc84ac7effb --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d3524f088f3f05da70388e0f4b5fa34e0a108705e48feb05d475978add99e6 +size 8388848 diff --git a/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63ca3189e999211f82fda1a2856fd541d61fd9ce --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd99fc6440cc3eaa69b709c813b8d634497f555aaf4de934364a9fd028e0941e +size 8388848 diff --git a/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc3c7bf2c14ed1ec11bb586811bee37e3bce5e0a --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3af73de3da0620b3b9ffb17ea7d753d7f686656477da1415642d83df94b1aef +size 8388848 diff --git a/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4cc5f40e46eb4ce3792bfb2929c74df1d95c4dc --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea199a84132a67920d785d08f49c771f543179f90297e2749794916904288dbb +size 8388848 diff --git a/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2bda59c4cbfe4d5b67e1a088d774e41891dbfb3 --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707dca46acc9c048986472e5465c6ba6c8d2aeda45e3e069324624c28198f49e +size 12583264 diff --git a/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3a935427c5decf258b6fdfe909fe89d9cbb7c35 --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec905fc0601fa1fe8a335bd4d7f40e045bd965f9e0908f995debad06b012c784 +size 12583272 diff --git a/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5608610a0927ccbc6b868d1428bd12111de0426f --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d60e830a5b0d1a314f1388c4a6d42cd0dba405f85cd69c69b5a06c4806c8b20 +size 12583272 diff --git a/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4b5037cc6a051295a000469b69adc3534ba946a2 --- /dev/null +++ b/model/model/decoder/13/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5647e2613f44b85e5f2e79cdf83a4ac3b13dc64f54f2be6c18dcdc4d4bb33ff1 +size 12583272 diff --git a/model/model/decoder/13/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/13/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..951244a30b3c4298c645c7e26f21f2a5d579d070 --- /dev/null +++ b/model/model/decoder/13/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28e5fe4e52c868bbe5d7457e45dea60606d0eebe4bcbd1268ac51e5dda1fbd12 +size 8288 diff --git a/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb70aa21fa4cee5cc52b0fb91ef378bb91af1665 --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3934b246b840dc140d89867dbc3d41163fdc9594a012fb096137897df945448c +size 29360368 diff --git a/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63c411bc999e755698d9281733ee2fd0d4e282a2 --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9e5eac4ce8d9b1110f82512faa02b299ea4a607259e9975d332716b4d8af1d0 +size 29360368 diff --git a/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e0f8969a3ef4a0dd2ea80284b5bd323206a477b --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11c22678d26329a2dfdaba2ca2ffa7dbd83ec9d9cf5105ddd99cea4f3900841 +size 29360368 diff --git a/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9bd338a56205ffabe100f0a75f69d36825a24276 --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e22619cd072dd002842f720a6c4e2721ecb76085639ba5f50234f4572d1061 +size 29360368 diff --git a/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..980ee3a3472433b03dbd7bcfd1122278c1c36e93 --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b2548b7e7b56224c9a4e392df8b25f3165fea2891bf370a5da102805b20020 +size 58720552 diff --git a/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a837ae34d3cc7a21e490ef387e58940d24c2470d --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fdbc954fa386dc4516f11c4535e7a96d3b1dcc0f4e1c699d92f6cecc6b6a755 +size 58720560 diff --git a/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c2731bb2c4626b120457306ad8af2ec228e8716 --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbb13222846b09f8bcdb4bc29dd819d32cecc37edcd188eb822e4d272adfac30 +size 58720560 diff --git a/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24cf2a20887e7daee13d887a13157b54fd370c2f --- /dev/null +++ b/model/model/decoder/13/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5210e74fa9ab1c122666782e628cba0777a3391aa869b03c497f4e7aec45356f +size 58720560 diff --git a/model/model/decoder/13/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/13/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..720e5b637b62b582adb9e2ccb2d08f3fd57a3649 --- /dev/null +++ b/model/model/decoder/13/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44153f834b02d23e2e1a092c43598589ea4e50d732dd92fdd2a16b1d79b46cfd +size 8288 diff --git a/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..12280c0d8c51659233b2dac83dd8e6b9dd418eea --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ef061b50737573f9044ea95c37572e8d1323f2709416384ad4b10d84a71f11e +size 200 diff --git a/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..77fa7fc2505c1c587ca9e3e337b8213f07c15a2c --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68af47b60e00d409ef35f6dc03a4da74f50c5cdac0d2257517ea9fbdd5619420 +size 200 diff --git a/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a8eebae1250acbd53cc89bb67d28ba13fa91962 --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3662a7dd990befe0c6676924b149c075ab51fb5ed3aee9a57e8a303f06b41bf8 +size 200 diff --git a/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63d455228ef70aac9b02d8cdebb35957c30cb7ca --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5994e03e284b2b4fd6a3f8cde23ad22f7dc4f060f56f7da3c8d0f553803b1d5e +size 200 diff --git a/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8bcf8ad802fe53bd9d05a77ed9ff2250c3b5fc6 --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a8887ba8e19e91bcf90c020ccb4412b7efc6af7e070c51238d6ab078ccecb18 +size 8388848 diff --git a/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ff8378d0b19fa47955abf9330400c9e1c08e177 --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a56e1114ca9965228a9dfa042f26dff2f59b9cc5c61aa845495c87ec344bed6 +size 8388848 diff --git a/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d47571c838e88c411a46f058136bbe00998705ee --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f804507eb02081d5b522f6820d7b699f68c47d4a4569294668aae3d40da9c6 +size 8388848 diff --git a/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c47824985b30dcc89fd5dee6fa9e038e5d5954c5 --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb46ddffa340b07c8be69bd99baf08d1786dc994be3e28b72d603893d6f3064 +size 8388848 diff --git a/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be237b97f476719f29c51134f83908f6eef0403f --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea4d34d5c0f821eb78a89fecb087b6c0f31cce2c7c5b3b07d0f80f644fc175f +size 12583264 diff --git a/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81e82afe100a3439a5c7f8ecf188878768177916 --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbba1e295244414c5e6ec21d039f65a92f484d3ec044b99bd6e0318444b04a1b +size 12583272 diff --git a/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..87925c3c97d4f33eb94a53828eb70fb09f5e416a --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4a34c49ff23fe9c26fb33751c571a4d454bc90760a9dba6ff97f4533be5ae2 +size 12583272 diff --git a/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d6f4433503b124e4d171b45e5254968f67459ae --- /dev/null +++ b/model/model/decoder/14/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab9ffc437d1baefbe2d060ca0b74418aeb6f0d322f94ae33f8c9a92c1b66050 +size 12583272 diff --git a/model/model/decoder/14/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/14/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1b27affe5725e57a3d08d70ce9a576590b19f6a2 --- /dev/null +++ b/model/model/decoder/14/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e402d472e2506995a54b6a3e81ed241ae09e2a917199f9f94d9ef81d7aa780cb +size 8288 diff --git a/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..477c022d98ca2f09c6aa6a048d0905fa7a490782 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5283a21a4120d8f7d5344b337db6fb91d583bd393f382fc18541df29fcdde6fc +size 29360368 diff --git a/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f1045ee19eb4a5de36a79bca2816de7a2b32bac3 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e0ac8d9b15c2b5a40a56c78a4f8908869dccaf00d5e178032f77f5a390d27a +size 29360368 diff --git a/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..78f8c9889bcf03aa1d811fc6c3ddd0e966bc9f3e --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d21588bf222f907a10a5f17985e6811ec8f62e5d277ede207ce9c9b46d935f1 +size 29360368 diff --git a/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee738be85414bff9f4f860c9b9f66d00f0965278 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105865aefb4342de2216e0d381cbb1ef2ddbd8b48350a1e84f9f63d6ff67b3c4 +size 29360368 diff --git a/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cee0b53507eb287f5e424eb2d2cd1ebdd9bbc377 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:437d53d08ac5895929af27b282b4ad3c47c30d1922c89e1c592fe0e95104d753 +size 58720552 diff --git a/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37d126e3f150f4d874bf0c45490b2630e22ceea2 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df46c4c2736d21aa36b58f00437b7b6af750234fabfeb5ea306a7e72fca82b6 +size 58720560 diff --git a/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6bd7667e0c0168a80a06d27ff8145c269bbc2c80 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebdd404e8580dda4ce968847ea94f98b89c627b211ac2fae034a4fd988cc6c17 +size 58720560 diff --git a/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc333824ee75b9dce11125f8af37de0adf5a80d7 --- /dev/null +++ b/model/model/decoder/14/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cec22225b554edb82e5c9b05695faf0162b91a3c06d6126a90174e73d82567c +size 58720560 diff --git a/model/model/decoder/14/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/14/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d8f8b197b49bbdc1a72622df624ac1ac5e8d9e1 --- /dev/null +++ b/model/model/decoder/14/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f364184ede4eaa03fc8a320ccfc0595a540310c37392cc011ed776c0e02890cc +size 8288 diff --git a/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0bae53faefc9ebd3034a0fc1ce62f97379c5cf8 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e83769460ecf5f1f6953287a84017aa0d7c15e6ba6387a59d4e6d2c12a2d519 +size 200 diff --git a/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..391812f650bbaa32c5097a152c2cffcaa8635246 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1455daa9754d88178ce0bb4d8217b781e529a61ad14c6395bb95918a2fef0afd +size 200 diff --git a/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..718d1dbef7e8e34f9100feff0c5e149b9b7bbbc4 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15e4e8e16420df174e615349dca9fd0d45f98befbffece8f133c05933de6b31b +size 200 diff --git a/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..238cfb06b4bd2a44b857ea24991797647842994f --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3e5c3aea8a9226668b74494caa703b649c8422a77ad923464e8d3f615bdd30 +size 200 diff --git a/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abbc7906364747382265d2b00ea6af83e7ba8aa9 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf5a7539ad407431621d8d895305747f59ad186817bbcbfe4fb733d4effdd07 +size 8388848 diff --git a/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f7f7a8f1dc408e49191b63633b60c2e3ef70d97 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa1f4a0596e49b9426deb24014ffab35c79c4ba9e20102c511c5d202b330ec7 +size 8388848 diff --git a/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e14e283053c2f9dfd9111e078e1001231c68f270 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73599bddcb360a16e3ad25e75b25d88dd838ec2ee92117eea29fb4b273e01a59 +size 8388848 diff --git a/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5fc61fd9e903ba688bed1363d3b24d24a74caaf4 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b14c8ed5d6a94e5ecabf916cd261f933358180abf36cb4ef0b32fa578bbef70 +size 8388848 diff --git a/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8329fac88daba5a02533d28e04056a1180405e7e --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b136cd1a2ff89595079b490e8a7949a74ac20bc185963509e3b85be80cc58d5a +size 12583264 diff --git a/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..afa5db976aab30bb72e4b13087427fc63d0aaa57 --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f3929307b486a0c7f5e9ea4269ac20612f84ff6bb9e8e81c72652807054e0ed +size 12583272 diff --git a/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b496e2d77a325f7b5015fcc6f0f6b54cabb2ba3d --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070b4cb80e481395c4b99c8657289f3dd3f02d9fb7292efaa3d8e996447b02b6 +size 12583272 diff --git a/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2e3130d1bffd6114cbf9ca5903db9936945be3ed --- /dev/null +++ b/model/model/decoder/15/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057e6532e8dd1f118664e0296a6619a1b83955199ac642ea3c8b33da16c06c97 +size 12583272 diff --git a/model/model/decoder/15/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/15/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..658ee2f9b22d264aa2c4d64668537bc592e49edf --- /dev/null +++ b/model/model/decoder/15/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e905ec3eb6dbb7694417c952ed10e058db2b1fb976f04812d48114cf2b1bdf +size 8288 diff --git a/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..810fafdfdab5376586b5db862ffd34208b847a7b --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d87d2eb107ec476d2df82e2c59fe445fe6ecf8eb816d706fd721a1b3fa08cd +size 29360368 diff --git a/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b5f801426ea9ce3f3eda39880128d029be7e1e7 --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41abc3e82a2b3d15953a57cbcba7e6acce27f5c465f03db1b146fd3a348b4b32 +size 29360368 diff --git a/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63993f7d1ac670438e07641690911716a8c463a5 --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ecf231c3b35a0ea86e8669d980fff9028337fecc41b349868c0a26bbcf4b33 +size 29360368 diff --git a/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e737ff1d0584348e9f51feaed0508a83b54e2b3a --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb3f82e49f7660119f15b7552e8b7cc1f5359a69b8dce5e486d0413b5169ee6 +size 29360368 diff --git a/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..655060bf7e03fca7c60c8ee5be0ee8f8200c3543 --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854674813bc7c7ecf043dc598f104a27c5fa858bbb8fcabf36e10f8d6cdfcc86 +size 58720552 diff --git a/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..608a7301376dee0204701c19812b45544a89dbff --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8959c45198abcf3696a3314d414a615434e0e627cef2eea0c21e9d0381f979c2 +size 58720560 diff --git a/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..729776bffd648d41a8fc1579acb566d3187d9f32 --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc577f979b39446b12ea13c0f3e1a4820704937ca588cdfb2a94b95e9d665e1 +size 58720560 diff --git a/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..61c8c348ec6d68b41414930f3d8b36992db9b1a4 --- /dev/null +++ b/model/model/decoder/15/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7691ad0c66d338625ba6d4b1eec46a6f31fa7e678949bbbe31c1cb754c23e04d +size 58720560 diff --git a/model/model/decoder/15/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/15/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f55e4eb448c242325c2db6352fe092ab98b33a95 --- /dev/null +++ b/model/model/decoder/15/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39d84dca737097211adf6250706d47bb4796c958a1c2ecd25619b6968d9ab44 +size 8288 diff --git a/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9803ddc4d386f69c906ea573b9c34442dd570b4 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f98f6f6af9ee5542316d0a096e08e2d89198ebdf622746e4120255cbcde22f +size 200 diff --git a/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5431cf8850936b5c183712d91a209dc93356ce1e --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d39e49ac796ada8d2d3a08688907fc5a1d102c19bfe62e2f698c761bf8381d +size 200 diff --git a/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..93e53a11ce64b5f0c367bde735204a4e2fd2694c --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92aaa7c9de5cc53d30c970d7011363a33b180d242d9e18ab721604a5d2ec5d7f +size 200 diff --git a/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a3bde99d000263bf857d8863ca0c1095af739407 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb6fdfc8ea19d80b9120d1cf59531350cfadb62fa40106dd2b944a4e591b4ed +size 200 diff --git a/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f02a21cde114997b1724760844a5aaa4d966ee62 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a362c8f8e6c337de78e51c57c996dfb9bdbd903f4e5409d07dd9f3091dd84d2 +size 8388848 diff --git a/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09c90f080d8766131c65dfb1d1857fcc65cec330 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3c6a2795433a483a69ee5d730e64cdf985caf49e3a5ef553ce4574eec99c8a +size 8388848 diff --git a/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1b4045c019ce7ea5fa58fe1de8a485b46feae08 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c14bf6da30b2533cdca6b65bd74cc30349a24ac420afbe231d93e75c9b27ff2 +size 8388848 diff --git a/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0db1bc4ee09a631f9d9034d86b0aee8b4e579854 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b247946854f3f92470c17a876eab106b1a4258ac45de5f0571acd3cc53857e +size 8388848 diff --git a/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e407d3929a8d8914d7ce439972cd206c3e762aa --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108cd3141a943b2c7740bf5312ef2786986e95e17416a629fb397ceb6721d498 +size 12583264 diff --git a/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bab6229de2007e7b1ad54c029f2a759726e6e8aa --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0ec198959fb5fb870805ce0acbfcdac5b89d4000295ef14bb6517e82b0099f +size 12583272 diff --git a/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..329d8720d00b32c626949e3d85d96c57a444b30b --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50e7323b2d77be73c30ba19a316b0a97fc17784e966ec8375963dd93f6ca220 +size 12583272 diff --git a/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d50c2d445a63bc84369d99ae21426f91bb8ca419 --- /dev/null +++ b/model/model/decoder/16/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec63c2d6aea4275d740309284c20393742a2f8d945a07848dfb1f56d3870758 +size 12583272 diff --git a/model/model/decoder/16/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/16/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d5d8a4b9cdd8ed0f79c9ed75a1f127e060cdd37c --- /dev/null +++ b/model/model/decoder/16/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e1cabbe7ea826c0e86e0cf06af5e7a9ff19d19a9f18aa7d0a25747bdd5ed0c +size 8288 diff --git a/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a3553c95f729e60c3e58730991388bf9ec40214d --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f99b4586d84d2bfef49510fffa035f16ef10c0f74a3c2ffce1ebb9a02695d2 +size 29360368 diff --git a/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8937db1431dfaf8fe03abd146c6741a514c2edcd --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa5750ab3efd870027c1f52a510d42cdc79177800b4395d4be0f1d6b8c1a875 +size 29360368 diff --git a/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..254377d4c83d00302096e7513f12e75ec29dd781 --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d64d203e3498f93a60ba368757ed0a2f5fe68f17724ee1cc263e25492d573d9f +size 29360368 diff --git a/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4874b10df75e55b429fa5bd624748d48bd042929 --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add2f6b007291c5e485a865a8c3edae79e81c2d76386eb53e1b672e918083b8e +size 29360368 diff --git a/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23fefb6a43db546f22639e2ac1998e87f5f211f9 --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb4a663f403893b775a3c9647fa791419ad0cd58d31ee633d8d7ed84b3a4de4 +size 58720552 diff --git a/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8a7dc9f45a67592252efa0fc30d55aded744645 --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab42a6fbdf7b2422184892a685932bb2c422fa84c09d6b902e602eee5e7b6d93 +size 58720560 diff --git a/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..96c53c8e8b07eed9c31458c4d98a6d8ba53b307c --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01da0dbb041d4a5113de254793b61b87003a4f7c973aa4c511c23547831d0413 +size 58720560 diff --git a/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..381221c57374caf0d42c44edb735195e19c6def9 --- /dev/null +++ b/model/model/decoder/16/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e25fb6414d6a08e7a9bec269d8117dfaa9021609824a4cca37654c2dded80d +size 58720560 diff --git a/model/model/decoder/16/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/16/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1ca2fa600972ab4ec65bc87ea2faff2744901b2 --- /dev/null +++ b/model/model/decoder/16/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c338cce866ad130c8df2215c1e27912efc6aca36005db1cfa42ee49f31bc1b +size 8288 diff --git a/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b82c828f3fa4b4cb4b5919334788e73b498927e --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06c46dc612ee5dbcdad46567176e0892fa778c403219edfa7d5d49512851645 +size 200 diff --git a/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8d52b12199268d4df072aacc433bd8c72d0bc4a --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dba4d2a7fa9b891a8b5b61711d9cabf6f8b0afeacc7a45703083ba1a4c134966 +size 200 diff --git a/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..759350919d08c087d4f7571369531bb3085d1d5b --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80d0f0518d7d93bbdda86d9a2bfc4b1dc9be7599c55fad20030677a76aeb173 +size 200 diff --git a/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..065420e403201cdadee396d3d7d0ff1589486c27 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a6b039f5d4c42f8bd6e517c3a1d21438227423a6e0418c70347e1300ee34774 +size 200 diff --git a/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8545592c53dbd80924aac870ef454ebfd482340 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c891945df4664e37cc8d292bad79fb87cbf6030087448d1144a51670edc034ad +size 8388848 diff --git a/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dbb5de58daaef58fdd46b62e74f333f93b289f99 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b0a13ac4c851e2ea39df9812643eb88e24f3d6e309be378aee15472b9f4400 +size 8388848 diff --git a/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..934c0870da409bd3d849d41251c31d8993c9a312 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653b9f290abee2eb16e45b3dd0a558f412aae4d4b72860745009f4453ba1a2d7 +size 8388848 diff --git a/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6f6bbfcdc3e9c910293c3b89fbe643c5054be38 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa438c233a27b9052003bf54938d51861105e6b08f97aff6d94e21038ee8fc26 +size 8388848 diff --git a/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b7d24ff11456f90807a6995f00b8066c122742d5 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2607ffecdd859ee623d4fb9c99ccadfad97a3cac1192d6d2370b2070accadd3a +size 12583264 diff --git a/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..025bc4c5769dc821a8987e85be615227190c8811 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:061128ae28cb557d4a14f3b0a8b31d1762f3b4687448ac19a185e417b3c7f994 +size 12583272 diff --git a/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ffef8ba49a68697db12db1c1d8deb2b026bf7a39 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2c0d098fbab32d7cfc6651add9cd314f33cae4f9ab0fb36e775a1f7547eccf +size 12583272 diff --git a/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a47df3ca24afc3e3cdb959abc66fb76ef8d1cb18 --- /dev/null +++ b/model/model/decoder/17/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab3ed45d23b0ed2f9bc5d744f1408d3b51d1f548c62933e25704f19a3c0996e +size 12583272 diff --git a/model/model/decoder/17/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/17/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ddb05b91b2b76384b113029455c5e6a3123b9c7 --- /dev/null +++ b/model/model/decoder/17/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe9e6ef0dadb8ba66d7c2e503a52d4b0fcf4e0051ca97a607a6a1a64aa9fcbe +size 8288 diff --git a/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ea78dab209a02db211365156056073df7353d3d --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a990bfd94c3f32fc7cc6545dd83dd6839bcd83ee6aa5ac15c6674dad90bbf1 +size 29360368 diff --git a/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb1e3d3debebd500380ebfcedba5bcf51d891f1a --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18c693eeb35b1c7af9cdfcd24d2d5f9f4a1c8639dec651b0e41dc186d4b1356 +size 29360368 diff --git a/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a276165315a16ef444ccb4560d1088db27dcc87 --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f31a79af3cc47c430d34cc2db9e212d1ef08814421138d4da6e2907eb9f7fd8 +size 29360368 diff --git a/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..11093670bf1815fc81a8e5009a03b6a6ca118b18 --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce6843368ba0a559733955fa75f8351ea057eb22b58f147c95f314762f30ae1 +size 29360368 diff --git a/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66769878c644cc6f9cfb8569af9f616012c31012 --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e471e95f7c61183441f9c15175d7f4db396220c3cf89ebf381216a4787837b +size 58720552 diff --git a/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a8a50675749ee4094064e8a11b1f4ab082aa4f64 --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5a74d76f01d709a91442f05fe292bf723f003dd53ab23f2c8e318247b44cf9 +size 58720560 diff --git a/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71df79dbdf7cb61021bbe1233b029e451e3566cf --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5735a86bd26323877937d71790100f7351cf858d23538bd11b23cfa2d2d64f3 +size 58720560 diff --git a/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..561c315b65c7b569b6538cb406d532e77c8a656b --- /dev/null +++ b/model/model/decoder/17/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa136d6c094cf33ece28a8347c1725ce996d34dafaea5d23519757adc3c40d0 +size 58720560 diff --git a/model/model/decoder/17/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/17/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bbf0ac9916d9b77dcacd8a1af14cbddf28b75a3 --- /dev/null +++ b/model/model/decoder/17/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:937064f299b7d6e14c0decfd7b582c0cd2b0a46145c5b304f1e5a9e3b396045f +size 8288 diff --git a/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2426751afa6a3e702c5322c00a7100d1c3309e51 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9e73af5ca16b7c0f8d811d9c526aff95d5a163f3e72d61fa4394026bb4de9ff +size 200 diff --git a/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52059d2bb2b8330a706d6fd2ced29c1db55db343 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640bdc67d629dcf5107fc79ec34900cba9391c08f9a8680ba29d65bfd00d1e15 +size 200 diff --git a/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38c67ad5fef5cb49bf6f486a730215d26d18bdac --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f843b9698a531137aadf314804c268915054cf5316e8222253a9b4428b2ff8f4 +size 200 diff --git a/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..501497df606288f9cd49b640b4c6e7d17556b6d1 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8223678504c59d4b33179aa6dde2f7fff316ac9f26cf12cb111eb96083c952 +size 200 diff --git a/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dba910563676c426f9accf09e80d7aca6db83c5b --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37c45e4892d7e050be185dec9ef5e1a5c2ad8bcaae114628cc8da3fe8c636286 +size 8388848 diff --git a/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db9ec25c54289dd08953ff533c795c27619d27a2 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a091830db4d939a1485150740cd7a13a82f8e2e99d85d3ccd00f7bdcc5bbb004 +size 8388848 diff --git a/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66f0d8c85cb62c2d7126db79ee3fce481a134b9b --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39849b15c79a3a82d733d42b445353f1a6608b546dd0529b729e502432024298 +size 8388848 diff --git a/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..becfbed8749d7c82c4657b361d02de8c2e66a7d6 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec461c403c2890b1942d03bded91483edd2ecf577d302bc07d202e6b212c22f +size 8388848 diff --git a/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..43d97882a8678d07bd338b76264899c7315fa66d --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21687a8ea17c3462975364124d8c1c3d7b8e2599c02de6417d813a3a3ae8a681 +size 12583264 diff --git a/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..edbc0e0975623f301b3a1a593befc1714c0c44f5 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9030b20579bbc40f92cbf53b826dbe34bfba494d1f199cfc6da2cc37b29b8533 +size 12583272 diff --git a/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..05fa49cc9f541624ee735b95b10218670cbdd3d7 --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c74951e07525726ea873bd2f5bc9bedf5392791b86accd6d856bc51256c67d +size 12583272 diff --git a/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ccf903684eff58f6231c87f650537cd9230e78b --- /dev/null +++ b/model/model/decoder/18/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa7156a4c1b23e6fbc75f87a8763e8795582bf0c012ee9fe7d4be48b4d679fe +size 12583272 diff --git a/model/model/decoder/18/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/18/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd1a6b7129f82d7b84a484179754e0127ae2970d --- /dev/null +++ b/model/model/decoder/18/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a4d941f8bb409f5e40910e4df3f21375105cd1d1b1d3e673afa2144181ffcd +size 8288 diff --git a/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3805e915e10deb8c51cf769317a4c29bbc779304 --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7de315d37456d8821b04c9899d1f9f9f3d5d56c488a57a8ab6cbd2d03268561 +size 29360368 diff --git a/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8f916499b24d7323b6ce48b3a234ab22e0fcd1a --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8826613c8ee241341cdb6b3358f8f166e73acfd19482519f7e88a440183f900d +size 29360368 diff --git a/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a6161167fd704d2f93b204dbfcbafe5c0bdb16a9 --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4433ec929dc3dbac64998cd89f9a370cebe6bfa264ce4ae0da09f0a5d3419752 +size 29360368 diff --git a/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8fb91514142d040197490fed1b7a29cc1bde1023 --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d7b6fec9021c6fddeb21fb968f6d2f56c1b816f5a8bc8cb03b6763de0187765 +size 29360368 diff --git a/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7db2e9029066944c2f8fe086da3170e61b2aa0f1 --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3802300d03ae83c76a21490209128dd3a8c094fbbebb9cb9f540a69c3dac9854 +size 58720552 diff --git a/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..efaea4a3c62ef8eba40e03492c60ce6995b728d5 --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361d16f7c0368d6a68fe761065b19650fed575763d9ea60f2eec6a34ebd1aaa5 +size 58720560 diff --git a/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa16e8ca021563a3577ce6349916ffd562ac6ebc --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd925da10b84917f10e8cb36c2b28255d705d514d21f7b743475f8161ed06fe6 +size 58720560 diff --git a/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f80f7eddae58ee5f5d21d914724dbd5fffeb80fe --- /dev/null +++ b/model/model/decoder/18/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15a70633adce2d86dd4be9fb66f3789ffff02be1138de07787dfa0ff53bfd5e +size 58720560 diff --git a/model/model/decoder/18/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/18/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e82590d9a6306f6d052bcf0bc8f415022e2be6c9 --- /dev/null +++ b/model/model/decoder/18/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9923be986178951238898a0daf17d80eeaf4fbe80f5a90e892b154bc911912c +size 8288 diff --git a/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..095096a53c08d523c9a4d65c760ca5aeee97dc6a --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:128d417d14da8c18c1d21d41a600a2867aaf546d6ea6ba3132902ff6efe7f245 +size 200 diff --git a/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1b944f3f78f1ef862d1f3c66dea5925c3a4d1515 --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f138bc0fd86e61c64d04f1012ba7fb0bbd8dfdebbdf7a0cb2781a68e1ffcf4c +size 200 diff --git a/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c461930c4f9a3f44c9a9e4d601993989f1e1be5d --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50f7b0c243bfb421d4588fc17b8ebaa01f190a9ec3f6e7742bc91fab95a1002d +size 200 diff --git a/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..26c47d93871058eb52e86f413af53ee9dfdb876c --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2c229dc56739dac68ff38bdacf3605f41ff94b8c19e77f9f4a37f6bad62627 +size 200 diff --git a/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..200c83ff6281d35933b0f95d2fa60df168b056ef --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2988a8204ab10f21964abf746b24570cf13902b45bc30a8fdd4ebfa4e5c028fc +size 8388848 diff --git a/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f5e93ec64031e6c7eb398f84c4895546a91d6570 --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368ab4582bad17640cf01fbc38c642451abba1594c8c018e1b2d072ec58245e0 +size 8388848 diff --git a/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0b5b2f89ca8d780156eed14a7743334477bf5ca --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6eafd458274b427e92454f37515461c0a4979abbd541e4456c5a98e945231df +size 8388848 diff --git a/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..44fc2d2d828a0d2f274f4364642763eb9d62e836 --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee02ba334d93fa99b89af6cbbf6c34b996d7e199386229d8545abac4d9643d4 +size 8388848 diff --git a/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0d88d9a70e37d25e70de27f6712bfe5b850b1b6 --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9beaf51d10ddc244c5e7339d4921e332a4a82aeb17353eb5c53a2cf415f1e02 +size 12583264 diff --git a/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cdce51804c21cf66d5299f69c3acccf45d6e838b --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa1622a704db5de5750c68d089494408a7786ef5e710678bbfd342c9f6e49163 +size 12583272 diff --git a/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8661da27ddd206ab1f0cd87b7acc658b46738692 --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12da92efc4fbb9dac8b0d13884537f69c140cc5d7bff21ea9fb344faf13d31ea +size 12583272 diff --git a/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..025ae85e8c754eb517ad3353ef07a9bbcfb20454 --- /dev/null +++ b/model/model/decoder/19/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7123340e91f7df5718ad6aefbe8da4d90be84408427991b7876952f2feb4afdf +size 12583272 diff --git a/model/model/decoder/19/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/19/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c12819ec0dee1fe554764d391e36af6da6b8576a --- /dev/null +++ b/model/model/decoder/19/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dc2eeaf6ebfc1cf554796ddab43c8311f2f48cc6bde20321fc04dc08ee2de1 +size 8288 diff --git a/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e8381f55cd7ab8c203034eb6159ad949f452a5a --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e17602d57c8067b11731a5ae1d8d0dc30cfcb982cf1abe78f8dac164dce41412 +size 29360368 diff --git a/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1d400e35287e7bac0d3b605bb5e8d5821d3867c --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2470c40526d10a4f66b524874c7e2f91e2002bb4b6678d008c49673ec9afa448 +size 29360368 diff --git a/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..392bb15aecc8404b9b575040b2ef9c0cc90253bc --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81081b339d878579311724a08b7f1626120c6aba789828166a8a354d3664975f +size 29360368 diff --git a/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2cf8c162f037fc7d7114b4c6992d10478cfb88e2 --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2720243a3854dd4bfa23072e04830b7c6342082de3a2f534d2b0e55066ad9b37 +size 29360368 diff --git a/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06e990c8e9726693c0f3772117ea12e873edf2fb --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeae75da3deeb26b97626bad2d6db627e7e56d21037785ef2f4668ef70d7bb93 +size 58720552 diff --git a/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cba13aa441499bf519efede067e38b5b752e526 --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5643e8722a4c91b0b24b0a7e58c3178da166f14d013dd6ff2cd59580764097cb +size 58720560 diff --git a/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6f32aff0fd409f087cbf7a4720439a29d3b308cd --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7798fe1310d7510a8f8cfffb974dbf58707a9f051001e41a1890f53c725a17f6 +size 58720560 diff --git a/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..28d88d4ebd6d33147251ceb32fd2eb6b9d60eb90 --- /dev/null +++ b/model/model/decoder/19/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02394d28d51fae024d2020e36c150069cb198d2ccb0033553c6f4bba079d7a9a +size 58720560 diff --git a/model/model/decoder/19/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/19/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd9f942d166fc5b91587aba70436162eef122103 --- /dev/null +++ b/model/model/decoder/19/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a88b121b14d1691907f02640ede1d1358979291abe6c67fc92212fe5cbb6018 +size 8288 diff --git a/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca0fdab48f4194c1813242174e394ec2b9058fe3 --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57cbeb39afcfe59d5a66f8e4dbb76ef1ebb96cec563e3bfcdb233b0200ac831b +size 200 diff --git a/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b558ddf2ce7133a737876a233da9e5f443b12ff --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d936d48e466269dfef1a1623af33f64560772b2b030956173c4c6fa9706bcf4f +size 200 diff --git a/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b764cc65e8d948ea250d5de37aab6bca66aec9d --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6376d3d3cd3391af7509e301f2216fb2fb63ae1df7ff0a4634174f63fa080e +size 200 diff --git a/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9fbe5abb0ba40167c838908c078e0f22b30e974d --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42fd8cfc70a8f4a599ed8ec1d47a892e712f8f3134ecf989488721b03633a1e +size 200 diff --git a/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8b42278b399ad07b46abf162536c6103ffbc30b --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40c851f3cbfa15f0174b4a5ebaa2c99732d9a0776d8762129dab2ee1ce4fa3dc +size 8388848 diff --git a/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ab7b56bccac1dde3f56bd21f5ba663cfbb500e8 --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4473c62ce5b41e31548d338e964a6922b095ab79f88e72b1703a72704ab21d +size 8388848 diff --git a/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30ba57836fc95c8ec5771848c83c2c7869e164cf --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377578410d1e7d331dcea1f73a67f65a2dfbaec542c4caa7d55c9f8387c3468c +size 8388848 diff --git a/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1ceb846deacca44c7ec8b3faf5854236c894d083 --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75bccab9441458126f7811c60a0a5222797d3773296b0d667e23118a455e594f +size 8388848 diff --git a/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cadec3595f3091161da6651cc46243d35da348c0 --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0fbe3222c825f1c7fbffb6cef185eff18e9ae5b15063a835e999b6bfa70e8e +size 12583264 diff --git a/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a628b147280c0772e9db146d718432b0ce075610 --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4bb63e5cbb7f733169ee3f14f234f9a884b94d661fcf696fdd9eef5a9f95c1 +size 12583272 diff --git a/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f1be648698ca81734b5a42dcd44eeb8d89ce9b05 --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920464f8cd16bdfe604081af1b9dc38b019220463c6f34a753c47cc6f19b1c99 +size 12583272 diff --git a/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ccc8a3c893ca88d980f5e57f8b649aedc42fa72f --- /dev/null +++ b/model/model/decoder/2/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13bb35ec86791aa1af8f0f23195cd6a8426ccb36462aa150b2c5fc0cee1afa48 +size 12583272 diff --git a/model/model/decoder/2/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/2/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f8f9a1654268cc936fcd1fdf7c1e8376d5ca395 --- /dev/null +++ b/model/model/decoder/2/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80acb153f7372ed250d38caab623bb05594411ff1ab7fd07f95f8ffffb46568 +size 8288 diff --git a/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..96a886eaae76b982ecb06df309003f946d4e5d5c --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a43f4223c5b47d2f0d986406d16702e01669a6572a24507925b47b4bbb9c59 +size 29360368 diff --git a/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5f06676bb16bad4187baaa47531bb50a98eb287 --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09900c542d2457fbce5d41ff12be28a9f938d6e6d019aea5ec377749049c75ea +size 29360368 diff --git a/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..929b8ed0e24eadf7d6d3d3663c46a8f1d7d822c9 --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfd1aad09357c51e53e9d79db12f585d580d7bc31a4b2bb37f0c62789cedf52 +size 29360368 diff --git a/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34389c570b249de9e382c6666f54b967b10363da --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c02231cd84abf1385df20bfee05c2e4aad8c631493cf813f74d25366ac26d264 +size 29360368 diff --git a/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb256baf0cc98b63254c45b5a6afa31b8127248d --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc23019ffdcba39dd21aac75e1e615c3c2813b6be0fc898e171693b403ca3d3 +size 58720552 diff --git a/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34957435f33ea997cd88c0e916d35cd1004b162f --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e9d9eb5344f3cfd6d96998d4b48a0d380a25994d9404e30d8b40e56b9bd5d9 +size 58720560 diff --git a/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..51dd46c8040cd45863c3d7edecc0f178ec44f646 --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5443c867b27cb603b747ab3dd659c47ab73ef03675675ed0cc9c99a013f33e80 +size 58720560 diff --git a/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f54a1a6df276f1379b4c38ac0c3054c06d69aa97 --- /dev/null +++ b/model/model/decoder/2/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51127050d148bd643e0af26ee8074b03bb751165771d28e776ce937faced73d6 +size 58720560 diff --git a/model/model/decoder/2/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/2/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cef0edb130cc45948be0b63c1d6b9c2f6ad97c74 --- /dev/null +++ b/model/model/decoder/2/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b712b80bef8d3b2e10f0592acc208bac5e9aacdfa124ce0804cca2f6f91ad32 +size 8288 diff --git a/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8af2b185158736ec90bbc103fd9e681194fbd274 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1121cd1e9e40126f9b4edd8e1b046e1c0bdedd955bf762593869c705f8069eb5 +size 200 diff --git a/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09d3763f69eaf48a3d3a46672dc7cde9fe5a46bd --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbbfd8d380be0646a89162872e7af6ed05e99ae77473b08bc9787f6d91108b69 +size 200 diff --git a/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6a84a19384c81417f8319992b3f373d1569d984 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e4b272ef542aa839ee3d4d6554e2e3b3030f5fd40b333148353e6c170350945 +size 200 diff --git a/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69fc8b1f0f3ab0ababc230bb8f20863a750f6d60 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f08cde9e0d311dbd119ed3dd62877f476809605090a42437a2ce3e2f201154 +size 200 diff --git a/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e3ab4a6869dd23510f069c444ef9eaa0d4eaece --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d866845f1a7583bb76e80a00e69f8a2c11e9b6d13ff84fbee8410c6368b30c3b +size 8388848 diff --git a/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b178e579c5f03e5321a6751ba174fa7dc6c744a5 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da9cc06eabaae1fdc0daceab2d33051f85862d8fdee0cab994b5ec8ce012aaeb +size 8388848 diff --git a/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc7d713347d186bbed5f8a6d730617c6d3d0785a --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e379cb63b2d3a5c1b2128f02b9438a2b8f56c5ccae27b2fadceff956272023b +size 8388848 diff --git a/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bef18648b6f531f85aae21f369272899fe4e3b95 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6ab536a4cd1e8777eeb55f870b3dd56920ce7b4b111c93f52e3a0dee48dbdd +size 8388848 diff --git a/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd31e2e635c1b9cae7d28e437be41c10f3aae391 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9aee67b7aa71880014cfa6416eaad17c53cabcb0c318007b7708f539a59560f +size 12583264 diff --git a/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e674b8de9ee9262643a6c2fbc6e4533297692135 --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f3ffdde6750864bc792f451d55b3890aaf0b9a2830928f4abc1818e84671609 +size 12583272 diff --git a/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2406a270dd6ae8373fffdd07ba9a82d6187dd4d --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e5c09758d0bd9a1c07f973ed0f76e93d43b685544ffdf6f10814a48aa6e1bf +size 12583272 diff --git a/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b24387c6e7faf92613928d8d70f4cf53535862b --- /dev/null +++ b/model/model/decoder/20/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec169f2e2d1c9bfb54447e22da6a69cf097ee1f58e9da71af74c8e2f56f6b95 +size 12583272 diff --git a/model/model/decoder/20/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/20/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57cc8aef29df7e14a05159ad016caad286de271f --- /dev/null +++ b/model/model/decoder/20/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40419fdb6aecfc167fdc248ba0398af41456319825d2b8b52ef5fce39f28346 +size 8288 diff --git a/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..549cc0ed4509c1168762934f126a36abe83dc65e --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ecbc6c318236811aa0baa78053fe32e0a543a10a8641ee92fa32ad828b717e +size 29360368 diff --git a/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2dbdd2a947d7fcdc32ff711f68bd6b1bda5df9c --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32234dc562efc73b8c6a6d7ec6bea53d7ea9be0d8bcbd4653f71df39f52b3b54 +size 29360368 diff --git a/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..280d5910f6dbc514149ee3fed5087edeafcd8618 --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78f6adc134eb641d51c0675fcad5d77dfd2b3f5b1db0add888cb5b96387caf2a +size 29360368 diff --git a/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9300c9fda56b82169d0138367942190eb265fcd1 --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d311f6b82c049a52b61c0e082ecfa46e3294d343356468fc41a532da8daccd7 +size 29360368 diff --git a/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed24117e519d8a5a7a0c64115d62df877e69aa1c --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5413e00c7f89ee98d9cfe80ea205cb73be83a7ab2d804e4e000a222d4afc158a +size 58720552 diff --git a/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4e3c81c9bb541234caeb5d54c2425867612855a8 --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:242e9dbdfcc0296431e5e0e30eafc70827aaea1dda1540002edcab4ad3d78567 +size 58720560 diff --git a/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3af3ac6015105d884ba8a453c6be769f4506e88b --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a9e471d80ea34e85ecd8b387675ade6d2488ef3a060eb81a780974f7e8d11da +size 58720560 diff --git a/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fcc29e7358fa108ff29bfe6a2996745e696c38e6 --- /dev/null +++ b/model/model/decoder/20/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5515357a131ed80ed18eb747cd8d2e0f845f9bfb3d7dea273e58945159cb3adb +size 58720560 diff --git a/model/model/decoder/20/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/20/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fdc41473d4522e1ffe81536211cff10f0d2fb6e0 --- /dev/null +++ b/model/model/decoder/20/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb47d306e63403e1be3e67ec2389266c7c34af395ba6a6c67c02c1326d255956 +size 8288 diff --git a/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41b111ae86a5c63f6cfa80f89efd2c69c96191c6 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ef08b243e128496a75ae4a9a48f5575979b5e4220cdcfe1660d3377e968c0b +size 200 diff --git a/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c5d032f15af74ada8d1703ffbb7b80892fdd114e --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a5197f7c197252a97c04c82de0f70894f874d0f705e08ccdfcb981fcc457b9 +size 200 diff --git a/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbcf918611148762c03fc6126764d75a3d9be955 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44e6af95f192105c8a83498899fa95ef62f7eae60d3cd4eb7e699b1bb7b0eea +size 200 diff --git a/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..923b7e69b215f34e71e1ebb2e4cc72ec4dea0b92 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60fdefe6977764f8f1ce0cd3ae0723fda574c77ef0818526d91f7acae1d2de5b +size 200 diff --git a/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1632ceec52371623b06ccfc8ab46c134c4307701 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d54dd2b1a4db87194a81de8b0cc74d2f4ac504e1a3a5db647d41705f0ddb52 +size 8388848 diff --git a/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7cdf7c71ba64c7fec1ba9d315326c97c589e4c28 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f081ca02350ed51d278c0030d34e4b0d8b482fb9514911d5f3904b22226e3f6 +size 8388848 diff --git a/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c07acc5c0c8ad80ff6177d348739f5ef1311eca --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23504dd1915105916f81f1ea0f4d8ab94358fc4facbcf540d0bcbf2bd80867a0 +size 8388848 diff --git a/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d1d72582d64c6314879a1105fa928a9d0fe4e8f --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:994432257ca2e7013c650ea18c29205a4c4c9dd80b15fcb4e0d395154d85ebf0 +size 8388848 diff --git a/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6597b0e8fe6e1475d614adf07ecd157246892fdf --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a1a62c300a10742f27b5afcba9154212b66bc056926b2d7a1d32488459b010 +size 12583264 diff --git a/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50e281991c7a6cb3601cd91a6c67dffb4f314fb1 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f973ae7674bb37685acf9d2eaeab76a97568b9c6b6bb0c52d9e97db4f7eb45d8 +size 12583272 diff --git a/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7c80149a40471648972c5288789d7de3fe0149f2 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec28ecdda13976b6936e2fd335fba4e6dc42e3ab462a2ff3a5d455f1075e1872 +size 12583272 diff --git a/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0de1d1eab5aca730a2aba0e805ffd4470021ea66 --- /dev/null +++ b/model/model/decoder/21/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afcd02d7c9c69b450152959cd270ec295ade9fe5df79a37b8decf7cb3ff27369 +size 12583272 diff --git a/model/model/decoder/21/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/21/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7066c650bd75bf9c6deee29360048b78af79006c --- /dev/null +++ b/model/model/decoder/21/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cfcc092d2f73604c1c68b870c0e0261a9c700f857ddfe683b52bf00c1b79b5d +size 8288 diff --git a/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aeff125ad257b0dbd2cf6a42a2a9a7b173c3684d --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570adc06b110df4f093d2083786c241b77fe1c66f399cbba779f2ef4fc4cf4b3 +size 29360368 diff --git a/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f161c2b9babdee4a3ce267b852fa6b331a0218ac --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e028e62b06f2ec2cb99643be33e86310c76181a253176f4f14f8188bb67a7f +size 29360368 diff --git a/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab7760d1656f2ec408229af79e1fef34198863d8 --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfdf48c41c7cfa27d6b91741962df9d2ed245ba9ff3e6edfef04aa122cef27c7 +size 29360368 diff --git a/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b997455c5ad2ad4d93f13db9ffd8ecdd31ccf71 --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1395be82f2e7d7f8133ce57f6580235ae8e34f6b0e01baf40fde8ad5b43dfb7c +size 29360368 diff --git a/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf8f03ec3bd01e768d3947cac2fb6481f0577dd8 --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c1f4ae0d10e82efa29df0aa60f71327a2c2b0eb1026b639af812f46e66ad76 +size 58720552 diff --git a/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0270b0df392fa19e54cb4650f3a816ec2e57def1 --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55033fb5f145281b643751cf816320967adf71501e210336b2b5f19ceda9a572 +size 58720560 diff --git a/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..19e2cfe7042c967ebb3d7f9c0041412c782f298e --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b408090be2832ff3a3759075789d35ab9ebc25844a740700e2d807ade8ed76e8 +size 58720560 diff --git a/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32254b4a07af869d12fe4ce6ab74bd9918db4db1 --- /dev/null +++ b/model/model/decoder/21/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d239fa6e08de7c66b24a74c6fe429366b8b4060239c0ab30810753374274cd7f +size 58720560 diff --git a/model/model/decoder/21/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/21/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f96a520de99fda4b7bf4ae275c4e5542724d806 --- /dev/null +++ b/model/model/decoder/21/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b0816ed357b07c7c3e8c1511d27e7c3b39379d4d89ce9613d734fb012aa8be1 +size 8288 diff --git a/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2d8ba5fe62e6fc86bf66ba420c9d849c1101f949 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec9176bb99ded983157279df9c7500dc43677938d7ee0c2a2935e8b782f05a6 +size 200 diff --git a/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b9bd6daf0692c54e8dcf45d41d729bc8ec63f3f --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22cdd876ef217fed0b79559be25116830ed6d6fe1b84bbcb80bdf7a7ae14dc03 +size 200 diff --git a/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5d24e4caa86aabeec5ea49d25fd55420898b1e4 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7333ac013ff1964a723b99b008aa4fcc0706e0f8abf776d64483d10f00d98023 +size 200 diff --git a/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0ad8b96ee5f3b0ec7e83fba808d1a68565d574aa --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d481d157f0d38874d030c97d290e3b9c8920e895854537ce6165caa8773d53a1 +size 200 diff --git a/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7865ea997af7889dbd388d1460a12bd94bf80bba --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a9d1fd43ce40b68e0759392bc95d5448b91b7ced2f10bea7edf1cba304cf79 +size 8388848 diff --git a/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..36da31e5ec2d4e800b98989d1190380d1b5d4e99 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aaa8fb1fe3d344e0ef896516158cedee6cfd810396bf4266bd7ec6b744f0fa3 +size 8388848 diff --git a/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2eae130e14076ff19c411e603ed9ab9687a7a26 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727725e1f66768d1445659cd9218af4176efdc59ca58a185272eef5c04a575b6 +size 8388848 diff --git a/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fffee42fdd73faddfb224a6f9216dbca3e76c136 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5180b1f3ea6aa0e8924b99a5feb4b01e61ea3272873431196396b367cb853078 +size 8388848 diff --git a/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2db44726012000f87cc7c4cc20e3c997b0829de --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6eadd134bb8ae1636f8c190354879471915f547bcb5d83e1a9d5f4f55826889 +size 12583264 diff --git a/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd6d96fe99f6a0a8c17a83bedd7a22b9d49f0816 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fadb4d752b8ecbd93c9062fdfc507b954cbf3b400ecd2ea59342111887f8927 +size 12583272 diff --git a/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97cce85199d7e5bffff76bc75f046cb8c7464ec8 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d023a8a9115d3e340a1a8202dd5d9c79995f33d16cc938d7ea1a8a7a1575bae +size 12583272 diff --git a/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d88846f4f2c7b408b80d74e180a4eccae40da07 --- /dev/null +++ b/model/model/decoder/22/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caedecb668b7ab637e4df623f8ed4ead1ef7293b86690b95023207ebc82ccf4c +size 12583272 diff --git a/model/model/decoder/22/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/22/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dac0e2c7f4e0b89b4f7fc3e48b6fff6e1f946959 --- /dev/null +++ b/model/model/decoder/22/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0498147439292f48756f2da9d816a8b07ca5681a9b976581a6695513edec74cb +size 8288 diff --git a/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f921d7cc4ad1ef6c68f4693424157e6e7d960170 --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6ad063734c7fade83b3989f1c34f17d4fcd71c47dfa769d3bacd20cc64b23e +size 29360368 diff --git a/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2fcd3cf34f9ba9049b063df7a72fc807ab6a198c --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41e3dc704a325099b4866c0390d24f4995bcaec0e1d053600df5433bb800e90 +size 29360368 diff --git a/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c288e2cbdda7a0d1c232c75703cf646bae6f0ee9 --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986ae6251b2c271989a97fae545b734e72ba6dd946f29a43bcc671f638adbe28 +size 29360368 diff --git a/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..48994d1c917406f6ac5c8dfc14cdb58b7ff8939b --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a52cc297d4271734af6e8ea3717354558b0dd268d3bb816ffb4f9f94c02514c8 +size 29360368 diff --git a/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d45aee7f0dd220da418c4a8e62da2491f1473f7f --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb62a3b31aead9665301eca444bf3b8bb75cf56418f9e0bff7a50f88ca00dd75 +size 58720552 diff --git a/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ba6ce9a440da899e70831bee07bfcd9c8dc6b6d --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e42dd8c0c5993dff62b31a04815965031cf914ded2fc221e25dcb616d989152 +size 58720560 diff --git a/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a03cd29c36c2458fc111ec2d217cc443f385af5 --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8894d1d5059f28d72b4813383d976582172456613b1ffaf1ec34233b9f01789d +size 58720560 diff --git a/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf0124f72d2c0690dc12d47ba99f74ebe28451ca --- /dev/null +++ b/model/model/decoder/22/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2698552185c93af5d38fbb8346c0179a774f0bd984d5c4229394fdc511866fc +size 58720560 diff --git a/model/model/decoder/22/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/22/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7cab29c35380339fd6f4b2a114f088f6bd3b2a22 --- /dev/null +++ b/model/model/decoder/22/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36efb39b88bc972f357bb29015e639a7de0f69fd02d557074be519f9e6366a34 +size 8288 diff --git a/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d18880563ebae6bbe93298f90172b56eb940b218 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b404b4d230eec90e8a90c203e4f92a984e9a59100e6c6a94b2772e7e5209cff4 +size 200 diff --git a/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6baebd34b6615298a179fd94d820743919005e5 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15d60321347903495c16c0aea8618c2c8d380670e3c370f3d95a0e78969d5711 +size 200 diff --git a/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6f74f15c9eaed5e356dde233565d6d9dcbae8f80 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d692abf9a16f7b53365d6fb5099871c8036fc16901ce607aa3630f0ade70b312 +size 200 diff --git a/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38560a0eb576466a3f0dbecc818d1182a2d34238 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4ebc20a31b2ed292eb35f752cb5a22146085e4955c4d13cb17cc4fa1dfe2ea +size 200 diff --git a/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f267e734688755df1cc11e87aba6028508bb2240 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840547f906b590bc379fd8a7f86f619d1f0b76ab6382f49f3caaefbe53fd46bc +size 8388848 diff --git a/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d2775e7ef92f9d028e1eb82fde59eb5d13273026 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68da2aa140818cdd77bdf82becf311ea91673afa4073d50fd278cb3201f14d3 +size 8388848 diff --git a/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb00075aa758d389a9aa10e9fb1ab42c11a96ad2 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3935a7b0deae187fe64a5533c086508bee2f59b8dbf572cd90af4d3f239c81 +size 8388848 diff --git a/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86554208782f3d4736baf262e3996cf46831493d --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d92a63c97fd5b94ed9960b53aeee5bc552bbf8c4e9ff4967e0dcbc29552759dc +size 8388848 diff --git a/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4787053241e4b7464e603feab2cf909cc972b455 --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e5c8e7b6ee01ade3420752fedd4306ba55c502a8ffa37e569d3d602e340361 +size 12583264 diff --git a/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..614bffcfc14f3a7a48a0aeb44b6759c112ee4a9b --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51977b5372b160857470269ee7417aa9797fe96c34c3f31eeee4292f5ee5617c +size 12583272 diff --git a/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47bbb63f29c78a4aa350127c69e7de6a36ca229d --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f23fab76a837613142fcd2e0edbf18aee3473b0723a44cf6625738765f79c2 +size 12583272 diff --git a/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5365fb07998a4e646e1650eeb6bc385c26d1c74f --- /dev/null +++ b/model/model/decoder/23/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44b8c289ca7727f4117bb40799564061828ab32ddf4a3ae6cfc37deab3ea22a +size 12583272 diff --git a/model/model/decoder/23/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/23/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8166e6908d7be845f1c4dc646fc3fa8262456484 --- /dev/null +++ b/model/model/decoder/23/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6105a9bd00ea98b471dd973198e39afa9b8aebcd422867ccda44f0beec2ce14f +size 8288 diff --git a/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30b8bcc2a2bdb6b23603a4e778322df8cd40e76e --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d7ef45e33052025351d379243dffbb55dc7f3cf2b4e4feaf04c6f65056595eb +size 29360368 diff --git a/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a451c5436492982a7fe2b664e4e7cd9764d1e979 --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45fc049d308590968d2ea9055ca1cfad47b4ca78ed9ac75515c77c385bc8358f +size 29360368 diff --git a/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db8de5bf774eb5ea7cc6c13a840f6bb332b7df3d --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e92ff52ee057413cf169550210db3ef83e163ce872cb13247aeb89a8315c0393 +size 29360368 diff --git a/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2564e172cfcbcb9b28ddf67937d1bc9bf592516 --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29a2912f12d3e443573793067dc3314fc59557f7e57240b1279b19353101f338 +size 29360368 diff --git a/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..20e167ffbc086a727764ef29f63a007087a3f38e --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:930d880f9cf1fc2b829a3b64c9946152cd5d70e68e7fff7eeefb5f41b6524f3e +size 58720552 diff --git a/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..914da936401da3392ed76ef4318c62ef53041da4 --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fbd766036c48874a8dd2d64d36b55fc28e211581587e543438cb646b706d994 +size 58720560 diff --git a/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..65a6e7251b1a131864f5086e0fce0887cef15d20 --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20de8c028a3489be81f402cd755958bf9ccdf532a51b1fda649121ed0831b7c +size 58720560 diff --git a/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d13346261ef1ae9b9c230290b34bd69b5a1046f5 --- /dev/null +++ b/model/model/decoder/23/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45524f7143421e7b599caf7c76de82985a76df9f6577dd4cbff4da35e58b603f +size 58720560 diff --git a/model/model/decoder/23/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/23/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a21488e6bc9e893940d898adb439d20a9e479661 --- /dev/null +++ b/model/model/decoder/23/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b94933eb0370bd487a0324f4732c1e3533090c178dae58bf8bae3493ee49ea +size 8288 diff --git a/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbc10c7a920d52db1dffd6ed62fd2ab4675713f5 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b48f31b55878ab9b3b667e39bf6fa91fa27fee5c8e89a1e6c77286d47c7f69f +size 200 diff --git a/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bfe17deb85b2e5de23511edf69a42495aaea2dd2 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89074d11d91e1e1956c104253486379956e4d6e07520c0911b2d932739279f8b +size 200 diff --git a/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2b0b188244df57875318e66c811a73e7dc77973 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d11f51e5c3c33497c0ba8cf64101561e71cf01f7453bd2793ac5f734bf896bd +size 200 diff --git a/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcb096271d40b2802a342732f16df20f0ecf1838 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cacfc4a212e754a14b0aaa5ff7e230001e75db9c4121ae7f0a9e40f255e042ab +size 200 diff --git a/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7566286eb36fbef8bca13d92a9846ed0ecdae0c --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337192f944fdfa0895b04d569971582c52c9564847e0ebdc467c4d89eeb58dfa +size 8388848 diff --git a/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d749f114f0db60ddfdae10ac560dfc7bc89f32fa --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310f8db356f220727f9bc1d4befb82fdb409ae1b33392e42d0da41b90fc00ada +size 8388848 diff --git a/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..29928bf9d7b0f8d25e0bde8092cf60ed24f38d57 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7ba1a409c08bc9a913dc0e8e16b455f8b7d06d96f54bc497e1d78223b399795 +size 8388848 diff --git a/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39a69dee1c015dbfaad86dbc98925eed8e6a10e6 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46da84f0533f01c3b29f6d675287210ad0d9dd2a5f9663283017726c986780a +size 8388848 diff --git a/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bbbdda6837048ca70f4923f38574f2da473fa72 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93b5a18d15a663f29c4d7b96895cab4de5320e12cccb76585a873afc2c4c598 +size 12583264 diff --git a/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..98dd4a1ad1a305c1dcd47f5bfecebfe0d12f22be --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50536e0cc68b9979d548d041068da05bb8fb4fdb83c586544792459229dab35d +size 12583272 diff --git a/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..15f2c93f9e438b7b77ce8f3002f70358fc3dec29 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ae7d4e5c96d9abe4c6f9be41f74d7f48c87c3b61ae43f3171ffee740b4e35e +size 12583272 diff --git a/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ef71c632bce65a574501687ca4b8bae917b7356 --- /dev/null +++ b/model/model/decoder/24/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d8ede9082c6dd936a7971ac9ef4244f87a34287e581709788b2fe71cefd6a6 +size 12583272 diff --git a/model/model/decoder/24/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/24/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c516a978dde0fc9a742a6e721d14328b34fea4b --- /dev/null +++ b/model/model/decoder/24/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4caeab0ea71dd87230f8a7c6c3135a8b11abbe29f82cd103ca177d4e0c7465e +size 8288 diff --git a/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94749cdcb9bb9c3a1e64c20849c3eb5592c077b2 --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55ddbff58f86afbf3f1d30d3a6428ec16d5ec9a03b3fb9a645e2aed207614ad +size 29360368 diff --git a/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64c25c414d5453fc56a76e1d56b5ffd161928a3e --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d0c5a05d4536724a90e4e460efaff25e53e59b958eb306312d4b1a42f5937d7 +size 29360368 diff --git a/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..842a8af68ec20cb3d58705738ead67c37fc77bd7 --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5982b7455ffdc4d144d306c10903e01d55a4fe69db59dd491919c6cebc5d72 +size 29360368 diff --git a/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc9378f3d40932a98080e61fc584415ada957a41 --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bec28527aea43180865ef86dcc529e1aa9ce5d222d2856dc5aad7ad15ecc4c3 +size 29360368 diff --git a/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..769ca8e08f4bc2a56792c69c22c8afd29df6d035 --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106b10b46fb5d26c99fa43fb092d010259984c340b0c649d8423addd0e096d39 +size 58720552 diff --git a/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d4c155c44e4479ccd3119ceca7d2b076dd2a71c --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97399c6c7fc2701890d9d674178446f78d6f3d25614970489c2381f178f533f8 +size 58720560 diff --git a/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e6e4028e956aa0c7d06e03fa71abd73fbcde9633 --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9db7f60c3dcec074d8a6a5db27a20c07bbb157b69c90bda935f55b25ae63213 +size 58720560 diff --git a/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37f041bbb8b56c7cee128c09f6b639edcf98ec31 --- /dev/null +++ b/model/model/decoder/24/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0268f1aa0073a96711af5588fd96c9ca3ab6fca38c5a6872e814c257ab74f186 +size 58720560 diff --git a/model/model/decoder/24/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/24/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23829c8b4cad6726fc129ba1f2020b44440aa003 --- /dev/null +++ b/model/model/decoder/24/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2087fa9dedffb14fa7c4a7dc7fe1e8d8e39ea12796ecca7d5204f3db9bffb0fd +size 8288 diff --git a/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d527ac1930b009b84cd605ebb6fdeba036c63690 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7b2d85039676833be44990ffd06f479a3c7a9c480a6fc45355d3d2cedcb326 +size 200 diff --git a/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..975ba3027e0b673fe7c2f544f3a52fac44836e65 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f63c9cf6de9f666041d340575b6f1f390b30c82e1f8ac2ab92147e8ef8de47c +size 200 diff --git a/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a9ce0318a53957ff4a6e90ee69912537943f376 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2249e5154b2f270cfb32b7eb1768ba924129f003998ee3ca2cc5071ebf9130a6 +size 200 diff --git a/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ec69b8d78870fbf1170c19eb02977fc7cb0c937f --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b364eaaf0e97f98239b9a3336dd5b39bbeab402c67200275222f267d3269a9a +size 200 diff --git a/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c14c4e2e0d3685475f5babe563db7a0785e1530 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e25010dbe3131998936f140ac3f7aea3475803f6e5da9bc5e2fe6e1cf7659c +size 8388848 diff --git a/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c7da84027f79b956037570aaaa7baf52356aba3 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:615d7f4efc8f91af57fddfd7d39766eba571438d6ebb6239957a06a32c6456dd +size 8388848 diff --git a/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..253f553f337b17526870e663220c726fd396059f --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1df68a05c1d97e2466e065b2bf41e9432ed4225c04bde553ab8e76fbfb916a2 +size 8388848 diff --git a/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab7eb9fb23a23d67004e9bf7daf46bc55b339033 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98181b5327cdfeee46f3ad4411df9d3cb93e1e386ee8985fd04581fecd24061 +size 8388848 diff --git a/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..95eba696e95b18783f351f0ef1240dd253d28004 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7637cc920ede86fc304ee723da5bea4a34f0f69094d6116d0558558a03cd5050 +size 12583264 diff --git a/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bf2f404f66ecb6f244f062049d9d088b281f4a1 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f02baa349149933d8ee48f8d98ca6f989eca77ee9bd5f2a03e81c5f462f38f21 +size 12583272 diff --git a/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9e6532c6c45397c5207c58a71b1a70be7d69f847 --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794bf4de0fa517cb967f5228f2a3b1a13acba581e35fb61618dcbb8df6486add +size 12583272 diff --git a/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f91759f27683a34090d5f72ed9085dc37dfc416a --- /dev/null +++ b/model/model/decoder/25/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1031e8ff0dc4b403f263d004d9b99f746a864f97f0384bba87d2506f732472a3 +size 12583272 diff --git a/model/model/decoder/25/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/25/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..faa9f488599f4fa4716487ff770ab3db4f5b7d39 --- /dev/null +++ b/model/model/decoder/25/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3731020a08ecf61e1cfdf45dcc575c6f36673403414c1d5154844897dd1bbd24 +size 8288 diff --git a/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..24494d4a80c55d5e800940355821f95d3657cf11 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee27f7e8464fbcdc4634bfccf4c2b28e5b83852b4d21c92429b2ca06a2b22a4 +size 29360368 diff --git a/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fc2464798fa44b254443e2e6c7da4273e1264513 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7cd9936257ed9db965f1cca1e41820fb650780f9849c025723d1f7ca72cc2f +size 29360368 diff --git a/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2293723453a0aa73bf58b2c05933c071472f9541 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae64fd5bb154efae23cf8d6d98a495ef3692f2e139e5a4eb0603b92703d755d3 +size 29360368 diff --git a/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f5cacc2740c3cf56f0ad72d75aede28b13a20993 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74dc6e12c4dec2d1edcc74fd8276fa81217f4d66e21b1c4b625b6ec3e253aa6 +size 29360368 diff --git a/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4e7767fb6e91cb18cb6441324bf8df47cc4b4d3 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5622eb21e8c6a0454c771a15c5b036c4bfd41d0ea5ffd160142d9b58add9ae +size 58720552 diff --git a/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f718d3f4330cb9a577335aedcc8cae9db0ff4349 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4813d10f907955f509cad4ee31a7445d095819c3d102b10da8dd1887e30e9c72 +size 58720560 diff --git a/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4a2496502d06780e743315c9ac0cdc42f8542c86 --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a28ebe0e0f25ac6618c250221a817b4f93c5e6ecc04cdc4fbbd0e5237b46389 +size 58720560 diff --git a/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07e67e0e11857a8b2983aed035b93ee22055a97c --- /dev/null +++ b/model/model/decoder/25/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82077046627f52230dd9d67172f6c0307066523b203ce72ffd04b7c46c7aac9f +size 58720560 diff --git a/model/model/decoder/25/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/25/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..002663ac923cf9ed17a1f72a75d3c5e84c0352ab --- /dev/null +++ b/model/model/decoder/25/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc56a0d9335248de74238b31c9231c23b491236ea707f47f48849e4448594ffb +size 8288 diff --git a/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64084469af374336fad42625e897e6868e18cfe6 --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2de210871b0ff7c43cd2c765de56841bd3c45debf1fb0de0fc1766bd32cc58 +size 200 diff --git a/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eed7a33360e669e8ac2d5dc801c436896060bdcc --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc1c70dd421bf1687dd7a51507437c531689ad3ebb2e7264c19eca79a549ad70 +size 200 diff --git a/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9d58a83e996dd392a66c67be2bd0cfccb1a2c475 --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9624536e94c1bdc41e07c6c090c105fa71eacc0adbd51b42a35adb3b1cdab5fc +size 200 diff --git a/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..25b9ec8c03402a6ff976edd0a46b470d58de09e0 --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c1e78302c56cf7d7f8218a529a4151c56c972d368bb9b3791285754d6a8b10 +size 200 diff --git a/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b018adbed066c265f75cc3a2715ec5493276f0cb --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae65c4aa0c7dbbe1afb6671ff73db376e3c8d86eb017eb97a9203f41213f0f25 +size 8388848 diff --git a/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..564cf34a004cc246d120bd015bf4c5edd420b4c9 --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c87c0d81e3ee1349fdbaa438fb997fb2db25b036ba60a0543cb3b45b68d89df +size 8388848 diff --git a/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a14dd580ba7eebf9a5847374481ec8c8b5b63d2 --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b26c3b852a32da6dc7e46266e8a8b8c6ccb537bab366ab162bab07358f478a98 +size 8388848 diff --git a/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..340354c4187c0d85074348ae614704e03fb8fe6f --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8db49c5541f0c6b73bcb5e6c55e9915749979702526397bcbd01632eaf7fcc +size 8388848 diff --git a/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a59df61955e2fbecebff74ef8c7c7b61086c49be --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78aa23c2880df19d66c797a6488ec7b86e10bd8148d7c3d0b67bcca7b22ab1ff +size 12583264 diff --git a/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..783ba88998f27996972334d9a30501e0af23baae --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:412e9010af79847efa6e0072dc044e6e59306c66f2b3019372806df41055b185 +size 12583272 diff --git a/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..832d9364b47ec3de819f73501c517da960af3a35 --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f001451132ecab91d40ce8b33e99afedb62400a119af729fdece5f0bd6454f3 +size 12583272 diff --git a/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42bbae8b0c8351065bf6abe04dea61e519ef0e2f --- /dev/null +++ b/model/model/decoder/26/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fdb5678c45d15ea2e2bb58fdcac01b95b6103dc55eb06b204dcc1c0a44f95ba +size 12583272 diff --git a/model/model/decoder/26/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/26/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34dd82ec84a7db265c05cb22a82995f0a324b239 --- /dev/null +++ b/model/model/decoder/26/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71432c468f41edc8ab117b55601ff83682775965da8162afdb2f946fe16453e +size 8288 diff --git a/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72a66de264974e6f6493f9bbc61345500ce034f8 --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79a55cfde2ea9b2e08510b9b73eeb6f7762729db244ccaa4cc7540cd6ef3fb18 +size 29360368 diff --git a/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f536b01a25f4aa887754f7d850f3afc18e11a135 --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ec16a089b3385f71a09cb0e3fb1250202b848f6d52ab99fec85fd4ff2b062a +size 29360368 diff --git a/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1254e3a12b96252b21611b88242cd4a5bad60987 --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb2120ac2bcf1b2d24fe66a0e5a5a0e70ec4383bca3df26dae0c3aaea8675d5e +size 29360368 diff --git a/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee5ce62ded797ae4e3dcd8faa13d64bae4b424e8 --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a578781de5240998b75476034cf8c5137138eb710337ca460e3eb973bf445a +size 29360368 diff --git a/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1dd5a0a06128a8529f4ba9805d48a170b73384fd --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be074c61f6d1c4cc22940e3b0fa0bfe960910f630ebde536a99f15b8503820f0 +size 58720552 diff --git a/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..054a60f80775fa37ce4bdfe43eee0f4122747312 --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b6e83dd6d0226573d7ebd2f7dded44e631668fb48ba49bf37c97f8f2621507a +size 58720560 diff --git a/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a12528606a46af6a2bca55bed01b791f2e096c45 --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a30291ae27f109f429e2d31d34d9d2cab2d68827e7456f0400b7206daa85f4 +size 58720560 diff --git a/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b75712904a6f7a76af9ec22bc202339b5a5ec4ee --- /dev/null +++ b/model/model/decoder/26/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bdea76ef9f7e4407c5e7158379b5a966f80b844e283b2fe06a339b0751a7faa +size 58720560 diff --git a/model/model/decoder/26/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/26/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..376218e5a2f8a31d95297a09e3886a161bd94d04 --- /dev/null +++ b/model/model/decoder/26/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63eb1feab223357ded7adf30f865991e057e862166e7517fe10c478c11b2b9b2 +size 8288 diff --git a/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..361d58a370dddc8177fca6e6625fde30dc9ac62f --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8363f778a00d30de41ef2536de15d3c8a59870061c997fa9bd645a3928920612 +size 200 diff --git a/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0f72c76120812dc88a7ccd83c4fff8f5bc558ab --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1065ce4271cc81ce476fa5ddc06770d895cddc01e6d21f04ca55ae34c37f87b +size 200 diff --git a/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a3e6e04a990bab0eb2b616e6ba6789ac66bc807 --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b1b239c55cec5c2dea0b0737731d8b816f9d811ee534b2dfdd45ef66911f853 +size 200 diff --git a/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..12815ff96e096602d8b414b7bf8621d6c08b7799 --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ca88e417f6c022e0d2173056085f003509acbe11ab84b6a0c5d884a0618b71 +size 200 diff --git a/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..825ae0a46ba93707a0cfc30f95117b1be1942c76 --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc429fdc6158d0faec22fda92744dbe485c2b99e3ae9c90ae8b6b466797ca5e +size 8388848 diff --git a/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fdfe99f4cb771c2a3e6bcb59d65bab6457d4dde2 --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4341fcce9ebb05aca7800a0c89d872e6476cc5609d363b3e076872397b16cc10 +size 8388848 diff --git a/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d45e765927019c42ba892d0d0735b8767bf69747 --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c0d17f78d5e8c69c49c20be953809f5ba890fc97e7833bb315f44dd99093814 +size 8388848 diff --git a/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f5308bfa48ed792df39c3e538243acf9f20ef0d --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53fe2d2c83791e63a44f10d50aa9559c3a9ee3f11b847b98ef770c355634b55b +size 8388848 diff --git a/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b7332f76400b89410816f6da50cb0c00906902e --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3f6132a243f5efe9405fa8a9f94a104b714cc8da4143fb20e5a8ded4a191ef +size 12583264 diff --git a/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0de29f21af61e2bdb1a3976749748c03826beddc --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c3afc9081e2e218be98b402a87afbbbb41e0f1fc4d22e5978cf19b30cdfe9d +size 12583272 diff --git a/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b04778229d96c1812ac3208ffefa6e161dda81c3 --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10873218cf9b733a6d8475d7d301ea433b372299dafd8c198a6b5123b42654a8 +size 12583272 diff --git a/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07c9f296c89cd4fc6022708fab483f33fb1f184f --- /dev/null +++ b/model/model/decoder/27/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c5112e85592ed1aa3b26de3e4bbff1b72b32640fb42e983d1db366b526f82cb +size 12583272 diff --git a/model/model/decoder/27/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/27/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..321fecc8965ddf1356ada0e529296fc63d994227 --- /dev/null +++ b/model/model/decoder/27/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405e50fe03b001f977d0d119fc03519a299946d0c3cdd4b2b0046b036ff8b5dd +size 8288 diff --git a/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac9d2307ae1dd450169249da6c383552f3b492fb --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d2689ef3c92127b01ffd97995fe090ce2d16bc676a0930f28d2e032c8b2f35 +size 29360368 diff --git a/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b96cdef6abde4e9863c22689c76ae207a736ef9e --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436d29e8678f81a183a490363b979f18ab5be0f4e6e78141d484560ce3619e97 +size 29360368 diff --git a/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b427a1f8c184602f6b47dd9d270a0288241f72e --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7458fb5220dff27fa029433d6cffaa3030d5b00f19bb7814f8c40bc44303871 +size 29360368 diff --git a/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a6739d47884a6d8cecef509cc298a0cbbb9f077 --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c9d088e2b2ff483245dc07ba329eedc41b0ef098ad84b2ae259e31654289b3c +size 29360368 diff --git a/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2402fba27dbd5c6d250a346b074fd0263ad8ef9 --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36212d6a436da7446d3ea28a23a703c3091797b25c02e1a42d13f41e43dba9db +size 58720552 diff --git a/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc3274ca328db3c602ab4a1657f1252ce6a889e2 --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc6794de8154e970a6cd9e78c85594c29eb8172d1aa06193abc96ee481587c3a +size 58720560 diff --git a/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58a681cd44a5e47360cfc1515558f2944bbbc7a3 --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec439ea1028cb532b0a4167287dcef0f671c42124df4c2b088dd7e88ab1e5511 +size 58720560 diff --git a/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2de27ac3b0be6fcfbb7f3ea5a73ec8c5c7c5ea8b --- /dev/null +++ b/model/model/decoder/27/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66bd140ce4fe21f5f0faa232eb282676bdb6e0cc75f58775f4b4d557191be5d +size 58720560 diff --git a/model/model/decoder/27/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/27/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be6e1de6b18a8e2d3095fc94f508a5848edfbdbc --- /dev/null +++ b/model/model/decoder/27/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea932961fcc57801d74b567161f003a23156578075572ce28fd5113d92fdae2 +size 8288 diff --git a/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9055f32b8ee3f344a758f7ea84eb59dce96f6d46 --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af7f455151a7c904649ce19d48a4c8774d0a13003706e94c44f64520544cd93 +size 200 diff --git a/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..859884681ae3a4c48f698794a0e726db08b8711b --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510a82977d3724ef425bea64d0592a4b21d360cb2bee17ed2de635f294c8a0a0 +size 200 diff --git a/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5148efc103df51f235e7a783b6b3244563d26e8e --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b6974d15f126da93a2311a8d2358d0c59ceed7c1a0af8125894f7bb8791ef80 +size 200 diff --git a/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3de70d16da51a4e6a3bd17d3961100abf9e463f8 --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34fe96c8ffc0b476a5a8aee972536b0efdc260ab413941733630da8335a10b51 +size 200 diff --git a/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a13d9827b3f61c74676ec25b9badeea32893476e --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e8645f496108d50da867812809651c854378ce67aa30529f72adeb8ef319c8 +size 8388848 diff --git a/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc063bfb232085334281880e71266504ea7ec92d --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121387c2169aaa4ac616ebbb03bfbc210241660e0d6fd5a7c1b0d92aeb3f0d15 +size 8388848 diff --git a/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23e1769c7816310d65a9e8254a67fc988651129e --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4105278afd8df50fb2fa519c5c5cedcc9efb916d4e05c833c8dd1321aeb6de3 +size 8388848 diff --git a/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d49ae8d8338fb923ab89c67d037613b1eee0909 --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f4cbf249f4d9905653c692ab7a55f98509339e0a7d05ec696b6730adf34cfc +size 8388848 diff --git a/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db7c4c2c83161ea208c121757c3d3817191084a2 --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942421ea09fa7270b74f5c04616040e7d34ca51d5a28dab3544a85ba1255231c +size 12583264 diff --git a/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06c9081f469aa31256d3d6396d513a34cb623660 --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adc70dcb6428603a7dfec9a3c741ab5f8f850cd080ecdd86515ad89020ffb96d +size 12583272 diff --git a/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ae65d7c992a772c1885804deb7d882b3b01e56e --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b1c8bbb5ef2e107d5dbc82e5b7cee27209629bd65a7af901bea39eb6931d79 +size 12583272 diff --git a/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0eb0bb18164cc5636690daf9b4a867491e9d61fc --- /dev/null +++ b/model/model/decoder/28/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b108090238f5cbe4dc4f8fd8ac2750911fb70521036499a68e1301ca371f4c8f +size 12583272 diff --git a/model/model/decoder/28/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/28/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0589c3a4af0769aea9968e55684c71bca1f6874b --- /dev/null +++ b/model/model/decoder/28/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8dcd4aee769efd629bd6c233615a8fdef02deb45f1f8539beb7d1c45235e1d8 +size 8288 diff --git a/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cdc5d711bab76cf9c95585871dd50c7cc1e2575d --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2cf608ba2b895e8165fca4713162da1319490244eee9578a339115e8e58c940 +size 29360368 diff --git a/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf46b3442fae55a23283113a1b510b132f1ffa6e --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740634f144f9eb931ebed5974eab6fd587238028c6ec1989e47a65b4b435a935 +size 29360368 diff --git a/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..70a1585e40ae6a162da12e19a82071da7a31e491 --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5270ac55b8cb47172e08ea7f49c8313dc832d0a81937e570bbd4b732bda2d5af +size 29360368 diff --git a/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..167e635397eafe1bb6d712aecba3a61213404869 --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd228ad8ffe00fba311746045bcdbd63467187ed588381ce616b7756799aa1ee +size 29360368 diff --git a/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6ac5ff14e00bdebab6c0f59396987ed554e1988 --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77598b957b9a03a0dc9859bbfdf20396dde4a7dbe19c74a924937d85d000f7ce +size 58720552 diff --git a/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc4485e8dcf77e276fe3259b4fcc364aa6585670 --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff5815eccf435047136ef2eec055002e6c3bc3efcb96274690b373c1163c6c15 +size 58720560 diff --git a/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f8a0efd66692b69fb14dabe07a7efc32763d95d --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f12c7d7313446c7ca379d824f854ece7426c835371bca6ca7c306a64f2bbf84 +size 58720560 diff --git a/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..051fc54ca2f6daed5f70e2f37aeac880fc39869d --- /dev/null +++ b/model/model/decoder/28/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714a8b492b627444c1685dd2294453b6ef8a36376da166036825d30ca8902a93 +size 58720560 diff --git a/model/model/decoder/28/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/28/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cb1e4de0356b2921e6744b8d635f21811852e6d8 --- /dev/null +++ b/model/model/decoder/28/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe7b98a1d5b086b28b66f4a4c03660d8103f23d98ea694583b314ded8886b895 +size 8288 diff --git a/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d386e02b5aedb67b7a6f8b15549dc7855902f8e7 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b88215668868bed27d47d00c818e0f080e47d5d912d18254ac0018906f9cdfb +size 200 diff --git a/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..781a11e141b61f578298dfc474f184fae7d5df9c --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc55555343191f81ccfa484df9015d7b531a08fd943d790384ba09d8fcd6da4 +size 200 diff --git a/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2fa3ee16170be3bb33c60b1cb2b5ee2c333d1fb3 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317644ca5e037ce70df299366acc37010ebef46e341bd172e3a03c28e2d77d49 +size 200 diff --git a/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..568dc2c515d1983a25c1a04820bbfbead8d96d19 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1737521c5c56bce6fc88c66131363f3afee4589ae6dee577016910147f3a7d3 +size 200 diff --git a/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6bc4b6d2a113f64c143a7c109ac7d0da333e819e --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a99c1f8ca2a4f8b3e4ebacf3720f64f68b23c39ca1cf210c6e41ed9705b91d +size 8388848 diff --git a/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3fffc98172fb706b6cad044f4a3788fae3bac2dd --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b06104a4dcf6ebb37543437bd90d8002c7e84b555064f5e4cf6683920d7249 +size 8388848 diff --git a/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee9afe433b45224a96e67e00411f4bacaff13195 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4af1df880433ce8daf79c933517d3deba47d89b2b10cd0bcecde74f43263841 +size 8388848 diff --git a/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..587b0b5c733ffb0846ed27e4a12544a4e765d249 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0fe35f782e91619f57a11b6fc0f4c91ec3fdab371d51fa11eec54fd8aaac36 +size 8388848 diff --git a/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32a41ccbe052c728472d7a428a6bc2d787e47a27 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ade8e133a7dcae2ef64b36eb852e180721389e53caad6da1f4dbcb60331f5b +size 12583264 diff --git a/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..79702523c164b5eb4db380fe85c375969532f430 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fe41b26fcb148345e9993052b2a6699594605f0d2d86978f27c9eb61e5b246 +size 12583272 diff --git a/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c5dcc6142077dc92c67507e202c3247f78770bb1 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84f90e8d4a06482737c1b18c46930924decc7bacaaee238598de43f3d94d303 +size 12583272 diff --git a/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92bc2384460fa1739d7ace567ff28805fb38f302 --- /dev/null +++ b/model/model/decoder/29/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cefdae74343676011f4c977d2e6b11d5641b71dc4a5c6fa3bb53ffe8924b272 +size 12583272 diff --git a/model/model/decoder/29/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/29/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..133615b96e73482368281df525bd9cc1730ba8af --- /dev/null +++ b/model/model/decoder/29/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738471af3815fa9b084ec17ff060af23a60a46cbbed26783bb84f62f6b23c217 +size 8288 diff --git a/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..348dcd9bffd5125e60293cfa306c19709d63a594 --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e0918febc37d4a0542071a5af2bb5110a0eab81b5d2bd1ca3537438698e963 +size 29360368 diff --git a/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..73e45701e82a2ffd5109871debf9d9b4fe513900 --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b278d9e1d95bd5a5bcdee26ed68502b354d6665385ced5d7af39e905887e6011 +size 29360368 diff --git a/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08c78e5393f7018239d70bfcdee7fcf61573c7c3 --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5cc18a469ad4758ef93caed51dc0facd00c354ab5c69cd1af227c1ac64904a +size 29360368 diff --git a/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..249ac75e3c598982c1692b42a85c762ef4312326 --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5720f4478346914b334758767d2515843530a8124497746f5fc4b62e761c12 +size 29360368 diff --git a/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a07286257aa2bf32227bf74d28f23ad8afc3a12 --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144991b36e3d6370e97cb8c42c88b8f425a450afb4c83c7cb737da11d886a4c6 +size 58720552 diff --git a/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f83b2b8884adc31d2c0b6894139b670013e3d041 --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e9f596ea7bfc5509eaec005c630a8950e1aa43385de841e209f5ccc6287a2a +size 58720560 diff --git a/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e50a780709bca9a8c944dd316a23ab30d76fadac --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4785dccfba5917b7f53a1913f7bdbbcbdcf93886e7f93e3ff5277b099486329 +size 58720560 diff --git a/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ede58a9983555223de2697ca02b303ae3364c3ab --- /dev/null +++ b/model/model/decoder/29/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a178bcb7085573d36f4b6a1e2350ba6eafea33aeffeca86e4e6f034e2a9d188f +size 58720560 diff --git a/model/model/decoder/29/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/29/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..813322e8e2b7573dd8117dfc4a4f00ef745bbe98 --- /dev/null +++ b/model/model/decoder/29/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ac5ebcf983a78506b3c04cda676edc8622555304f1c505e2d72d57f1c0ddef +size 8288 diff --git a/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f0c940eca5bb9672ae6fb6c971faf40f54d94bb --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d478396eaf820aec433eef3f185e818c6b33397a732add2f7f8b2db83dc2256 +size 200 diff --git a/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a19b2c61bb024078b65efd33df98967696155ced --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17dc6728acfcb10e673161e7cb7709bc69e0f2d4764a9fa8c585eaebb513f27f +size 200 diff --git a/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..375dae64d78ea7a3bf3276d6054bf91427269af5 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb278704ca86385e67a90a24bde7d408b59dff4f11c5f75435d0802eed32601 +size 200 diff --git a/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8fba9ae3c1e66a43fe368d36b375a8f9dcdb1c23 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f536568f8eb696312af6eac81ff27fcccaa8277b0453fdaa605dfb4c570dcd72 +size 200 diff --git a/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..adb28282463087ffc6571aaa3561ada90753813e --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890ca6f738f2f3aa7570f9195d572b592585f3c28c0fd9284fb508e58b19d15c +size 8388848 diff --git a/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd8b1b064aa1ec5699806642a562ee9476ab843b --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec720fba753858fa5c7a3849d0c80a2261eb229f75a5941a4dea92efa5bf463e +size 8388848 diff --git a/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..df2d7db6c3ae149fffea2b6bcb016bd4e03d77d2 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df26eb9099fda441e84d242c0ba736cd3089d905ffc390ddc61ac9d9726c8e4 +size 8388848 diff --git a/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a6d29af3779ee5cc034318b7739ebf4ee1a529d --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed1899dd3079490afe65e2214caf382e3265877b9b7d257102dfaab1cdef8266 +size 8388848 diff --git a/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09ac419b01816bfc7b4f607561f38ffede205888 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b9e9cb282838e36f6b3ab52758e6a7bdaf14858bfa34ef3124d73b66fdf7b7 +size 12583264 diff --git a/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..54a4724ed255a7fb803719cb1db4a51f66132898 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:990c639ddc36620cc87a4a15f6449cc5068971464b9bdd35ec0c5a15b9bbffbf +size 12583272 diff --git a/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a741ce647ec5c6d8b69878516934b2d672bcc1f4 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9fd5774e21e511e497aa2a67e41dc848e7d1ee134a3851477c29e69369942c7 +size 12583272 diff --git a/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8756d24320bf4b01fd9614d73ff29f870254c164 --- /dev/null +++ b/model/model/decoder/3/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55a2531ebb937bf67c9c4a028f5d587663cf47c414c14d1e6917bc79c0aa40c +size 12583272 diff --git a/model/model/decoder/3/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/3/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7fdff466cffcbf2d02c78635ef0b22eb678aa5ce --- /dev/null +++ b/model/model/decoder/3/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5fee77dfeb65e55c95a96dd8176f06d706cb718f2de148cff28a16aba0e70a7 +size 8288 diff --git a/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6b68a4de3eb2413b7cebe10ca137d1ad9a745bc5 --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e60ff3326ad26d2aa15ef875154cf12aa0dcbd218df7bdf3b868309ceb20333c +size 29360368 diff --git a/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c2448d211e8da87b3c66c21832e3091c46b0f6e --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e6c06dc4a20f64ac24673535a95f09190933ceb3d4e7cd62cbf6300630c7a0 +size 29360368 diff --git a/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aed2a32de39195eaaf8fbb7528c396c4e85390aa --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fff69a5e5a302ee6391f47ac61250c8a76973557934bce870f0971a75590aa5 +size 29360368 diff --git a/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc1dae9a7ed0fe56985e05cd01d10a171b4da061 --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ad8c2afd12d47eb215eb22ad6df852dd4773f9be7813a905b8e059687ddf2b +size 29360368 diff --git a/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46d0e54231603dbe72ae8d46672672945855096e --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8ddc008502e0553eeec505975ae7d34564ff4ac39ee7bb0ccbf0172c1465cd +size 58720552 diff --git a/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d4348e5324145f5cb6b62c77afce3e209267a36 --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a9086167b66a0b163548707a17c33a580e007c5f2ae8b10cf371bb14890ec1 +size 58720560 diff --git a/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c724398f2584a4359e60c45beb0022b96ef1105 --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cada3a7678e5a05754084e14c7807b13316c5cfec76d93843667d975a426c03 +size 58720560 diff --git a/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c38141978268a0610cf1e4187c712b095ebb39fa --- /dev/null +++ b/model/model/decoder/3/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c316d88cc3d8e91fa2d60e9efb98f1bf0a837fb93205d6bad71896827a5161 +size 58720560 diff --git a/model/model/decoder/3/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/3/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92c9b1ea54d0c8cc35d5b10c1cbea6b82ef717fe --- /dev/null +++ b/model/model/decoder/3/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f3ddd8d6b79cd56aa167eb8fd966acc00f1e2edc7535beecbf6d288bd1072a +size 8288 diff --git a/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..85566d2d3ba3b1c84be88462911b709e25d81aa2 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:923df9e4c06eaf086662fb2d1d7ef1b60e8d45a137f6b7e48c77dbaab2024936 +size 200 diff --git a/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..73a3ec7fcab03505776da577673ece63d586edc3 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ae7a3f4612406200959d27a8c8422a2697a0f15a3471a297f9e5ee2590d150 +size 200 diff --git a/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..646ed83a07dfce4751879c8c44eb8dc2985fe638 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e134e45b66882958000847603df5f5e1dcb18aad2985537c5a958d46041d6bf +size 200 diff --git a/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..500c85be7bdb38c8805239c5fdf8a194f80f4088 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2951154f77d57183ca47ba48180494953a4cb001f5b1b3fb941e08c8b8d990b4 +size 200 diff --git a/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..453a627ebcdca610602298d4328c9380c4cc44f0 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f86eef2bad81b1d261ecca189b18f6e9d7df4b928d02e6c93615bae73a945356 +size 8388848 diff --git a/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9a73b1238b01fd44f914f808632370d721d7935 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68997bec115ca41f9daf1338ee67cce7687634ede0f6210afafcc6c94d783967 +size 8388848 diff --git a/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2d9158a9dfaa5d100db59402f09aa288542126b3 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0fb3b05f5d0426ef0dde0137ea4d15608db4ffda9b65e4954a3f19ad243172 +size 8388848 diff --git a/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e7ac53ce21467c7db4c9690f65c6b9bc7559796 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781c2f0b51f02db2d2e07ddac91d6944e335db4ea8622971a206f54c79c0c4bf +size 8388848 diff --git a/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6726e8d6a6a34b190e1b7b7d4e0c27a014a00b45 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc3d02d01a987d29607c7f25f4ce61f5f7991ff12a942e0855f83786bd5e58a +size 12583264 diff --git a/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39b0c3cd83310c29649880f85cac7c1f960ea7cf --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6783063256180fbf9933c8af868cf5c4bcd80b7e8b26be137a8f312ff83c253 +size 12583272 diff --git a/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b9d036e2ed8889c5e28971b4599d67d332dc651 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:004322b2e73f25ebaad8af5a21432f76ec54b691fae30139f63d19fae6cde0a1 +size 12583272 diff --git a/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ac5ed2178581905e5dc6214b1e4839a9ef998b1 --- /dev/null +++ b/model/model/decoder/30/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c50be1ec899de8baa5b31b6bbbdb1e78f3ccf26c01c85865d1fdf8d36a66ef42 +size 12583272 diff --git a/model/model/decoder/30/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/30/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b347ccd76ac936df4fe06295ef0e8311f7911dbf --- /dev/null +++ b/model/model/decoder/30/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac59d353c9bf92afaeb5130603e3eff0a4e6b1fc2066fd315095b72335bab5d +size 8288 diff --git a/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..404b5ed196708a3b9a4b8027fe6cbff15cdcca6b --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e3f92d6d1199cb5fd64390f6f11fd0b5cb5400f3a108a5e7ec00ccdfd6f113 +size 29360368 diff --git a/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9db696d7b8f98836c79cf4516c4ae881cf254262 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1355c017c8ec720a4f5d90f3a69263f6884d834f597935b2eada6aa779d2aa9a +size 29360368 diff --git a/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eee17b5b958d69df646a03a43c8543beaef6f0d0 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d9ee6803e6ae53e74c521b55a88127578c3bbf2247b2ce78695ed7ea7a6c4d +size 29360368 diff --git a/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e370209bfb5fc24e5ac3faa615717cabda7ec919 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3c24413c2683e5715a5f4e2ffc7622027ddb4fee6786637f271c0a99a0b899 +size 29360368 diff --git a/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50e961a7ef2478b2652b9ceb274daddc1147b3e0 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99f3ef1836425e30505fa614c69fa44e2a354bb42194de524037098a2948ebd +size 58720552 diff --git a/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad8442137dd333bafb87464951211a0713aca415 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6c702e9ff8c6bf75b0a60d61554c9b2775712edc9ded8660e2655e3725476d +size 58720560 diff --git a/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8dd7ef1187a24f4c1c82030d32b8ac6d8be24a2 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e922fb6b7dbab65419fcffd8df8819795437e7daee0f4481895400f813eab5 +size 58720560 diff --git a/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd6fc507aa6fb15c827ac925bcdd8d28e0b20452 --- /dev/null +++ b/model/model/decoder/30/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0534b40ede242fea342ac67e54bdd4baef344d92ca91381f0b95b4df4b4e6b19 +size 58720560 diff --git a/model/model/decoder/30/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/30/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ffdd3d8f81ba325e29b0fa69acbdc56a624d009 --- /dev/null +++ b/model/model/decoder/30/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b6e64a0706de83634274dc0d051dde9c9e4744eb41ab0eaad82030c204c8c5 +size 8288 diff --git a/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1bbcaa1d65622867e41f136cd4125725b19bd593 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54980d35e2cbdb74b7f2e7236e2d9d2d0477f1c5ff7fd6913d0fb155baa157cb +size 200 diff --git a/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c12cb8f2d0f0f4edc95f12069ad2a91ec0c2703e --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f8e8a649e6d492833dc572b5ccd8364df215c103e50a0400cab80a88ade291 +size 200 diff --git a/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f3a77d22c549f7762039553ed129f517cb8cfc9e --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a55132dbb44c26b741586953af1c26f639bb93cfb6f20a781ee0a9cc0fe17d9 +size 200 diff --git a/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fcb7c520127ba69e42df3d4f952de9f466bf1963 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d76860d72f600a2a67973180022ece49634ed6aec8a8284243dcc6a2caee496 +size 200 diff --git a/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d884b026c2e5e9b5feb0204c229facc79e2965d6 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9848bdc48ef45fc5f87c700396435e68cff66be954e4400d41988f87320dd482 +size 8388848 diff --git a/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4871abe8cee081080263d3e62753aec95ce064c2 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0064e104df43dbebb05eb2928f1fab643b766b1f66fb938cb828e6eddc9d705 +size 8388848 diff --git a/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e05a2ca58d87c1ba1cec02fd685a80a5343105c9 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ef046938a49affd22fff7c4f57ae3da1f7b3bf226917c955671ab5c74bf3e5 +size 8388848 diff --git a/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6895b1eb39e333b88cb30d96652748d16c1e02e7 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cab7c097dbe1d686b617bb411f3436a6a8939b634fe53b6deb267b5f99975a +size 8388848 diff --git a/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b82c6ae102835eaeeb65a3bba415c725252825d --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065733abcbafdb7920e6af7e332feb86970105190b101d831845c4166b9f9959 +size 12583264 diff --git a/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ff609647ef8593d3142843ae4d6282baeab9baf --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d959aca569c1462118c545a72b0175b1a1ada9fa19d98fab3774dbb1bc663c65 +size 12583272 diff --git a/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fcdd566892509a51450141f616378de31573dbea --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4adb45a3f0719ef1857f9b07519c6740a04b99850f85c1b0cafba3abb80a0001 +size 12583272 diff --git a/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dd52bb15a16c957d8a48aa4040f4f4fcf6bf0f5 --- /dev/null +++ b/model/model/decoder/31/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfefce8e31e3aac5e6a40ae2d19fc1320649b90574e2971fb70466333c2a1a44 +size 12583272 diff --git a/model/model/decoder/31/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/31/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f26274d398d0a1a57d90b8208c5dbd56ab006122 --- /dev/null +++ b/model/model/decoder/31/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce3921ce571a4529be069f90f8ae990304b2fe52202c13018a589c3f5b0dd3d +size 8288 diff --git a/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..54a57da56bd5b93d73dbafef2e0a664860fc145b --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86c8a37c8adc50239759efb96d3406bb9efefb3583ef118fe2c679af5db6037 +size 29360368 diff --git a/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8a11dd194ca3d1070ad1ae3478e84cf7d744bf4 --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ffbe5a705274f5b606c88f16b0ab9a4858fc9a5ec94879040429c1628cf7dd +size 29360368 diff --git a/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c97af209486b779dacf58b93ef72f74541699dc --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:229de9698139d2353433fa5f1b8a7a067d5202ec7e9f141fbe8cc8a3c8cb983b +size 29360368 diff --git a/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8b319ad02b016d163f9fac7309f485f766b6479 --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ef64224777cd2c1e6030bde77ad1645c4bfebd568e899728c319751c057435 +size 29360368 diff --git a/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..635803409780c7953ee19a16c2e1828a4e3704e6 --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cd2a64d4ed5718d1ae48420abd6ba0b5e92b11c3d38191e4a9664dc4071029b +size 58720552 diff --git a/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47e03067e86e3b668cd9d2fb4b6d187be1f5b615 --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec50c7fd201eef6184a3a70372ab10622574b22de1a80f29cc8fc8aa3edbf49c +size 58720560 diff --git a/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..99e62078b12359b85adcd86d51ec7a0f493b9ad7 --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91779527dff8711afa4713c82c5f51e77fe398c1360489f10c97f5373d02a0cf +size 58720560 diff --git a/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c039fd5a2712870ab3cec09f402f04840384099f --- /dev/null +++ b/model/model/decoder/31/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e103ef5f9cc4d47950e493b9ec4050295a7c6fdbd0f0394670c2dd6399c7c0 +size 58720560 diff --git a/model/model/decoder/31/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/31/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eceb52beceea791a93d625d3eea5d9447cd28d7e --- /dev/null +++ b/model/model/decoder/31/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436b4e41dbbc627e95e83676cc86f615e67ecfb290cc4125df2e2b0ea42fc9ce +size 8288 diff --git a/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2b008ea7910b5fb118d5006dc2bd7738e3b32e5 --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c53da48e24cb985fe4842965f4bf04bd3cf485c45aab42628ff1d8b1fe7510c2 +size 200 diff --git a/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..05cef729b193a335d306a1720fc419601c993bfd --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a39fa6a06b856b21b13fc0fe7670ea57f0a58fb80baca75bc886c7b9c5144c +size 200 diff --git a/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6b533d46c3b650518bdcdded8f2fa82c3468077 --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643ff0cbfa8d1389f80bc40318a90dd49f42cacd6e3212a42d6137cc6b7dc356 +size 200 diff --git a/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06ca280a23ee78d4cb5a4b4a1cdcb9d6a9773c1c --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520b93311eb4ba0b6a422bba2111a923934436ba334a12b520aa2c3570088a19 +size 200 diff --git a/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c1c89f31bd4d5b5dd6f3d47eec0dab33c35e737 --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5738a81d09c1d8793a2c3bcf3a2be7904f20e9dde41eb53d7ffa0a4da2fc92c +size 8388848 diff --git a/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1674f58e5850121bc0da24c38bd2b23006607ad8 --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e00926e62e16d6043af8c3bd6a2652296c7a578167ed90b765132aea146ade +size 8388848 diff --git a/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8811adf39caeeaa7d4b858c811b79ce12931c2cd --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2074cb5be2c29a0df09c1264ef984a32feb5047c8db7054924cbdc9abd6614ab +size 8388848 diff --git a/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..caef097d6a89deb1eee701ad8ee94cc499c0eaab --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c654a0f233cf516ed671657278054df69b55ed9fb33e4bf846f8bb4cd53fa53 +size 8388848 diff --git a/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7170b326392e85273d4b135efbca61db8802c531 --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3095302259bb701efd4c8c7288405dff230834601757d942396f22418518623f +size 12583264 diff --git a/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00d1eae70fc119a7a470e2be5774f56b509a5742 --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbaf06da40d2d79cf7aad9ee912f870f17ff505f7434894cf6cba6d2fdaa138 +size 12583272 diff --git a/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a2f57db605a116e27e01dd9f1a7d0ef91fd399a --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f80674935c92d2e921ddd4d49433ba75daeb90937216747a638211eede94cb +size 12583272 diff --git a/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d39e3b04d82e9e69121cecb233e5bf3a0762b75d --- /dev/null +++ b/model/model/decoder/4/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:060f47cc4c830ab5c39bc8184ea30fa26aea5907cc66370fed9920daf3048a5a +size 12583272 diff --git a/model/model/decoder/4/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/4/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01b86ef199508ccd387473b453b54e10748cb6c9 --- /dev/null +++ b/model/model/decoder/4/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee9a0b07bdf8a6f915119115756afccc11641a1a6bf80069a8929af157a20eb +size 8288 diff --git a/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..255b97828093789a9ab7d08f28f45eddafb68295 --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407fcd4674e1fdcf6f354b2e92d5624105e62cc12599b628aea23368e4455be8 +size 29360368 diff --git a/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2635eedf032b07dcb6245ff313d1d57053114dec --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb24a410609e0ccc6040b9ef896c7cf2500b0b91de82f00bc17bbcc62521f88 +size 29360368 diff --git a/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7235f192a7b8dcf38e6261b78c8d7a7c49d523a3 --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8601a8f768c601b35666589d78ad8394e3147904f12102f4c8a7fb8d02ba88ee +size 29360368 diff --git a/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..70724a64d939480c3d883637940eb7913923debb --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ea98278e042acca558abaa48747d1b642a043609d280d16404b2e9962ef770 +size 29360368 diff --git a/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1038841a0bed8641b2fe0c71c49334d3cfc2c176 --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf4b27825d6b6fa2de9e9a1aebfe718e8fc1d5af62a160bd8dd520de17ec5a7 +size 58720552 diff --git a/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b664554777e0ef65500d6dba66169438f8b0901 --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80af8d057d11e93906cdb121bc62be44269caadf4ee69871431d50797674ec3 +size 58720560 diff --git a/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..49bf6c712bad45d2247215b5cc88090dfeb22cf6 --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:952045e822741ffa29b97e4a0cc48a942430a80084d417ec1a76636b382bc3fb +size 58720560 diff --git a/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..692734088ef74729b5211468d9aedb2f5a9c008d --- /dev/null +++ b/model/model/decoder/4/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2815472a1a06c3b6f921afe7676ac16c50bc10968b83da1822ae1b7988527ab9 +size 58720560 diff --git a/model/model/decoder/4/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/4/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7eb9687a5e7726d2eb9a2f37e0762bd914ee5b2f --- /dev/null +++ b/model/model/decoder/4/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c123bf53f09b0e0ca9b298a251ed8db4c433ec2dd7e0c7ddba5d39535dba371 +size 8288 diff --git a/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f35f21cc74aacc63c2736da5bc77f370397728df --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c580c0725aba078ebbadd09f5a7b426cb025d90d6b645a9dd71ff198c1bdcd4 +size 200 diff --git a/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8d3022917949054a336b72f2300d07933ce6909 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:825dbf35b57f0d6d8653ae1d3dc40815eefe6fc1105a0bc1c28c65505c134042 +size 200 diff --git a/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5e7f0fa42af2fa76b6e1d2c1b5c597aa64e7225 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3273a48f08276c56ee143ea9ebf1eddcd68fdee88eb192c41545b1801c75a068 +size 200 diff --git a/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0510d57bdbb23a3abef1f5dc4e724bd2540ed096 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d075823e5ef7876c48473d50e6f91002b6c0ff38216f3edef76b88ec66b83ca4 +size 200 diff --git a/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cdd145480cfd930735a47190d0fd634434fa957e --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f691638445b38eeec5afdd8820b16f99e599a9f171de299b1aaf1325b83841 +size 8388848 diff --git a/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..713f45a6062f82f08fe37401a04b1bae5a949680 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db3d6d1642ef02328653d28d5a607ef6c2fd95a3d7f6d760736567deb94d639e +size 8388848 diff --git a/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c562373f5cae75564a63e0ca13aa1c33bfc16d9e --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fca925f9e28e3021779f644f8e61568e04a81ac6ce2295fafb04ee97a2e0051 +size 8388848 diff --git a/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..480abd5c8b2f1650ae1f25e326ae34786b0e6fa7 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57cb9aabb0a49e3a4b3ef3dd770e20a4d40a3d907730eb1a995da164baeaefc7 +size 8388848 diff --git a/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39890bdae56d072c73bef8aec7c813bfba53c092 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6164e91ade9f80c707337094655d3af914d87108871601e7cfe7ed09a4eb2409 +size 12583264 diff --git a/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52eb7eb3e670eb50fda1b3df0453ffa6da8f3a0f --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5acae908e7090a9ae737881a0bd852c2e8dcb2956820ef4ffb01440959c31511 +size 12583272 diff --git a/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..38e66962b7b908f48fcb3124f2b8c732cdc56784 --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254d49cbe1a6a4ff7d8013ea49eec5d0f83204aab2a4f4471d5e36b7986d8cab +size 12583272 diff --git a/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e93f89dfa4adc7e43031a9d4fe7cbabff1620dc --- /dev/null +++ b/model/model/decoder/5/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98f11a19f3ec23a4d5f27ffb6e90a727b07ccaced92b7c4431fd30bc8690cdd +size 12583272 diff --git a/model/model/decoder/5/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/5/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bcacda504bae7531c171d199c09a0dce944c479d --- /dev/null +++ b/model/model/decoder/5/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a37dfbce9c985e31133ba46b90a554cc75923ae159490394122171b3ea54a2b +size 8288 diff --git a/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53fc8ae9b333cedd8134d5d6a74e0945009239c7 --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6ca4a68a9b4264d0d611c54c9d986e2975cd490f897648fc25841c05f56ce0a +size 29360368 diff --git a/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9950c4fac35a11b74c2ffcc45f0e5175468483fa --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bcd0b75bb8322a414f831f38fcf4bac5b0dbea23f94a146310fe92f632b87ba +size 29360368 diff --git a/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..93a85a33ee50e4f5b23e549f1a0fbc9ea8cedd77 --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6389760bb66bbc211ed16590af276f9bc5294bcca69b22a82093da08079261da +size 29360368 diff --git a/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cbc41137afcd19bbfa7e72b2a6b5fc8b37529ba0 --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:252c2a27f83b69f74474cc69b14a1a614a17dda4d3d2d55218c7c545b33c8a01 +size 29360368 diff --git a/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad719da87e678a7454d6c43f6d968e152aefcd48 --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665b7550f0eaf5d5f5c614fdc20d644a37f19fd083a5f9162e204f9844c91c69 +size 58720552 diff --git a/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe0c185209b3e9e78e9ff606aeb47bcc775139d7 --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a8e442b75cdd7c251bec4904a728adabaaed431b6060a4a6761240ae8275c6 +size 58720560 diff --git a/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a9e3fed08fd68eebe0fb26f6ee63bd0eb429107f --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98901f61ac46840fdeb580c8ee8ab45bf8cee154985288e6988c023b7f3eab3 +size 58720560 diff --git a/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f6be320d505f1c91745227c56d4c101103abe5a --- /dev/null +++ b/model/model/decoder/5/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd83e3bdf21d91f6f2e0c367c22510c87071f953b6ee78606538eef73d64d23 +size 58720560 diff --git a/model/model/decoder/5/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/5/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1bd81a6569373789411a33737b2d2ee0637f2c1 --- /dev/null +++ b/model/model/decoder/5/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132c1076b543b3fb30147b5328f1670a828cde73a434d000a8f876ff226af936 +size 8288 diff --git a/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67276be33e18afc1b51d46e2051d63fed3fce04f --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:519a8de82202e69dc49528840ba5c086f60f2a688ceae22a6aa390004255d0f5 +size 200 diff --git a/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8aa5a3dbc3825e4d153a330e8c34f97179a62798 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292d0166e3605e191ced63051328b6c484bef2f95428efda2f041de4e9890dd0 +size 200 diff --git a/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd314abca250a5351bb8fffb63270ce0d9019f1c --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687b267ee6362f1bf64d7e2d116eebf1215fdd2f8d66aac2dd21d48762b73d31 +size 200 diff --git a/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..450db272f3bcb71ff4f4957ae5e25c174d8e7764 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0dc38b994a15577cbe2a491761248d37dbf233b614e79f83d6ab90e2a9b214 +size 200 diff --git a/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5694eedf010d9a7fc4cd6917075872b4796d0416 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a43bc198eba18c031fe5de519b3117b43c0af146fad16ccf4afaafc08300836c +size 8388848 diff --git a/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9cf7a451be5ac3c50963accdb8ebd710512238b2 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863917d2eb747a318996ccb5ede662bed0dd26abfc34c962d88e4764e2898db4 +size 8388848 diff --git a/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f5751931ac1db4f0392d26d766bfa6b243febbe9 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e882d358603b7ed6699692c1266ef68e4ade0c9d4484fd83a8b720b8c680f78c +size 8388848 diff --git a/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1ae6e3984d51b05f2422a1341b0313036b15ebc --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe361200c13b33e0f2178d966297abfc7e85b35b623d8453248b72a97638a85 +size 8388848 diff --git a/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..767851cc3b43a289af91581917fb67c31b3d8d45 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59fb298dae050f91f1609510c5d324f3828888688570868e1692a3519bfb712 +size 12583264 diff --git a/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..01312cf006d710bd163831a63106b91b115cd308 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159cda348ff89fba106b65aeda3e8d70c864bafe52f808dec03b2d30914da25f +size 12583272 diff --git a/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4939b466b91e8a923f2d16e701f92cf57aac7c34 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b985b6f81ad11ad7f34b8b490639bf14b454afb2190e350add18f54b2f7594cf +size 12583272 diff --git a/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..90cd94eb793a6513f4318e2774573ebc936834e3 --- /dev/null +++ b/model/model/decoder/6/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a94793bee30c736f6de1d8f93625ecc6b8335f9047cb76ddabe711c03456826f +size 12583272 diff --git a/model/model/decoder/6/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/6/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57bfac2ffaa6d48bc7c4f4b7ff9274aa5ef78a83 --- /dev/null +++ b/model/model/decoder/6/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5679eb6b7f81758ae4efda2dc65250941d6acc04cbf836dbc1e7b0d515e22cf2 +size 8288 diff --git a/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..88932fbd8687261cda20c33d74730652808fc8ca --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872bf2ac9ad5666f02352b2cf300dd45c2b6e9652899d53088b0fe80dd75ab6a +size 29360368 diff --git a/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c7880b373eadbfc6e5caeca90061157c141ff366 --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbee3df7d31cc957758ae978dd582934c2b16efdcde43d8f53bf6a89baa121a +size 29360368 diff --git a/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8cfc45e7549271115786e46ee609fcef85a6a26e --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef6d36b307bf675538aba0ce48515694ea2f05121bdf7be35b38fa50da832a8 +size 29360368 diff --git a/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7172609ed3cf5de2b5c21cae9f940586845b0861 --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8831bf088997d8180a962825ca3a8b1755b72afc8c9deedadec958a6272d04 +size 29360368 diff --git a/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84a3bc2947bde9977bfdc2011de83558e77b86a2 --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be87fa37de2be63efc7868af40d3606fb178b90ad3563046a93c44350c089f3 +size 58720552 diff --git a/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..860bd0e36ba1ad83cb4f6e2bfe737d5d283f3270 --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555527e5e96f8f0e1063e64a5a74cfc1fb19aeb5cd0950fd09d4e52cf5d6cf56 +size 58720560 diff --git a/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ffc779c696968628230556856824becb6cda6930 --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d3f90e3ceb4f4d5c99b08c3e03c79ea4b3b565d1d7e15415c2832f7a4d0220 +size 58720560 diff --git a/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..253638e8c2423aaa21b905620c68e45171b20219 --- /dev/null +++ b/model/model/decoder/6/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0773886aa20ee2ad4b49583c898dcc17c3eb11276d7d7f2f661b2a43bf7ab56 +size 58720560 diff --git a/model/model/decoder/6/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/6/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0914fccf3db33545c3d9871ccead216a4005ab3a --- /dev/null +++ b/model/model/decoder/6/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5865f10acff309bed39c2f2b91baf83f645005b4f4bacae5284ac357bdafae8b +size 8288 diff --git a/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ed65f1b812aeb2e0534e91a7f6fc0d75109e781 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7198f795b15357c1899a399634442f9d59f62f74e0b494f6fcdcb2d728e41a9b +size 200 diff --git a/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..43ba26e7f93f47b998daac22906d014f0cd0457b --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c73a05c77ca7076091c76d8371d40b6062da7f8f9601c8f4af8134bcb0cc4d8 +size 200 diff --git a/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..af954edeee6b6b4015f725f038fcc0470ef5fe88 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0403e148b3f5c77a717e58e18ff69210d18e4f66d00cf15061fc677666c6b4 +size 200 diff --git a/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3aa86d368977c134e78c703579ea3e23fe986247 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ec5f7ed87a1a9d21fc8ac74013c7b0bc4fbbc7461720c9a58b721dcee03bd3 +size 200 diff --git a/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..da11750f3f25443a8aaa30547ad8e364b8be1bc1 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aff77753d2360d3cc6ee4ed7ff25f1b6f811f4b86be0e40da630cdfc10d6ffb +size 8388848 diff --git a/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4a9f03abe2727ec246f3e352c4b5b131dcdff7cd --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2290853d2d2e08826f7781771f77dd06eef72a8481a7c8b678f5b8711f820dd0 +size 8388848 diff --git a/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..958b31ca391f4ebf0a73daac02f96465d6eaa4b3 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc0ef6433fdd52f62723b4867c8de9ceb396b6dfaaebe22e1e2e923917004f3 +size 8388848 diff --git a/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad40aafeafc8629f36a3cf953e9ce2e223eeb48a --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb833e870c53d1ea1ff84fd011c10d49e5499b5c94636dbd4855e39e47f451e +size 8388848 diff --git a/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e382b34bc129bd8e9ba6be81c284955def28376 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bffecc42bbe4bb7c49f096a523e8c380a556c1fca5563440d04ce4b749bfc971 +size 12583264 diff --git a/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..284d9efebf1898fe14effa132113fdd3ccce7ef0 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a968e14df1114a97017e5b0239f2ba8488e6b81ece3baf600205b04da6f91251 +size 12583272 diff --git a/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b91fa13188ae4f7e68a943f32e34cb64c387e72a --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffa23a5949a93bebcd5ff3a83be130e03e0da4e1cabf9e2b34eeb99a94c049f +size 12583272 diff --git a/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5dad2c73a54af9bf9e60c45c67f763a828c5566 --- /dev/null +++ b/model/model/decoder/7/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa482b43ce72753210564e489c6b6ff3d7bbf1f713fe4bc0ecb59b0cec615dcb +size 12583272 diff --git a/model/model/decoder/7/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/7/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06c6bd31ff9fc8f687e210f39a7edde9d3b9e121 --- /dev/null +++ b/model/model/decoder/7/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5662ec8cecef52b77f9340fbe431fd90c2dd8e7a54d71c56350e4a5980977d2 +size 8288 diff --git a/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f1531be116524ca20ec9aa6c223ad91eb7cff50e --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f207b0a621be835ff8ed99d67fc54fa972e1061660b01e52d9fc4e8973b0a9e6 +size 29360368 diff --git a/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1c7b5c62a3aee62a9f144ca4df48f9e39b1d41b4 --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d78a5cb826c8ff97bc4d593431501d4646f75723920409010159dfe2c54bba1 +size 29360368 diff --git a/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..15a451490d566d970d803d36354e1403fdb090c0 --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82088cabf16c29d7e46865a531bedf8ca8da3a4ed15146506242693c3976509 +size 29360368 diff --git a/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63174616e5c2186c51128286c37c382d4bb64bae --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774b76d8d08031b05c5c1b4121a4c5fe43df11a6ec22b1b2982170bbb09a2200 +size 29360368 diff --git a/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a6f020e0b7e8d5338a80bb66b609d3c1bf6e99ce --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d7670dc4b063e5ef4ea7c5b82e5fde2cd80bf4430e377fb3f24e9f4683542f +size 58720552 diff --git a/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd422b52db37c85cceab8ff297d90ff093a04a04 --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6aecd2e85fb19d45849dd94ae6161a5949cb0adb261097b9ab7c7df23f89774 +size 58720560 diff --git a/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69789784bf4e62aadcc30ddddf28e4fa16e637fa --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573a02daa9a97f419c75ed3719a4ed3a12427c798b23629c0924433cb42d706d +size 58720560 diff --git a/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..086b91561172cba2f9284fc6dea81321177076c2 --- /dev/null +++ b/model/model/decoder/7/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e3d194dd6dc1637e0bcd2827c61df81daa797371f59a8bc8a30f1dade5d39a +size 58720560 diff --git a/model/model/decoder/7/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/7/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0e2c3c42fbaa257ca4b559e9ef0ddeb992e3fdc --- /dev/null +++ b/model/model/decoder/7/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6657b35f48a5f9294947e4f4296d7aedb73d0a15a94d6ace4d254133a8568f +size 8288 diff --git a/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0f432b150df5efe99c3df9667817b017c5514f3 --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fbf4cb45c3675ca85aa376821473a08f12d39cdef6a8826d02aa2fccedaeb2f +size 200 diff --git a/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de100832126780097a19d46e29f1dfc0441db572 --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d602c776ddd6406bde96dd5a7c07832270dc6dcb53b19fc1079007a7e00a7e05 +size 200 diff --git a/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..274b7a12853f0994131c83761a8c02ba7b1ce31e --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6481f201ae778ae12f244fa494af5036e443323fba6e3ebfff8050f6fa141815 +size 200 diff --git a/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..155954bdf6bd35cc3d0707c2b670fb7c8a7e54ca --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a3b80b75bd20aa6f810fd88aca895362ccad01286889e50ed42a157a67b4d2 +size 200 diff --git a/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e537caabc77b61b58743e1c0c75f2d8a7b618c6e --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a76703629f02600e69f9bb298c6f44707fa50a9d2aeee4d5760ce6306e26be17 +size 8388848 diff --git a/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d312aee45efba1d1b4f3280eb17981a078f6f6da --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4baf261c1a4f45738730dfbdc2aa4a5890381947e042174742cd5ab49cec90f7 +size 8388848 diff --git a/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f960c2483404679c1e043d6f3b7ce8b83f30881 --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93d653300d3945509996ba331ac74a3c88873d78b70e7b88815f917f3aec507 +size 8388848 diff --git a/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37e91503577254b5760003d25b91b104e7146ddf --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f11e2dcb90bb27b926e0b3b31a3b743cb8038e38cc54967cfb8e9dc70e701e +size 8388848 diff --git a/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..07e76101af1c3cbae6e9e72fb8f8f48b6dafc5db --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8b0b0b9bbc5629ab29c16bf0da1750804e4ef91c985970b6db9c67eba7d630 +size 12583264 diff --git a/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4751aa99836665a3a8d03a493990db6eb43d8353 --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5b4c0cbd587926284be5292b518f11126e72bf5160b80f9c70c5374c3d35632 +size 12583272 diff --git a/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..295a881fdaea485e35ea567832a070df31412856 --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c018833f177e95a058d2bba1d66a330a0ece3aa549ac1a637fc3b9087a90e6a +size 12583272 diff --git a/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f2a65122c93054a947cb3ec23fa6cd826068214a --- /dev/null +++ b/model/model/decoder/8/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e05d4ff22ca729dfd8d02360465aa07d3dd26d477824083fe5ac9eebfaf9f8b7 +size 12583272 diff --git a/model/model/decoder/8/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/8/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..115755c4f8a151a7c348526dfc854cbd4049a015 --- /dev/null +++ b/model/model/decoder/8/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a98818c3845ad44427bf3ea51a9440cabaec2b52a817e302f8e6841cd573cd +size 8288 diff --git a/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3cfdf271aa074a8313485ef69b9f560956c711f3 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31d92bf79832f061cc5a91c33b1c645c72321c3fe991188bd861573f5874dff +size 29360368 diff --git a/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..92e21a185f4a9e9d9654a326230e7a58901b3309 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd5fb7f80ef202debe61e2e26a65f2319bb99c822cf1e9543f6d79fb9469c60 +size 29360368 diff --git a/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf589e920ee1166be6b94f9681a9d7caafb8119b --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac703a62bb9fb14445cce98570ad4c96c3e97efc466a87ff3f09071ed74d411 +size 29360368 diff --git a/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1d9a20e1e62f99eed236a4c3a569b984cf5f05e2 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7737f68a4a3eee5f722a3734a531b1face90240c4938ab1ed13a26d4e7b258b5 +size 29360368 diff --git a/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71ba92b47df40ce18673350c7e5c5e73c28865b4 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09fc705d9407e072f0018cdead4728f5dfc9c871088e7d6ee1904a058d137260 +size 58720552 diff --git a/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56fb2b2fe3e2daa33a007c5d0a71a083676cdda3 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:385f3c4f520d46483aa86afaff55e883d8f59ae6b2c088fdb878245b8f46165a +size 58720560 diff --git a/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a82c71b8ba7eeb8c92bc9ba8dc74413f5625658 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d57c96a0fa1e62e2f25db61add82dc0f350410b87324c15d8141a9e8e51dc6 +size 58720560 diff --git a/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9589797aa0a091b3fc53a3be57b744ec4bdd8d06 --- /dev/null +++ b/model/model/decoder/8/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a0acd49f379d5a77733ac5b7af66eee097369f32d9ffb520e4e3485e0dd5bb6 +size 58720560 diff --git a/model/model/decoder/8/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/8/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..88976907dac5908642f8ff287aa814d9e3885a58 --- /dev/null +++ b/model/model/decoder/8/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d2369eb3a1408e9ef394879ea123adbe9e45c0e2eba736389952897578154e +size 8288 diff --git a/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5781ffe6b4d325340560e4b6c0d2578d71580416 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae58b5caf82ac5f6f925a303f254ef154d6662874c6537acca9d10540cf68e3 +size 200 diff --git a/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f7278d369d2b6ae10d4d1128035e96c3dfd5189 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:490a8b6aa946a0b02e89eb8f518041f2237708e20c737364cb50e6aacbe72ad0 +size 200 diff --git a/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ecdf55a23d901a3399489a4630059570218a00f4 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d179bc875a44854af0f827f3d64c7c3e59305e93c91e245438786e6171fc3f90 +size 200 diff --git a/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2e48ada789e13d50a351c2d0847c25073927ed1 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/model_balance_factors_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa548a7fde0c6ffcdb20a14fa8ae1f6057eb1b5977aed9cc2bd74347573eb0e0 +size 200 diff --git a/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c61ac583e42739d82209ff1edc34d510c3012928 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc4f62ce75a453104385d24befc1c61abf774c288c930c3428ae13b3064b2cd9 +size 8388848 diff --git a/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1dc349766e945bfd88e23ff12b049d5a85794eb8 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f0eade813def473b7aa12064a83571277c81a9f0552c1920ca67d6a54c65b9 +size 8388848 diff --git a/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2b98c32db9a0f54b5eeab553bb5b916bf9849809 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c816b41acc4fd8b04c0b6e42d98e67499c5b14bb5f0f1cfa2771ba1a6ec403d +size 8388848 diff --git a/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e6b23d389a22efe416013711331da2f8dafe299a --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/o_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62cdeb6b81af516508a1c0ec582fa5aa981dfda2e53d568657a0dac7c44d81e0 +size 8388848 diff --git a/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..054b3438128a4da5010bb2145560d79300a8811a --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c0daf3c4ddd3a0b529aa8c8153d45017d1d86c4d163811d04cc4e19a2a2d7a +size 12583264 diff --git a/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1fbdacc9e7b4f1d1898cfd76f97cd1c84805124b --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2a58a9b4282a9ef4272e31dc92a3e91a237a0855242d9661e4f0562e3eb3155 +size 12583272 diff --git a/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0818218a5fc6175553576fc705b0bd47e50f779 --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce777fe49d6883429b10bf2629c030cd7ddad9f1cfd1bd9a6dc00d7d7ddb27ec +size 12583272 diff --git a/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..05d4aaa5e582db8ba61a8e7030d829e8aa69ab7a --- /dev/null +++ b/model/model/decoder/9/pp_block/attn/qkv_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3706dec3f8916f13bb85f3de23f73758075da27945a3a6b0598e22aec6afb116 +size 12583272 diff --git a/model/model/decoder/9/pp_block/input_layernorm/model_weight.safetensors b/model/model/decoder/9/pp_block/input_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..46adb005454ac995cf8e36011048675f3cd0df1b --- /dev/null +++ b/model/model/decoder/9/pp_block/input_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979ed92a0b1253076eca781ee510e9dfcffb4ab49ba8767c17114962e1d60ed4 +size 8288 diff --git a/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1aacbf871e0f89078a543c8cbb05893b853c9ed5 --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab675c055db0e1ea97363ab598788fd4f2f1d7d2dd9b9a42dc5df0ec5d6b430 +size 29360368 diff --git a/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..67473189b50f8694dab5711420fe366fb2bde0fc --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45be4cb6a0eaf4c75f4a721592971699fd3134cb40c142b5f90ebbf6150d3c2c +size 29360368 diff --git a/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3d258f7a8486cfe807288dc5c9f25ab882d950f --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ad83b90bf3c22082e0bbe76ff01da98eb74ba7f2f0db527fd7dbea520f06b1 +size 29360368 diff --git a/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e6c2aa653b76f3779fe0a634fcf085878268c7f --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/down_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157b2f137aa8e9b325081f1af65c1523ab688204f6e9ff5af67a56f50fabca66 +size 29360368 diff --git a/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4ef925c23a5c747bef439f45d11865ec6f9aa3f --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fef237bfda55c7f159486ff7d93d42ff342b49f2eb5869a1e9b833482dac36a +size 58720552 diff --git a/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68ed34da18e607665af5a7cba83c901945394323 --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f434415bfc664bdfff1995ed62b6d4200937713acc9d86b7e734dca4c603d2ff +size 58720560 diff --git a/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d4eb54957a3701e7b07af0a985d64bf6318d2ab5 --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f6f6426a399ce220e19460281272bb5bc7f61fba2136671592c93e9e115505 +size 58720560 diff --git a/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8f83ffb0f1a0361d02b05600e55a546067ebf06 --- /dev/null +++ b/model/model/decoder/9/pp_block/mlp/gate_up_proj/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60dab2e09784fcf615f3d2d0f5c2e0a3c27b5ca06595aca27ca88f04abd882fc +size 58720560 diff --git a/model/model/decoder/9/pp_block/post_attention_layernorm/model_weight.safetensors b/model/model/decoder/9/pp_block/post_attention_layernorm/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52b83b3221c2c70f502dbab56f2a9ee93520fb84 --- /dev/null +++ b/model/model/decoder/9/pp_block/post_attention_layernorm/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aaab17cf466fc86d761c106b608e67b7282d96b8b148c18baadd227ceb625c6 +size 8288 diff --git a/model/model/final_layer_norm/pp_block/model_weight.safetensors b/model/model/final_layer_norm/pp_block/model_weight.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..372118a1e6b762d348ecd6d2a3779ccf7b16dfa0 --- /dev/null +++ b/model/model/final_layer_norm/pp_block/model_weight.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb74223df267ae5c2abf523451c03f1367266d0b0e2456a948bd0037664d216 +size 8288 diff --git a/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..84a7a8b74df4c620c4c341a2a9e90e6c1116348b --- /dev/null +++ b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a39ea10cf468e28fd9fecd74f3c2856c075997918c7c1303b69c108cd37d108 +size 262668528 diff --git a/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d741bbde18ed6700108474f417d12f66bfb9f7c7 --- /dev/null +++ b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ab20d162221abce806b470e2cac60aa1cb48af7f3ddcf61c617cb1dd2a6934 +size 262668536 diff --git a/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8839c19260fd362a350d040ce4b79fd0cfdad558 --- /dev/null +++ b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecde43037de232d7595e21b2eb803701bcf50cacbd68ec035969e7644d8149a +size 262668536 diff --git a/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f8f9c0bab56a80454cb8ebb53094a17e8878522 --- /dev/null +++ b/model/model/lm_head/pp_block/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c39835f0a4d56e7020c6891a2fa87e8707ed05b0ae6d8be19c0cd5c5b0a2c342 +size 262668536 diff --git a/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..334774bca82a71e90215b7e3c754b1dc4df3007e --- /dev/null +++ b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-0-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca43dcac057b8b9034fac7390ccbdac9244824ae306f6f5220f9327443db7d0c +size 262668528 diff --git a/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0534371cebe5fb749bd6be5fa50b689bcbf8493 --- /dev/null +++ b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-1-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7d9cf04763178d7fb3b448079caa921084e7df6a8d416cdd3200a5608fe6a6 +size 262668536 diff --git a/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69e57ed228994e4f59f5e90e303f836f710674cc --- /dev/null +++ b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-2-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961fd903f638a6e742ab3fab427e234912f70b661a563fcdc420060a413aa7c3 +size 262668536 diff --git a/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8494a30664db4a7e9bbccfb62d53ce8fe0cecc6 --- /dev/null +++ b/model/model/token_position_embeddings/pp_block/token_embedding/model_weight_pp-rank-0-of-1_tp-rank-3-of-4.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ce3c971b670c0385261597c413492e23497097407a669246b5ef935db7ba43 +size 262668536 diff --git a/model_config.json b/model_config.json new file mode 100644 index 0000000000000000000000000000000000000000..17278212c443cc814a2339ba4cc947a3706ee533 --- /dev/null +++ b/model_config.json @@ -0,0 +1 @@ +{"bos_token_id": 128000, "eos_token_id": 128001, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, "intermediate_size": 14336, "is_llama_config": true, "max_position_embeddings": 8192, "num_attention_heads": 32, "num_hidden_layers": 32, "num_key_value_heads": 8, "pad_token_id": null, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": null, "rope_theta": 500000.0, "rope_interleaved": false, "tie_word_embeddings": false, "use_cache": true, "vocab_size": 128256} \ No newline at end of file diff --git a/optimizer/optimizer_config.json b/optimizer/optimizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..43deb065895c42d2eaeb380f450583f19a7b5acc --- /dev/null +++ b/optimizer/optimizer_config.json @@ -0,0 +1 @@ +{"type": "NamedOptimizer", "parallelism": {"tp_size": "4", "dp_size": "6", "pp_size": "1", "expert_parallel_size": "1"}, "configs": {}} \ No newline at end of file diff --git a/optimizer/optimizer_pp-0-of-1_tp-0-of-4_exp-0-of-1.pt b/optimizer/optimizer_pp-0-of-1_tp-0-of-4_exp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c0f816c8ca124fb5b1c2b4e02e4caeff6da3cf --- /dev/null +++ b/optimizer/optimizer_pp-0-of-1_tp-0-of-4_exp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fdec7d51e80420ab9fcf718f09f5495525e0fa5161a0e428fab8c28859f1334 +size 8031321881 diff --git a/optimizer/optimizer_pp-0-of-1_tp-1-of-4_exp-0-of-1.pt b/optimizer/optimizer_pp-0-of-1_tp-1-of-4_exp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..999ef105420d1af418cddea8978395154e32864d --- /dev/null +++ b/optimizer/optimizer_pp-0-of-1_tp-1-of-4_exp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e608e4d8e81c361a6217f168f9c6fa7cf97c7d4a463fc291eea2091553df5985 +size 8031321881 diff --git a/optimizer/optimizer_pp-0-of-1_tp-2-of-4_exp-0-of-1.pt b/optimizer/optimizer_pp-0-of-1_tp-2-of-4_exp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2058bef5f45cf63b4e7ba6692a70d9ed809057e --- /dev/null +++ b/optimizer/optimizer_pp-0-of-1_tp-2-of-4_exp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db113e7c35de70345f7f7d315cd858779a82b286a8dd1e85714aed0cbe9e3b3f +size 8031321881 diff --git a/optimizer/optimizer_pp-0-of-1_tp-3-of-4_exp-0-of-1.pt b/optimizer/optimizer_pp-0-of-1_tp-3-of-4_exp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e0b1a4f93fbe783a963a0a8694575610f04427 --- /dev/null +++ b/optimizer/optimizer_pp-0-of-1_tp-3-of-4_exp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccaac97bf3518eda77781ff4065759051118dbbb68741f1d6bc96297d45dde9d +size 8031321881 diff --git a/random/tp-0-of-4_dp-0-of-6_pp-0-of-1.pt b/random/tp-0-of-4_dp-0-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..329c8e3868606973dc8b198e958a70c0fcee52c6 --- /dev/null +++ b/random/tp-0-of-4_dp-0-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1363e5a1856b4eabe1496566847337ac48d7b6ad28f0638f272e1ea52545d268 +size 14620 diff --git a/random/tp-0-of-4_dp-1-of-6_pp-0-of-1.pt b/random/tp-0-of-4_dp-1-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..873c2611c01fdf915cbc779846e6cebfee9d8a9e --- /dev/null +++ b/random/tp-0-of-4_dp-1-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0e77de92df174da3dd3593e1ad18c03f461a0fc00236bf54667551f52f90c71 +size 14620 diff --git a/random/tp-0-of-4_dp-2-of-6_pp-0-of-1.pt b/random/tp-0-of-4_dp-2-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac0aa69a4db9e92fd0bbbc362513c5dc87462810 --- /dev/null +++ b/random/tp-0-of-4_dp-2-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80309638f1bf0db0e51e7e7e560cfe28b6c8362098a7e1b1f5c1fbe8bd8ab08b +size 14620 diff --git a/random/tp-0-of-4_dp-3-of-6_pp-0-of-1.pt b/random/tp-0-of-4_dp-3-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..05c2b6ace05dcf35129138053efd0f49df3ed07b --- /dev/null +++ b/random/tp-0-of-4_dp-3-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799926aa2a38f6863a689421904f2a093620c5df62e5b4e0bce841c4eeb17a92 +size 14620 diff --git a/random/tp-0-of-4_dp-4-of-6_pp-0-of-1.pt b/random/tp-0-of-4_dp-4-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..506baacad55135b757a887713b159b7588d0ba49 --- /dev/null +++ b/random/tp-0-of-4_dp-4-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ee3fc236cebd8163dc91f7778110029cfd621633eb0672a7f77015a88ef1f3 +size 14620 diff --git a/random/tp-0-of-4_dp-5-of-6_pp-0-of-1.pt b/random/tp-0-of-4_dp-5-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb49d48e6eb75a2467abcd4abdb9850be9707633 --- /dev/null +++ b/random/tp-0-of-4_dp-5-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7956840340a12b3047b38727e759ccb54b3684163902e892610a1c6bda9f0a9b +size 14620 diff --git a/random/tp-1-of-4_dp-0-of-6_pp-0-of-1.pt b/random/tp-1-of-4_dp-0-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef890ec00aeb318f37fc987ba29c03b0114df7b6 --- /dev/null +++ b/random/tp-1-of-4_dp-0-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b2eac65629df040bfb76b3120e1216c0cb1f55c6280ba55e9c30caaefa3b613 +size 14620 diff --git a/random/tp-1-of-4_dp-1-of-6_pp-0-of-1.pt b/random/tp-1-of-4_dp-1-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c20ac2b90501a4e4ce5b6bc44e303990897ab73 --- /dev/null +++ b/random/tp-1-of-4_dp-1-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94418d87a6c7b361da85d47ae7a22d04d27bba4e149d7b055af05942d89ac40 +size 14620 diff --git a/random/tp-1-of-4_dp-2-of-6_pp-0-of-1.pt b/random/tp-1-of-4_dp-2-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee1dc6c1876606406797a230a8f395431d014b4 --- /dev/null +++ b/random/tp-1-of-4_dp-2-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebde4e1b8c7eef00414ce20a95388db4f8882314c5af1cdac351f119f1836169 +size 14620 diff --git a/random/tp-1-of-4_dp-3-of-6_pp-0-of-1.pt b/random/tp-1-of-4_dp-3-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..221f382fc0560794aef66484488fafdf665b7058 --- /dev/null +++ b/random/tp-1-of-4_dp-3-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5443f1bb2a94c9ffbd75194a5b248920463104699dc7fa9f40e0c74c4695e505 +size 14620 diff --git a/random/tp-1-of-4_dp-4-of-6_pp-0-of-1.pt b/random/tp-1-of-4_dp-4-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..e897b59772bcf426bad1ccf1620a48c9e57fb824 --- /dev/null +++ b/random/tp-1-of-4_dp-4-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8484266be760ebaef2b93d51af262d87c0a1f0499144dfbcc0b7b6f738e4c12b +size 14620 diff --git a/random/tp-1-of-4_dp-5-of-6_pp-0-of-1.pt b/random/tp-1-of-4_dp-5-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf51dd6b3d7841d278226f474ddc294faa94d78 --- /dev/null +++ b/random/tp-1-of-4_dp-5-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19b8d74b8dffa9ef0f247a3935d3ab5630bbff584b568e1578f46902ba67ba60 +size 14620 diff --git a/random/tp-2-of-4_dp-0-of-6_pp-0-of-1.pt b/random/tp-2-of-4_dp-0-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..505251cff76e605b96034f9f81dc833b37452f83 --- /dev/null +++ b/random/tp-2-of-4_dp-0-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5761ab59fea4ea0e859086a3a8692347edb8481ccd4ee58111df3e1b8b61b2e4 +size 14620 diff --git a/random/tp-2-of-4_dp-1-of-6_pp-0-of-1.pt b/random/tp-2-of-4_dp-1-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27d2e2cf1fe30794c14547e0df7a01948c1d039 --- /dev/null +++ b/random/tp-2-of-4_dp-1-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c47dafded0086072883415c19afa3cb1bf4d323e161f38ad7e2a115210ef74 +size 14620 diff --git a/random/tp-2-of-4_dp-2-of-6_pp-0-of-1.pt b/random/tp-2-of-4_dp-2-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfc7212576f4f7b43729110294cce005a50b38c8 --- /dev/null +++ b/random/tp-2-of-4_dp-2-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad9349966ab01bcd02536e696284295cfa1d217e29ec8fdebab8b77bafcccce +size 14620 diff --git a/random/tp-2-of-4_dp-3-of-6_pp-0-of-1.pt b/random/tp-2-of-4_dp-3-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..143617088e58808239896dab94e65bc2a58bad38 --- /dev/null +++ b/random/tp-2-of-4_dp-3-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0296b113027cae6a58c80466e7b0c5459af1f41f9ce2ce4a773cc3addc77d942 +size 14620 diff --git a/random/tp-2-of-4_dp-4-of-6_pp-0-of-1.pt b/random/tp-2-of-4_dp-4-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..8214a31c664bace8f4b67091ef19351aa9b572f3 --- /dev/null +++ b/random/tp-2-of-4_dp-4-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8e03458dac0b000526d56b7dee4d8d8ab14fa54241c3dc542c2046e8b877cb +size 14620 diff --git a/random/tp-2-of-4_dp-5-of-6_pp-0-of-1.pt b/random/tp-2-of-4_dp-5-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0f637402a2dc892ff64fe763f6fa320b23e67b --- /dev/null +++ b/random/tp-2-of-4_dp-5-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad10f82c8b1ddc98914ad04a8f97b46c2f7d0c0b70d940c246b7280901e1469 +size 14620 diff --git a/random/tp-3-of-4_dp-0-of-6_pp-0-of-1.pt b/random/tp-3-of-4_dp-0-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f38ec442959f71e73c3d31ebb277e68ec1a4415 --- /dev/null +++ b/random/tp-3-of-4_dp-0-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b36801aa80446ac2927ef22a234d6488f93d5c24dbf2096931574f96f63ac0e +size 14620 diff --git a/random/tp-3-of-4_dp-1-of-6_pp-0-of-1.pt b/random/tp-3-of-4_dp-1-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2da6a3cb5df63d1cbdca9fd4dfe788da6bdba95 --- /dev/null +++ b/random/tp-3-of-4_dp-1-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdef203bdf5ebd5417835e75b0cad4786435378d889c958d0614deafc21d4824 +size 14620 diff --git a/random/tp-3-of-4_dp-2-of-6_pp-0-of-1.pt b/random/tp-3-of-4_dp-2-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..044f4690d47b623388331986da51a1ef192c1c66 --- /dev/null +++ b/random/tp-3-of-4_dp-2-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c55bbfa5ea039051af4989d767cdfe924430eaba9ee05268a74c28fbbf5b65 +size 14620 diff --git a/random/tp-3-of-4_dp-3-of-6_pp-0-of-1.pt b/random/tp-3-of-4_dp-3-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c829b8121b52fb580e6a4b6eabb39629b0c1e72 --- /dev/null +++ b/random/tp-3-of-4_dp-3-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f877b2d7997d37ca345f10f8219bb5ab2d7b4049ccbcf8e40eafeb19da27748d +size 14620 diff --git a/random/tp-3-of-4_dp-4-of-6_pp-0-of-1.pt b/random/tp-3-of-4_dp-4-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..99087dbe1f46ddeeda95fac38e4cca47ff0fd8b1 --- /dev/null +++ b/random/tp-3-of-4_dp-4-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcec9f717b19f3f443eec42c86ca045e5d7331a8751670a27731d6e76b3b586f +size 14620 diff --git a/random/tp-3-of-4_dp-5-of-6_pp-0-of-1.pt b/random/tp-3-of-4_dp-5-of-6_pp-0-of-1.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e746f514af1bdc33aede6574ceef6566b9caa23 --- /dev/null +++ b/random/tp-3-of-4_dp-5-of-6_pp-0-of-1.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e886e90a1668327bd99eeb2e9151b74388dad4cbfb46b2253f5b6bb0ac1a5d +size 14620