Neko-Institute-of-Science
/

LLaMA-13B-8bit-LoRA-LightNovels

Model card Files and versions Community

Neko-Institute-of-Science committed on Apr 25, 2023

Commit

6434efc

•

1 Parent(s): a119e81

23/150 Hours

Browse files

Files changed (29) hide show

checkpoint-1248/adapter_config.json +17 -0
checkpoint-1248/adapter_model.bin +3 -0
checkpoint-1664/adapter_config.json +17 -0
checkpoint-1664/adapter_model.bin +3 -0
checkpoint-2080/adapter_config.json +17 -0
checkpoint-2080/adapter_model.bin +3 -0
checkpoint-2496/adapter_config.json +17 -0
checkpoint-2496/adapter_model.bin +3 -0
checkpoint-2912/adapter_config.json +17 -0
checkpoint-2912/adapter_model.bin +3 -0
checkpoint-3328/adapter_config.json +17 -0
checkpoint-3328/adapter_model.bin +3 -0
checkpoint-3744/adapter_config.json +17 -0
checkpoint-3744/adapter_model.bin +3 -0
checkpoint-416/adapter_config.json +17 -0
checkpoint-416/adapter_model.bin +3 -0
checkpoint-4160/adapter_config.json +17 -0
checkpoint-4160/adapter_model.bin +3 -0
checkpoint-4576/adapter_config.json +17 -0
checkpoint-4576/adapter_model.bin +3 -0
checkpoint-4992/adapter_config.json +17 -0
checkpoint-4992/adapter_model.bin +3 -0
checkpoint-5408/adapter_config.json +17 -0
checkpoint-5408/adapter_model.bin +3 -0
checkpoint-5824/adapter_config.json +17 -0
checkpoint-5824/adapter_model.bin +3 -0
checkpoint-832/adapter_config.json +17 -0
checkpoint-832/adapter_model.bin +3 -0
training_parameters.json +1 -0

checkpoint-1248/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-1248/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:674ef686e61b33bd71270d8fac4534c92eaa8111a5b28478fd1f49bf5ae9bfee
+size 838918733

checkpoint-1664/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-1664/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd1c28fc8f75321a71ed3d79891a4e9e7515243bc4d92cd1a0e038ea7ba9bcad
+size 838918733

checkpoint-2080/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-2080/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a959b1c89d27f91fa225aa4892e07e150915ac37c0ecf19b71c94f6e04d69f9
+size 838918733

checkpoint-2496/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-2496/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a384984c1e2b93dd40d0b6f31b5511acefab75162a0c6e1ad1929c83528741c4
+size 838918733

checkpoint-2912/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-2912/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1ce8b4e6f9b4a4f6783987db47e34d8c859816e0ef3a6715fb6de5f54cc49117
+size 838918733

checkpoint-3328/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-3328/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:155ef17fed8fc7d4568a5e80b56dc6350e4c5e9fae54bbd422410cf96e785125
+size 838918733

checkpoint-3744/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-3744/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0caf6d56c4815d2ad5378f3bac281e5cbc24c6849ccabbcaf26fba039f76231
+size 838918733

checkpoint-416/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-416/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0e5db4ef7912abadf1976e3fa3e171c7bb32685b476f6712e046712ce4708bd5
+size 838918733

checkpoint-4160/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-4160/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:10b7dfecd54a9ed1dba450819eec4fcd1eb16847eb4473dc76b2642ba3b46675
+size 838918733

checkpoint-4576/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-4576/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91e076344275bdbc4f30d5243b0cace1a8d2c0874ed75305d85b3060a12d98b1
+size 838918733

checkpoint-4992/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-4992/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:20ba7fa868fc62aa5fbe9ff2e897e7c551cda46384f9ab7cb94d6426f5c50542
+size 838918733

checkpoint-5408/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-5408/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48078bea5ea8ea69cc052e22b74d291d4d0f874a18180046db13c57b982f42e2
+size 838918733

checkpoint-5824/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-5824/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2b8a670041222ff33399eeb22747a86f7ff8cb0e0959f1bed7d0d9061f064e4
+size 838918733

checkpoint-832/adapter_config.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+  "base_model_name_or_path": "models/llama-13b",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "lora_alpha": 512,
+  "lora_dropout": 0.05,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 256,
+  "target_modules": [
+    "q_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

checkpoint-832/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8af4068daca68b5f524a373f4fa68c94502fcc89afee6d9f38e5d94990515e8c
+size 838918733

training_parameters.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"lora_name": "LightNovels", "always_override": false, "save_steps": 400.0, "micro_batch_size": 4, "batch_size": 128, "epochs": 1.0, "learning_rate": "3e-4", "lr_scheduler_type": "constant", "lora_rank": 256, "lora_alpha": 512, "lora_dropout": 0.05, "cutoff_len": 2048, "dataset": "None", "eval_dataset": "None", "format": "None", "eval_steps": 100.0, "raw_text_file": "LightNovels_clean", "overlap_len": 512, "newline_favor_len": 512, "do_shuffle": true, "higher_rank_limit": false, "warmup_steps": 100.0, "optimizer": "adamw_torch"}