p1atdev committed on
Commit
3c2add4
•
1 Parent(s): cb35885

Upload 6 files

Browse files
README.md CHANGED
@@ -1,3 +1,20 @@
1
  ---
2
- license: apache-2.0
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ library_name: peft
3
  ---
4
+ ## Training procedure
5
+
6
+
7
+ The following `bitsandbytes` quantization config was used during training:
8
+ - load_in_8bit: True
9
+ - load_in_4bit: False
10
+ - llm_int8_threshold: 6.0
11
+ - llm_int8_skip_modules: None
12
+ - llm_int8_enable_fp32_cpu_offload: False
13
+ - llm_int8_has_fp16_weight: False
14
+ - bnb_4bit_quant_type: fp4
15
+ - bnb_4bit_use_double_quant: False
16
+ - bnb_4bit_compute_dtype: float32
17
+ ### Framework versions
18
+
19
+
20
+ - PEFT 0.4.0
adapter_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "auto_mapping": null,
3
+ "base_model_name_or_path": "stabilityai/japanese-stablelm-base-alpha-7b",
4
+ "bias": "none",
5
+ "fan_in_fan_out": false,
6
+ "inference_mode": true,
7
+ "init_lora_weights": true,
8
+ "layers_pattern": null,
9
+ "layers_to_transform": null,
10
+ "lora_alpha": 1,
11
+ "lora_dropout": 0.01,
12
+ "modules_to_save": null,
13
+ "peft_type": "LORA",
14
+ "r": 8,
15
+ "revision": null,
16
+ "target_modules": [
17
+ "query_key_value"
18
+ ],
19
+ "task_type": "CAUSAL_LM"
20
+ }
adapter_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a02317b00cc39b4205c4a4964b45bb2784ce02e55265364c0332f69a725c0778
3
+ size 16800945
special_tokens_map.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "0",
4
+ "1",
5
+ "2",
6
+ "3",
7
+ "4",
8
+ "5",
9
+ "6",
10
+ "7",
11
+ "8",
12
+ "9",
13
+ "▁▁",
14
+ "▁▁▁▁",
15
+ "▁▁▁▁▁▁▁▁",
16
+ "▁▁▁▁▁▁▁▁▁▁▁▁",
17
+ "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
18
+ " ",
19
+ " ",
20
+ "⁂",
21
+ "─",
22
+ "***",
23
+ "----",
24
+ "▁\"",
25
+ "▁Author",
26
+ "▁Title",
27
+ "▁Tags",
28
+ "▁Genre",
29
+ "▁Style",
30
+ "▁Knowledge",
31
+ "▁Summary",
32
+ "▁Rating",
33
+ "Type",
34
+ "Characters",
35
+ "Glossary",
36
+ "<|spmspace|>",
37
+ "<|spmspace|><|spmspace|>",
38
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
39
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
40
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
41
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
42
+ "<|mtvocab|>",
43
+ "<|mtvenglish|>",
44
+ "<|mtvjapanese|>",
45
+ "<|mtsentence|>",
46
+ "<|mtsjapanese|>",
47
+ "<|mtsenglish|>",
48
+ "<|mtsentenceend|>",
49
+ "<|mtvocabend|>",
50
+ "<|mtend|>",
51
+ "<|mask|>",
52
+ "<|masksingle|>",
53
+ "<|maskshort|>",
54
+ "<|maskmedium|>",
55
+ "<|masklong|>",
56
+ "<|maskparagraph|>",
57
+ "<|maskend|>",
58
+ "<|fill|>",
59
+ "<|fillend|>",
60
+ "<|rubycover|>",
61
+ "<|rubystart|>",
62
+ "<|rubyend|>",
63
+ "<|reserved0|>",
64
+ "<|reserved1|>",
65
+ "<|reserved2|>",
66
+ "<|reserved3|>",
67
+ "<|reserved4|>",
68
+ "<|reserved5|>",
69
+ "<|reserved6|>",
70
+ "<|reserved7|>",
71
+ "<|reserved8|>",
72
+ "<|reserved9|>",
73
+ "<|reserved10|>"
74
+ ],
75
+ "bos_token": "<|startoftext|>",
76
+ "eos_token": "<|endoftext|>",
77
+ "pad_token": "<|pad|>",
78
+ "unk_token": "<|unknown|>"
79
+ }
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:578fa0ed4d6dbee435f21d7f7a741506d09cdd93cce241008abf725407cbdb41
3
+ size 1033724
tokenizer_config.json ADDED
@@ -0,0 +1,116 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_special_tokens": true,
5
+ "additional_special_tokens": [
6
+ "0",
7
+ "1",
8
+ "2",
9
+ "3",
10
+ "4",
11
+ "5",
12
+ "6",
13
+ "7",
14
+ "8",
15
+ "9",
16
+ "▁▁",
17
+ "▁▁▁▁",
18
+ "▁▁▁▁▁▁▁▁",
19
+ "▁▁▁▁▁▁▁▁▁▁▁▁",
20
+ "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
21
+ " ",
22
+ " ",
23
+ "⁂",
24
+ "─",
25
+ "***",
26
+ "----",
27
+ "▁\"",
28
+ "▁Author",
29
+ "▁Title",
30
+ "▁Tags",
31
+ "▁Genre",
32
+ "▁Style",
33
+ "▁Knowledge",
34
+ "▁Summary",
35
+ "▁Rating",
36
+ "Type",
37
+ "Characters",
38
+ "Glossary",
39
+ "<|spmspace|>",
40
+ "<|spmspace|><|spmspace|>",
41
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
42
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
43
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
44
+ "<|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|><|spmspace|>",
45
+ "<|mtvocab|>",
46
+ "<|mtvenglish|>",
47
+ "<|mtvjapanese|>",
48
+ "<|mtsentence|>",
49
+ "<|mtsjapanese|>",
50
+ "<|mtsenglish|>",
51
+ "<|mtsentenceend|>",
52
+ "<|mtvocabend|>",
53
+ "<|mtend|>",
54
+ "<|mask|>",
55
+ "<|masksingle|>",
56
+ "<|maskshort|>",
57
+ "<|maskmedium|>",
58
+ "<|masklong|>",
59
+ "<|maskparagraph|>",
60
+ "<|maskend|>",
61
+ "<|fill|>",
62
+ "<|fillend|>",
63
+ "<|rubycover|>",
64
+ "<|rubystart|>",
65
+ "<|rubyend|>",
66
+ "<|reserved0|>",
67
+ "<|reserved1|>",
68
+ "<|reserved2|>",
69
+ "<|reserved3|>",
70
+ "<|reserved4|>",
71
+ "<|reserved5|>",
72
+ "<|reserved6|>",
73
+ "<|reserved7|>",
74
+ "<|reserved8|>",
75
+ "<|reserved9|>",
76
+ "<|reserved10|>"
77
+ ],
78
+ "bos_token": {
79
+ "__type": "AddedToken",
80
+ "content": "<|startoftext|>",
81
+ "lstrip": false,
82
+ "normalized": true,
83
+ "rstrip": false,
84
+ "single_word": false
85
+ },
86
+ "clean_up_tokenization_spaces": false,
87
+ "eos_token": {
88
+ "__type": "AddedToken",
89
+ "content": "<|endoftext|>",
90
+ "lstrip": false,
91
+ "normalized": true,
92
+ "rstrip": false,
93
+ "single_word": false
94
+ },
95
+ "legacy": true,
96
+ "model_max_length": 8192,
97
+ "pad_token": {
98
+ "__type": "AddedToken",
99
+ "content": "<|pad|>",
100
+ "lstrip": false,
101
+ "normalized": true,
102
+ "rstrip": false,
103
+ "single_word": false
104
+ },
105
+ "sp_model_kwargs": {},
106
+ "tokenizer_class": "LlamaTokenizer",
107
+ "truncation": false,
108
+ "unk_token": {
109
+ "__type": "AddedToken",
110
+ "content": "<|unknown|>",
111
+ "lstrip": false,
112
+ "normalized": true,
113
+ "rstrip": false,
114
+ "single_word": false
115
+ }
116
+ }