Neu256 committed • Commit d8e3eae • 1 Parent(s): afd8fc6

Upload 11 files

models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/README.md ADDED
@@ -0,0 +1,61 @@
+ ---
+ license: apache-2.0
+ datasets:
+ - cerebras/SlimPajama-627B
+ - bigcode/starcoderdata
+ - HuggingFaceH4/ultrachat_200k
+ - HuggingFaceH4/ultrafeedback_binarized
+ language:
+ - en
+ widget:
+ - text: "<|system|>\nYou are a chatbot who can help code!</s>\n<|user|>\nWrite me a function to calculate the first 10 digits of the fibonacci sequence in Python and print it out to the CLI.</s>\n<|assistant|>\n"
+ ---
+ <div align="center">
+
+ # TinyLlama-1.1B
+ </div>
+
+ https://github.com/jzhang38/TinyLlama
+
+ The TinyLlama project aims to **pretrain** a **1.1B Llama model on 3 trillion tokens**. With some proper optimization, this can be achieved in a span of "just" 90 days using 16 A100-40G GPUs 🚀🚀. Training started on 2023-09-01.
+
+
+ We adopted exactly the same architecture and tokenizer as Llama 2, so TinyLlama can be dropped into many open-source projects built upon Llama. TinyLlama is also compact, with only 1.1B parameters, which lets it serve applications that demand a restricted computation and memory footprint.
+
+ #### This Model
+ This is the chat model fine-tuned on top of [TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T](https://huggingface.co/TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T). **We follow the training recipe of [HF's Zephyr](https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha/edit/main/README.md).** The model was initially fine-tuned on a variant of the [`UltraChat`](https://huggingface.co/datasets/stingning/ultrachat) dataset, which contains a diverse range of synthetic dialogues generated by ChatGPT.
+ We then further aligned the model with [🤗 TRL's](https://github.com/huggingface/trl) `DPOTrainer` on the [openbmb/UltraFeedback](https://huggingface.co/datasets/openbmb/UltraFeedback) dataset, which contains 64k prompts and model completions ranked by GPT-4.
+
+
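+ For readers curious about what that alignment step looks like in code, the following is a minimal, hypothetical sketch (not the script actually used for this model). It assumes the TRL 0.7-era `DPOTrainer` constructor, where `beta`, `max_length` and `max_prompt_length` are passed directly, and a preference dataset already flattened to plain-text `prompt`/`chosen`/`rejected` columns; the hyperparameters are illustrative only.
+
+ ```python
+ # Hypothetical DPO sketch, not this model's actual training script.
+ # Assumes trl~=0.7 (constructor-style arguments) and a flattened preference dataset.
+ import torch
+ from datasets import Dataset
+ from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments
+ from trl import DPOTrainer
+
+ base_id = "TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T"  # in practice, the UltraChat-SFT checkpoint would be used here
+ model = AutoModelForCausalLM.from_pretrained(base_id, torch_dtype=torch.bfloat16)
+ ref_model = AutoModelForCausalLM.from_pretrained(base_id, torch_dtype=torch.bfloat16)  # frozen reference policy
+ tokenizer = AutoTokenizer.from_pretrained(base_id)
+ tokenizer.pad_token = tokenizer.eos_token
+
+ # Toy stand-in for the flattened UltraFeedback preference pairs.
+ train_dataset = Dataset.from_dict({
+     "prompt": ["<|user|>\nWhat is the capital of France?</s>\n<|assistant|>\n"],
+     "chosen": ["The capital of France is Paris.</s>"],
+     "rejected": ["France does not have a capital.</s>"],
+ })
+
+ training_args = TrainingArguments(
+     output_dir="tinyllama-dpo-sketch",
+     per_device_train_batch_size=2,
+     learning_rate=5e-7,
+     num_train_epochs=3,
+     bf16=True,
+     logging_steps=10,
+ )
+
+ trainer = DPOTrainer(
+     model,
+     ref_model,
+     args=training_args,
+     beta=0.1,                 # strength of the implicit KL penalty toward the reference model
+     train_dataset=train_dataset,
+     tokenizer=tokenizer,
+     max_length=1024,
+     max_prompt_length=512,
+ )
+ trainer.train()
+ ```
+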
+ #### How to use
+ You will need transformers>=4.34.
+ Check the [TinyLlama](https://github.com/jzhang38/TinyLlama) GitHub page for more information.
+
+ ```python
+ # Install transformers from source - only needed for versions <= v4.34
+ # pip install git+https://github.com/huggingface/transformers.git
+ # pip install accelerate
+
+ import torch
+ from transformers import pipeline
+
+ pipe = pipeline("text-generation", model="TinyLlama/TinyLlama-1.1B-Chat-v1.0", torch_dtype=torch.bfloat16, device_map="auto")
+
+ # We use the tokenizer's chat template to format each message - see https://huggingface.co/docs/transformers/main/en/chat_templating
+ messages = [
+     {
+         "role": "system",
+         "content": "You are a friendly chatbot who always responds in the style of a pirate",
+     },
+     {"role": "user", "content": "How many helicopters can a human eat in one sitting?"},
+ ]
+ prompt = pipe.tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
+ outputs = pipe(prompt, max_new_tokens=256, do_sample=True, temperature=0.7, top_k=50, top_p=0.95)
+ print(outputs[0]["generated_text"])
+ # <|system|>
+ # You are a friendly chatbot who always responds in the style of a pirate.</s>
+ # <|user|>
+ # How many helicopters can a human eat in one sitting?</s>
+ # <|assistant|>
+ # ...
+ ```
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+   "architectures": [
+     "LlamaForCausalLM"
+   ],
+   "attention_bias": false,
+   "bos_token_id": 1,
+   "eos_token_id": 2,
+   "hidden_act": "silu",
+   "hidden_size": 2048,
+   "initializer_range": 0.02,
+   "intermediate_size": 5632,
+   "max_position_embeddings": 2048,
+   "model_type": "llama",
+   "num_attention_heads": 32,
+   "num_hidden_layers": 22,
+   "num_key_value_heads": 4,
+   "pretraining_tp": 1,
+   "rms_norm_eps": 1e-05,
+   "rope_scaling": null,
+   "rope_theta": 10000.0,
+   "tie_word_embeddings": false,
+   "torch_dtype": "bfloat16",
+   "transformers_version": "4.35.0",
+   "use_cache": true,
+   "vocab_size": 32000
+ }
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/eval_results.json ADDED
@@ -0,0 +1,16 @@
+ {
+   "epoch": 3.0,
+   "eval_logits/chosen": -2.707406759262085,
+   "eval_logits/rejected": -2.656524419784546,
+   "eval_logps/chosen": -370.1297607421875,
+   "eval_logps/rejected": -296.0738525390625,
+   "eval_loss": 0.513750433921814,
+   "eval_rewards/accuracies": 0.738095223903656,
+   "eval_rewards/chosen": -0.02744222804903984,
+   "eval_rewards/margins": 1.0087225437164307,
+   "eval_rewards/rejected": -1.03616464138031,
+   "eval_runtime": 93.5908,
+   "eval_samples": 2000,
+   "eval_samples_per_second": 21.37,
+   "eval_steps_per_second": 0.673
+ }
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/generation_config.json ADDED
@@ -0,0 +1,7 @@
+ {
+   "bos_token_id": 1,
+   "eos_token_id": 2,
+   "max_length": 2048,
+   "pad_token_id": 0,
+   "transformers_version": "4.35.0"
+ }
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/huggingface-metadata.txt ADDED
@@ -0,0 +1,6 @@
+ url: https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0
+ branch: main
+ download date: 2024-01-04 21:10:57
+ sha256sum:
+ 6e6001da2106d4757498752a021df6c2bdc332c650aae4bae6b0c004dcf14933 model.safetensors
+ 9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347 tokenizer.model
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
+ {
+   "bos_token": {
+     "content": "<s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": {
+     "content": "</s>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "unk_token": {
+     "content": "<unk>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/tokenizer.json ADDED
The diff for this file is too large to render.
 
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/tokenizer.model ADDED
Binary file (500 kB).
 
models/TinyLlama_TinyLlama-1.1B-Chat-v1.0/tokenizer_config.json ADDED
@@ -0,0 +1,40 @@
+ {
+   "added_tokens_decoder": {
+     "0": {
+       "content": "<unk>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "<s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "2": {
+       "content": "</s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<s>",
+   "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
+   "clean_up_tokenization_spaces": false,
+   "eos_token": "</s>",
+   "legacy": false,
+   "model_max_length": 2048,
+   "pad_token": "</s>",
+   "padding_side": "right",
+   "sp_model_kwargs": {},
+   "tokenizer_class": "LlamaTokenizer",
+   "unk_token": "<unk>",
+   "use_default_system_prompt": false
+ }
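The `chat_template` entry above is the Jinja template that `apply_chat_template` uses to turn a message list into the `<|system|>` / `<|user|>` / `<|assistant|>` prompt format shown in the README. A minimal illustration (not part of the uploaded files), assuming network access to the published checkpoint:

```python
# Small illustration of the chat_template above; the output shape matches the README example.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("TinyLlama/TinyLlama-1.1B-Chat-v1.0")

messages = [
    {"role": "system", "content": "You are a friendly chatbot."},
    {"role": "user", "content": "Hello!"},
]
prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(prompt)
# <|system|>
# You are a friendly chatbot.</s>
# <|user|>
# Hello!</s>
# <|assistant|>
```
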
models/config-user.yaml ADDED
@@ -0,0 +1,20 @@
+ TinyLlama_TinyLlama-1.1B-Chat-v1.0$:
+   loader: Transformers
+   cpu_memory: 2048
+   auto_devices: false
+   disk: false
+   cpu: true
+   bf16: true
+   load_in_8bit: false
+   trust_remote_code: false
+   no_use_fast: false
+   use_flash_attention_2: false
+   load_in_4bit: false
+   compute_dtype: bfloat16
+   quant_type: fp4
+   use_double_quant: false
+   disable_exllama: false
+   disable_exllamav2: false
+   compress_pos_emb: 1
+   alpha_value: 1
+   rope_freq_base: 0
models/config.yaml ADDED
@@ -0,0 +1,192 @@
+ .*(llama|alpac|vicuna|guanaco|koala|llava|wizardlm|metharme|pygmalion-7b|pygmalion-2|mythalion|wizard-mega|openbuddy|vigogne|h2ogpt-research|manticore):
+   model_type: 'llama'
+ .*(opt-|opt_|opt1|opt3|optfor|galactica|galpaca|pygmalion-350m):
+   model_type: 'opt'
+ .*(gpt-j|gptj|gpt4all-j|malion-6b|pygway|pygmalion-6b|dolly-v1):
+   model_type: 'gptj'
+ .*(gpt-neox|koalpaca-polyglot|polyglot.*koalpaca|polyglot-ko|polyglot_ko|pythia|stablelm|incite|dolly-v2|polycoder|h2ogpt-oig|h2ogpt-oasst1|h2ogpt-gm):
+   model_type: 'gptneox'
+ .*bloom:
+   model_type: 'bloom'
+ .*gpt2:
+   model_type: 'gpt2'
+ .*falcon:
+   model_type: 'falcon'
+ .*mpt:
+   model_type: 'mpt'
+ .*(starcoder|starchat):
+   model_type: 'starcoder'
+ .*dolly-v2:
+   model_type: 'dollyv2'
+ .*replit:
+   model_type: 'replit'
+ .*(oasst|openassistant-|stablelm-7b-sft-v7-epoch-3):
+   instruction_template: 'Open Assistant'
+   skip_special_tokens: false
+ (?!.*galactica)(?!.*reward).*openassistant:
+   instruction_template: 'Open Assistant'
+   skip_special_tokens: false
+ .*galactica:
+   skip_special_tokens: false
+ .*dolly-v[0-9]-[0-9]*b:
+   instruction_template: 'Alpaca'
+   skip_special_tokens: false
+ .*alpaca-native-4bit:
+   instruction_template: 'Alpaca'
+   custom_stopping_strings: '"### End"'
+ .*llava:
+   instruction_template: 'LLaVA'
+   custom_stopping_strings: '"\n###"'
+ .*llava.*1.5:
+   instruction_template: 'Vicuna-v1.1'
+ .*wizard.*mega:
+   instruction_template: 'Wizard-Mega'
+   custom_stopping_strings: '"</s>"'
+ .*starchat-beta:
+   instruction_template: 'Starchat-Beta'
+   custom_stopping_strings: '"<|end|>"'
+ (?!.*v0)(?!.*1.1)(?!.*1_1)(?!.*stable)(?!.*chinese).*vicuna:
+   instruction_template: 'Vicuna-v0'
+ .*vicuna.*v0:
+   instruction_template: 'Vicuna-v0'
+ .*vicuna.*(1.1|1_1|1.3|1_3):
+   instruction_template: 'Vicuna-v1.1'
+ .*vicuna.*(1.5|1_5):
+   instruction_template: 'Vicuna-v1.1'
+ .*stable.*vicuna:
+   instruction_template: 'StableVicuna'
+ (?!.*chat).*chinese-vicuna:
+   instruction_template: 'Alpaca'
+ .*chinese-vicuna.*chat:
+   instruction_template: 'Chinese-Vicuna-Chat'
+ .*alpaca:
+   instruction_template: 'Alpaca'
+ .*koala:
+   instruction_template: 'Koala'
+ .*chatglm:
+   instruction_template: 'ChatGLM'
+ .*(metharme|pygmalion|mythalion):
+   instruction_template: 'Metharme'
+ .*raven:
+   instruction_template: 'RWKV-Raven'
+ .*moss-moon.*sft:
+   instruction_template: 'MOSS'
+ .*stablelm-tuned:
+   instruction_template: 'StableLM'
+ .*galactica.*finetuned:
+   instruction_template: 'Galactica Finetuned'
+ .*galactica.*-v2:
+   instruction_template: 'Galactica v2'
+ (?!.*finetuned)(?!.*-v2).*galactica:
+   instruction_template: 'Galactica'
+ .*guanaco:
+   instruction_template: 'Guanaco non-chat'
+ .*baize:
+   instruction_template: 'Baize'
+ .*mpt-.*instruct:
+   instruction_template: 'Alpaca'
+ .*mpt-.*chat:
+   instruction_template: 'ChatML'
+ (?!.*-flan-)(?!.*-t5-).*lamini-:
+   instruction_template: 'Alpaca'
+ .*incite.*chat:
+   instruction_template: 'INCITE-Chat'
+ .*incite.*instruct:
+   instruction_template: 'INCITE-Instruct'
+ .*ziya-:
+   instruction_template: 'Ziya'
+ .*koalpaca:
+   instruction_template: 'KoAlpaca'
+ .*openbuddy:
+   instruction_template: 'OpenBuddy'
+ (?!.*chat).*vigogne:
+   instruction_template: 'Vigogne-Instruct'
+ .*vigogne.*chat:
+   instruction_template: 'Vigogne-Chat'
+ .*(llama-deus|supercot|llama-natural-instructions|open-llama-0.3t-7b-instruct-dolly-hhrlhf|open-llama-0.3t-7b-open-instruct):
+   instruction_template: 'Alpaca'
+ .*bactrian:
+   instruction_template: 'Bactrian'
+ .*(h2ogpt-oig-|h2ogpt-oasst1-|h2ogpt-research-oasst1-):
+   instruction_template: 'INCITE-Chat'
+ .*h2ogpt-gm-:
+   instruction_template: 'H2O-prompt_answer'
+ .*manticore:
+   instruction_template: 'Manticore Chat'
+ .*bluemoonrp-(30|13)b:
+   instruction_template: 'Bluemoon'
+ .*Nous-Hermes-13b:
+   instruction_template: 'Alpaca'
+ .*airoboros:
+   instruction_template: 'Vicuna-v1.1'
+ .*airoboros.*1.2:
+   instruction_template: 'Airoboros-v1.2'
+ .*alpa(cino|sta):
+   instruction_template: 'Alpaca'
+ .*hippogriff:
+   instruction_template: 'Hippogriff'
+ .*lazarus:
+   instruction_template: 'Alpaca'
+ .*guanaco-.*(7|13|33|65)b:
+   instruction_template: 'Vicuna-v0'
+ .*hypermantis:
+   instruction_template: 'Alpaca'
+ .*open-llama-.*-open-instruct:
+   instruction_template: 'Alpaca'
+ .*starcoder-gpteacher-code-instruct:
+   instruction_template: 'Alpaca'
+ .*tulu:
+   instruction_template: 'Tulu'
+ .*chronos:
+   instruction_template: 'Alpaca'
+ .*samantha:
+   instruction_template: 'Samantha'
+ .*wizardcoder:
+   instruction_template: 'Alpaca'
+ .*minotaur:
+   instruction_template: 'Manticore Chat'
+ .*orca_mini:
+   instruction_template: 'Orca Mini'
+ .*(platypus|gplatty|superplatty):
+   instruction_template: 'Alpaca'
+ .*(openorca-platypus2):
+   instruction_template: 'OpenOrca-Platypus2'
+   custom_stopping_strings: '"### Instruction:", "### Response:"'
+ .*longchat:
+   instruction_template: 'Vicuna-v1.1'
+ .*vicuna-33b:
+   instruction_template: 'Vicuna-v1.1'
+ .*redmond-hermes-coder:
+   instruction_template: 'Alpaca'
+ .*wizardcoder-15b:
+   instruction_template: 'Alpaca'
+ .*wizardlm:
+   instruction_template: 'Vicuna-v1.1'
+ .*godzilla:
+   instruction_template: 'Alpaca'
+ .*llama(-?)(2|v2).*chat:
+   instruction_template: 'Llama-v2'
+ .*newhope:
+   instruction_template: 'NewHope'
+ .*stablebeluga2:
+   instruction_template: 'StableBeluga2'
+ .*openchat:
+   instruction_template: 'OpenChat'
+ .*codellama.*instruct:
+   instruction_template: 'Llama-v2'
+ .*(mistral|mixtral).*instruct:
+   instruction_template: 'Mistral'
+ .*mistral.*openorca:
+   instruction_template: 'ChatML'
+ .*(WizardCoder-Python-34B-V1.0|Phind-CodeLlama-34B-v2|CodeBooga-34B-v0.1):
+   instruction_template: 'Alpaca'
+ .*orca-2-(13|7)b:
+   instruction_template: 'ChatML'
+ .*openhermes.*mistral:
+   instruction_template: 'ChatML'
+ .*Yi-34B-Chat:
+   instruction_template: 'ChatML'
+ (dolphin).*:
+   instruction_template: 'ChatML'
+ .*synthia:
+   instruction_template: 'Synthia'
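Both models/config.yaml and models/config-user.yaml are keyed by regular expressions matched against the model's folder name (the user file uses the literal folder name with a trailing `$`). As a rough illustration of how such a lookup can be resolved, here is a minimal sketch; it assumes case-insensitive `re.match` semantics and that later matches override earlier ones, which mirrors, but is not copied from, text-generation-webui's own loader:

```python
# Hypothetical sketch of resolving per-model settings from regex-keyed YAML files.
# Assumes case-insensitive re.match semantics and later matches overriding earlier ones;
# the real text-generation-webui loader may differ in details.
import re
import yaml

def load_model_settings(model_name: str, *config_paths: str) -> dict:
    settings: dict = {}
    for path in config_paths:
        with open(path) as f:
            config = yaml.safe_load(f) or {}
        for pattern, values in config.items():
            # Each top-level key is treated as a regex against the model folder name.
            if re.match(pattern.lower(), model_name.lower()):
                settings.update(values)
    return settings

settings = load_model_settings(
    "TinyLlama_TinyLlama-1.1B-Chat-v1.0",
    "models/config.yaml",        # shared defaults (regex keys)
    "models/config-user.yaml",   # per-model overrides saved from the UI
)
print(settings.get("model_type"), settings.get("loader"))  # e.g. llama Transformers
```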