update dumpfile with correct kv array rendering
Browse files
Tinyllama-4.6M-v0.0-F16.md → Tinyllama-4.6M-v0.0-F16.dump.md
RENAMED
@@ -11,20 +11,20 @@ There are 36 key-value pairs in this file
|
|
11 |
| 1 | UINT32 | 1 | GGUF.version | 3 |
|
12 |
| 2 | UINT64 | 1 | GGUF.tensor_count | 75 |
|
13 |
| 3 | UINT64 | 1 | GGUF.kv_count | 33 |
|
14 |
-
| 4 | STRING | 1 | general.architecture |
|
15 |
-
| 5 | STRING | 1 | general.type |
|
16 |
-
| 6 | STRING | 1 | general.name |
|
17 |
-
| 7 | STRING | 1 | general.author |
|
18 |
-
| 8 | STRING | 1 | general.version |
|
19 |
-
| 9 | STRING | 1 | general.description |
|
20 |
-
| 10 | STRING | 1 | general.quantized_by |
|
21 |
-
| 11 | STRING | 1 | general.size_label |
|
22 |
-
| 12 | STRING | 1 | general.license |
|
23 |
-
| 13 | STRING | 1 | general.url |
|
24 |
-
| 14 | STRING | 1 | general.source.url |
|
25 |
-
| 15 | [STRING] | 5 | general.tags | [
|
26 |
-
| 16 | [STRING] | 1 | general.languages | [
|
27 |
-
| 17 | [STRING] | 2 | general.datasets | [
|
28 |
| 18 | UINT32 | 1 | llama.block_count | 8 |
|
29 |
| 19 | UINT32 | 1 | llama.context_length | 2048 |
|
30 |
| 20 | UINT32 | 1 | llama.embedding_length | 64 |
|
@@ -34,11 +34,11 @@ There are 36 key-value pairs in this file
|
|
34 |
| 24 | UINT32 | 1 | general.file_type | 1 |
|
35 |
| 25 | UINT32 | 1 | llama.vocab_size | 32000 |
|
36 |
| 26 | UINT32 | 1 | llama.rope.dimension_count | 4 |
|
37 |
-
| 27 | STRING | 1 | tokenizer.ggml.model |
|
38 |
-
| 28 | STRING | 1 | tokenizer.ggml.pre |
|
39 |
-
| 29 | [STRING] | 32000 | tokenizer.ggml.tokens | [
|
40 |
-
| 30 | [FLOAT32] | 32000 | tokenizer.ggml.scores | [
|
41 |
-
| 31 | [INT32] | 32000 | tokenizer.ggml.token_type | [
|
42 |
| 32 | UINT32 | 1 | tokenizer.ggml.bos_token_id | 1 |
|
43 |
| 33 | UINT32 | 1 | tokenizer.ggml.eos_token_id | 2 |
|
44 |
| 34 | UINT32 | 1 | tokenizer.ggml.unknown_token_id | 0 |
|
|
|
11 |
| 1 | UINT32 | 1 | GGUF.version | 3 |
|
12 |
| 2 | UINT64 | 1 | GGUF.tensor_count | 75 |
|
13 |
| 3 | UINT64 | 1 | GGUF.kv_count | 33 |
|
14 |
+
| 4 | STRING | 1 | general.architecture | `llama` |
|
15 |
+
| 5 | STRING | 1 | general.type | `model` |
|
16 |
+
| 6 | STRING | 1 | general.name | `TinyLLama` |
|
17 |
+
| 7 | STRING | 1 | general.author | `Maykeye` |
|
18 |
+
| 8 | STRING | 1 | general.version | `v0.0` |
|
19 |
+
| 9 | STRING | 1 | general.description | `This gguf is ported from a fir`...`M but using Llama architecture` |
|
20 |
+
| 10 | STRING | 1 | general.quantized_by | `Mofosyne` |
|
21 |
+
| 11 | STRING | 1 | general.size_label | `4.6M` |
|
22 |
+
| 12 | STRING | 1 | general.license | `apache-2.0` |
|
23 |
+
| 13 | STRING | 1 | general.url | `https://huggingface.co/mofosyne/TinyLLama-v0-llamafile` |
|
24 |
+
| 14 | STRING | 1 | general.source.url | `https://huggingface.co/Maykeye/TinyLLama-v0` |
|
25 |
+
| 15 | [STRING] | 5 | general.tags | [ `text generation`, `transformer`, `llama`, `tiny`, `tiny model` ] |
|
26 |
+
| 16 | [STRING] | 1 | general.languages | [ `en` ] |
|
27 |
+
| 17 | [STRING] | 2 | general.datasets | [ `https://hugging`...`-GPT4-train.txt`, `https://hugging`...`-GPT4-valid.txt` ] |
|
28 |
| 18 | UINT32 | 1 | llama.block_count | 8 |
|
29 |
| 19 | UINT32 | 1 | llama.context_length | 2048 |
|
30 |
| 20 | UINT32 | 1 | llama.embedding_length | 64 |
|
|
|
34 |
| 24 | UINT32 | 1 | general.file_type | 1 |
|
35 |
| 25 | UINT32 | 1 | llama.vocab_size | 32000 |
|
36 |
| 26 | UINT32 | 1 | llama.rope.dimension_count | 4 |
|
37 |
+
| 27 | STRING | 1 | tokenizer.ggml.model | `llama` |
|
38 |
+
| 28 | STRING | 1 | tokenizer.ggml.pre | `default` |
|
39 |
+
| 29 | [STRING] | 32000 | tokenizer.ggml.tokens | [ `<unk>`, `<s>`, `</s>`, `<0x00>`, `<0x01>`, ... ] |
|
40 |
+
| 30 | [FLOAT32] | 32000 | tokenizer.ggml.scores | [ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, ... ] |
|
41 |
+
| 31 | [INT32] | 32000 | tokenizer.ggml.token_type | [ 2, 3, 3, 6, 6, 6, 6, ... ] |
|
42 |
| 32 | UINT32 | 1 | tokenizer.ggml.bos_token_id | 1 |
|
43 |
| 33 | UINT32 | 1 | tokenizer.ggml.eos_token_id | 2 |
|
44 |
| 34 | UINT32 | 1 | tokenizer.ggml.unknown_token_id | 0 |
|
llama.cpp
CHANGED
@@ -1 +1 @@
|
|
1 |
-
Subproject commit
|
|
|
1 |
+
Subproject commit c3776cacabce2ee35f172fb72be7a519752125fa
|
llamafile-creation.sh
CHANGED
@@ -6,7 +6,7 @@ METADATA_FILE="maykeye_tinyllama-metadata.json"
|
|
6 |
###############################################################################
|
7 |
# Pull both model folder, llamafile (for the engine) and llama.cpp (for the conversion script)
|
8 |
echo == Prep Environment ==
|
9 |
-
git submodule update --init
|
10 |
|
11 |
###############################################################################
|
12 |
echo == Build and prep the llamafile engine executable ==
|
@@ -37,6 +37,9 @@ echo == Convert from safetensor to gguf ==
|
|
37 |
./llama.cpp/convert_hf_to_gguf.py ${MODEL_DIR} --metadata ${METADATA_FILE} --outtype f16 --verbose
|
38 |
mv ${MODEL_DIR}/${OUTFILE}.gguf ${OUTFILE}.gguf
|
39 |
|
|
|
|
|
|
|
40 |
###############################################################################
|
41 |
echo == Generating Llamafile ==
|
42 |
cp ./llamafile/o/llama.cpp/main/main ${OUTFILE}.llamafile
|
@@ -53,7 +56,3 @@ EOF
|
|
53 |
###############################################################################
|
54 |
echo == Test Output ./${OUTFILE}.llamafile ==
|
55 |
./${OUTFILE}.llamafile --cli -p "hello world the gruff man said"
|
56 |
-
|
57 |
-
###############################################################################
|
58 |
-
echo == Useful GGUF Technical Dump ==
|
59 |
-
./llama.cpp/gguf-py/scripts/gguf_dump.py --markdown ${OUTFILE}.gguf > ${OUTFILE}.md
|
|
|
6 |
###############################################################################
|
7 |
# Pull both model folder, llamafile (for the engine) and llama.cpp (for the conversion script)
|
8 |
echo == Prep Environment ==
|
9 |
+
#git submodule update --init
|
10 |
|
11 |
###############################################################################
|
12 |
echo == Build and prep the llamafile engine executable ==
|
|
|
37 |
./llama.cpp/convert_hf_to_gguf.py ${MODEL_DIR} --metadata ${METADATA_FILE} --outtype f16 --verbose
|
38 |
mv ${MODEL_DIR}/${OUTFILE}.gguf ${OUTFILE}.gguf
|
39 |
|
40 |
+
# Generate Diagnostics Dumpfile
|
41 |
+
./llama.cpp/gguf-py/scripts/gguf_dump.py --markdown ${OUTFILE}.gguf > ${OUTFILE}.dump.md
|
42 |
+
|
43 |
###############################################################################
|
44 |
echo == Generating Llamafile ==
|
45 |
cp ./llamafile/o/llama.cpp/main/main ${OUTFILE}.llamafile
|
|
|
56 |
###############################################################################
|
57 |
echo == Test Output ./${OUTFILE}.llamafile ==
|
58 |
./${OUTFILE}.llamafile --cli -p "hello world the gruff man said"
|
|
|
|
|
|
|
|