File size: 609 Bytes
7585b58
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
#!/bin/sh
#
# Build and smoke-test a self-contained llamafile for the TinyLLama model:
#   1. fetch the git submodules (model folder and llama.cpp),
#   2. convert the model to GGUF with llama.cpp's convert.py,
#   3. copy the llamafile engine and embed the GGUF plus .args into it,
#   4. run the resulting executable.
#
# Run from the repository root: every path below is relative to the
# current working directory.

# Abort on the first failing step (-e) and on use of an unset variable (-u),
# so a failed conversion or copy can never lead to packaging or running a
# stale or incomplete artifact further down.
set -eu

# Base name shared by the generated .gguf and the final .llamafile.
model_name='TinyLLama-v0-5M-F16'

# Pull both the model folder and llama.cpp (for the conversion script)
git submodule update --init

# Convert from safetensors to GGUF
# (llama.cpp is expected as a subdirectory of the current directory)
./llama.cpp/convert.py maykeye_tinyllama --metadata maykeye_tinyllama-metadata.json

# Copy the generated GGUF from the model folder to this folder
cp "maykeye_tinyllama/${model_name}.gguf" "${model_name}.gguf"

# Get the llamafile engine; this copy becomes the final executable
cp /usr/local/bin/llamafile "${model_name}.llamafile"

# Combine: embed the GGUF and the .args file into the engine copy
# (see the llamafile documentation for the meaning of zipalign's -j0 flags)
zipalign -j0 \
  "${model_name}.llamafile" \
  "${model_name}.gguf" \
  .args

# Test: run the packaged llamafile
"./${model_name}.llamafile"