SixOpen committed on
Commit
a06efca
1 Parent(s): 70cc07f
Files changed (5) hide show
  1. Dockerfile +2 -1
  2. app.py +1 -1
  3. groups_merged.txt +0 -0
  4. imatrix_calibration.txt +0 -3
  5. start.sh +4 -0
Dockerfile CHANGED
@@ -60,4 +60,5 @@ ENV PYTHONPATH=${HOME}/app \
60
  PATH=/usr/local/nvidia/bin:${PATH}
61
 
62
 
63
- ENTRYPOINT ["/bin/bash", "-c", "cd llama.cpp && LLAMA_CUDA=1 make -j quantize gguf-split imatrix && cd .. && /bin/sh start.sh"]
 
 
60
  PATH=/usr/local/nvidia/bin:${PATH}
61
 
62
 
63
+ ENTRYPOINT /bin/sh start.sh
64
+
app.py CHANGED
@@ -132,7 +132,7 @@ def process_model(model_id, q_method, use_imatrix, imatrix_q_method, private_rep
132
  if train_data_file:
133
  train_data_path = train_data_file.name
134
  else:
135
- train_data_path = "imatrix_calibration.txt"
136
 
137
  print(f"Training data file path: {train_data_path}")
138
 
 
132
  if train_data_file:
133
  train_data_path = train_data_file.name
134
  else:
135
+ train_data_path = "groups_merged.txt" #fallback calibration dataset
136
 
137
  print(f"Training data file path: {train_data_path}")
138
 
groups_merged.txt ADDED
The diff for this file is too large to render. See raw diff
 
imatrix_calibration.txt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:52062b7643edddbbc83435331ed1bc6ffc3eb463fae9df3551df52fb5638f0e8
3
- size 201119
 
 
 
 
start.sh CHANGED
@@ -1 +1,5 @@
 
 
 
 
1
  python app.py
 
1
+ cd llama.cpp
2
+ make -j quantize gguf-split imatrix
3
+
4
+ cd ..
5
  python app.py