Spaces: Running on A10G
Imatrix
Browse files
- Dockerfile +2 -1
- app.py +1 -1
- groups_merged.txt +0 -0
- imatrix_calibration.txt +0 -3
- start.sh +4 -0
Dockerfile
CHANGED
@@ -60,4 +60,5 @@ ENV PYTHONPATH=${HOME}/app \
|
|
60 |
PATH=/usr/local/nvidia/bin:${PATH}
|
61 |
|
62 |
|
63 |
-
ENTRYPOINT
|
|
|
|
60 |
PATH=/usr/local/nvidia/bin:${PATH}
|
61 |
|
62 |
|
63 |
+
ENTRYPOINT /bin/sh start.sh
|
64 |
+
|
app.py
CHANGED
@@ -132,7 +132,7 @@ def process_model(model_id, q_method, use_imatrix, imatrix_q_method, private_rep
|
|
132 |
if train_data_file:
|
133 |
train_data_path = train_data_file.name
|
134 |
else:
|
135 |
-
train_data_path = "
|
136 |
|
137 |
print(f"Training data file path: {train_data_path}")
|
138 |
|
|
|
132 |
if train_data_file:
|
133 |
train_data_path = train_data_file.name
|
134 |
else:
|
135 |
+
train_data_path = "groups_merged.txt" #fallback calibration dataset
|
136 |
|
137 |
print(f"Training data file path: {train_data_path}")
|
138 |
|
groups_merged.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
imatrix_calibration.txt
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:52062b7643edddbbc83435331ed1bc6ffc3eb463fae9df3551df52fb5638f0e8
|
3 |
-
size 201119
|
|
|
|
|
|
|
|
start.sh
CHANGED
@@ -1 +1,5 @@
|
|
|
|
|
|
|
|
|
|
1 |
python app.py
|
|
|
1 |
+
cd llama.cpp
|
2 |
+
make -j quantize gguf-split imatrix
|
3 |
+
|
4 |
+
cd ..
|
5 |
python app.py
|