Spaces: Running on A10G
Imatrix
Browse files
- Dockerfile +2 -1
- app.py +1 -1
- groups_merged.txt +0 -0
- start.sh +4 -0
Dockerfile
CHANGED
|
@@ -60,4 +60,5 @@ ENV PYTHONPATH=${HOME}/app \
|
|
| 60 |
PATH=/usr/local/nvidia/bin:${PATH}
|
| 61 |
|
| 62 |
|
| 63 |
-
ENTRYPOINT
|
|
|
|
|
|
| 60 |
PATH=/usr/local/nvidia/bin:${PATH}
|
| 61 |
|
| 62 |
|
| 63 |
+
ENTRYPOINT /bin/sh start.sh
|
| 64 |
+
|
app.py
CHANGED
|
@@ -132,7 +132,7 @@ def process_model(model_id, q_method, use_imatrix, imatrix_q_method, private_rep
|
|
| 132 |
if train_data_file:
|
| 133 |
train_data_path = train_data_file.name
|
| 134 |
else:
|
| 135 |
-
train_data_path = "
|
| 136 |
|
| 137 |
print(f"Training data file path: {train_data_path}")
|
| 138 |
|
|
|
|
| 132 |
if train_data_file:
|
| 133 |
train_data_path = train_data_file.name
|
| 134 |
else:
|
| 135 |
+
train_data_path = "groups_merged.txt" #fallback calibration dataset
|
| 136 |
|
| 137 |
print(f"Training data file path: {train_data_path}")
|
| 138 |
|
groups_merged.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
start.sh
CHANGED
|
@@ -1 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
python app.py
|
|
|
|
| 1 |
+
cd llama.cpp
|
| 2 |
+
make -j quantize gguf-split imatrix
|
| 3 |
+
|
| 4 |
+
cd ..
|
| 5 |
python app.py
|