Spaces:
Running
Running
Apply quant method
Browse files
app.py
CHANGED
|
@@ -21,6 +21,12 @@ from mlx_lm import convert
|
|
| 21 |
|
| 22 |
HF_TOKEN = os.environ.get("HF_TOKEN")
|
| 23 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
def clear_hf_cache_space():
|
| 25 |
scan = scan_cache_dir()
|
| 26 |
to_delete = []
|
|
@@ -83,17 +89,14 @@ def process_model(model_id, q_method, oauth_token: gr.OAuthToken | None):
|
|
| 83 |
raise ValueError("You must be logged in to use MLX-my-repo")
|
| 84 |
|
| 85 |
model_name = model_id.split('/')[-1]
|
| 86 |
-
print(model_name)
|
| 87 |
username = whoami(oauth_token.token)["name"]
|
| 88 |
-
print(username)
|
| 89 |
-
|
| 90 |
try:
|
| 91 |
-
upload_repo = username
|
| 92 |
print(upload_repo)
|
| 93 |
with tempfile.TemporaryDirectory(dir="converted") as tmpdir:
|
| 94 |
# The target dir must not exist
|
| 95 |
mlx_path = os.path.join(tmpdir, "mlx")
|
| 96 |
-
convert(model_id, mlx_path=mlx_path, quantize=True)
|
| 97 |
print("Conversion done")
|
| 98 |
upload_to_hub(path=mlx_path, upload_repo=upload_repo, hf_path=model_id, token=oauth_token.token)
|
| 99 |
print("Upload done")
|
|
|
|
| 21 |
|
| 22 |
HF_TOKEN = os.environ.get("HF_TOKEN")
|
| 23 |
|
| 24 |
+
# Maps each quantization method label to the bit width passed to convert() as q_bits; unclear whether more methods need to be added here.
|
| 25 |
+
QUANT_PARAMS = {
|
| 26 |
+
"Q4": 4,
|
| 27 |
+
"Q8": 8,
|
| 28 |
+
}
|
| 29 |
+
|
| 30 |
def clear_hf_cache_space():
|
| 31 |
scan = scan_cache_dir()
|
| 32 |
to_delete = []
|
|
|
|
| 89 |
raise ValueError("You must be logged in to use MLX-my-repo")
|
| 90 |
|
| 91 |
model_name = model_id.split('/')[-1]
|
|
|
|
| 92 |
username = whoami(oauth_token.token)["name"]
|
|
|
|
|
|
|
| 93 |
try:
|
| 94 |
+
upload_repo = f"{username}/{model_name}-{q_method}-mlx"
|
| 95 |
print(upload_repo)
|
| 96 |
with tempfile.TemporaryDirectory(dir="converted") as tmpdir:
|
| 97 |
# The target dir must not exist
|
| 98 |
mlx_path = os.path.join(tmpdir, "mlx")
|
| 99 |
+
convert(model_id, mlx_path=mlx_path, quantize=True, q_bits=QUANT_PARAMS[q_method])
|
| 100 |
print("Conversion done")
|
| 101 |
upload_to_hub(path=mlx_path, upload_repo=upload_repo, hf_path=model_id, token=oauth_token.token)
|
| 102 |
print("Upload done")
|