Thewhey-Brian
Fix HF download: download specific checkpoint file and fix permissions
b282fec
raw
history blame
2.77 kB
#!/usr/bin/env python3
"""
Hugging Face Spaces entry point for NanoChat.
This file is automatically detected and run by HF Spaces.
"""
import os
import sys
# Set environment variables for HF Spaces
os.environ.setdefault("NANOCHAT_BASE_DIR", "/data")
# Download model from HF if not present
def download_model():
"""Download model weights from Hugging Face."""
# Create all necessary directories
os.makedirs("/data/chatsft_checkpoints/d20", exist_ok=True)
os.makedirs("/data/.cache/huggingface", exist_ok=True)
checkpoint_path = "/data/chatsft_checkpoints/d20/model_000650.pt"
if os.path.exists(checkpoint_path):
print(f"Model checkpoint found at {checkpoint_path}, skipping download")
return
print("Downloading model checkpoint from BrianGuo/nanochat-d20-chat...")
from huggingface_hub import hf_hub_download
# Download the specific checkpoint file
hf_hub_download(
repo_id="BrianGuo/nanochat-d20-chat",
filename="chatsft_checkpoints/d20/model_000650.pt",
local_dir="/data",
local_dir_use_symlinks=False
)
print("Model downloaded successfully!")
def download_tokenizer():
"""Download tokenizer files from Hugging Face."""
tokenizer_dir = "/data/tokenizer"
if os.path.exists(tokenizer_dir) and os.listdir(tokenizer_dir):
print(f"Tokenizer found, skipping download")
return
print("Downloading tokenizer from BrianGuo/nanochat-d20-chat...")
from huggingface_hub import hf_hub_download
os.makedirs(tokenizer_dir, exist_ok=True)
# Download tokenizer files
hf_hub_download(
repo_id="BrianGuo/nanochat-d20-chat",
filename="tokenizer/token_bytes.pt",
local_dir="/data",
local_dir_use_symlinks=False
)
hf_hub_download(
repo_id="BrianGuo/nanochat-d20-chat",
filename="tokenizer/tokenizer.pkl",
local_dir="/data",
local_dir_use_symlinks=False
)
print("Tokenizer downloaded successfully!")
if __name__ == "__main__":
# Download model and tokenizer before starting
download_model()
download_tokenizer()
# Override sys.argv to pass default arguments for HF Spaces
sys.argv = [
"app.py",
"--port", "7860", # HF Spaces default port
"--host", "0.0.0.0",
"--source", "sft",
"--model-tag", os.environ.get("MODEL_TAG", "d20"),
"--step", os.environ.get("MODEL_STEP", "650"),
]
# Import and run the web server
from scripts.chat_web import app
import uvicorn
print("Starting NanoChat on Hugging Face Spaces...")
print(f"Model: {os.environ.get('MODEL_TAG', 'd20')} - Step: {os.environ.get('MODEL_STEP', '650')}")
uvicorn.run(app, host="0.0.0.0", port=7860)