Spaces:
Build error
Build error
| from gptqmodel import GPTQModel | |
# Load the GPTQ-quantized checkpoint named below once, at import time;
# generate_response() reuses this single module-level `model` object.
# NOTE(review): the previous comment here named
# Qwen/Qwen2.5-0.5B-Instruct-GPTQ-Int4 (from modelscope), which does not match
# the id actually passed to GPTQModel.load -- confirm which model is intended.
model = GPTQModel.load(
    "TheBloke/Wizard-Vicuna-13B-Uncensored-SuperHOT-8K-GPTQ"
)
async def generate_response(input: str):
    """Generate a completion for ``input`` and return it decoded.

    Passes ``input`` to the module-level ``model``'s ``generate`` method,
    takes the first element of what it returns, and decodes that element with
    ``model.tokenizer.decode``.

    Args:
        input: Prompt handed unchanged to ``model.generate``. The name shadows
            the builtin but is part of the caller-visible signature.

    Returns:
        Whatever ``model.tokenizer.decode`` returns for the first generated
        sequence (presumably a ``str`` -- confirm against the tokenizer).
    """
    generated = model.generate(input)
    first_sequence = generated[0]
    decoded = model.tokenizer.decode(first_sequence)
    return decoded
| ############################################## | |
| from fastapi import FastAPI | |
| import uvicorn | |
# Application object; it is handed to uvicorn.run() under the __main__ guard.
app = FastAPI()
def greet_json():
    """Return the fixed greeting payload ``{"Hello": "World!"}``.

    A fresh dict is built on every call.

    NOTE(review): no route decorator is visible on this function in this view;
    confirm how (or whether) it is registered with ``app``.
    """
    greeting = {"Hello": "World!"}
    return greeting
async def message(input: str):
    """Return the decoded model reply for ``input``.

    Delegates to ``generate_response`` and awaits it, so the caller receives
    the decoded result itself rather than an un-awaited coroutine object
    (which is what returning the bare call would produce).

    Args:
        input: Prompt forwarded unchanged to ``generate_response``. The name
            shadows the builtin but is part of the caller-visible signature.

    Returns:
        The value produced by ``generate_response(input)``.

    NOTE(review): no route decorator is visible on this function in this view;
    confirm how (or whether) it is registered with ``app``.
    """
    return await generate_response(input)
if __name__ == "__main__":
    # Only start the server when this file is executed as a script, not when
    # it is imported. 0.0.0.0 binds every IPv4 interface; the port is 7860.
    uvicorn.run(
        app,
        host="0.0.0.0",
        port=7860,
    )