aryo100 committed on
Commit
c2609dd
·
1 Parent(s): 28de333

update app

Browse files
Files changed (1) hide show
  1. app.py +9 -1
app.py CHANGED
@@ -2,6 +2,9 @@ from fastapi import FastAPI
2
  from pydantic import BaseModel
3
  from transformers import AutoModelForCausalLM, AutoTokenizer
4
  import torch
 
 
 
5
 
6
  app = FastAPI()
7
 
@@ -11,7 +14,8 @@ tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, trust_remote_code=True)
11
  model = AutoModelForCausalLM.from_pretrained(
12
  MODEL_NAME,
13
  torch_dtype=torch.float16,
14
- device_map="auto"
 
15
  )
16
 
17
  # Request schema
@@ -46,3 +50,7 @@ def chat(req: ChatRequest):
46
  @app.get("/")
47
  def root():
48
  return {"message": "Qwen FastAPI running 🚀"}
 
 
 
 
 
2
  from pydantic import BaseModel
3
  from transformers import AutoModelForCausalLM, AutoTokenizer
4
  import torch
5
+ import os
6
+ import uvicorn
7
+
8
 
9
  app = FastAPI()
10
 
 
14
  model = AutoModelForCausalLM.from_pretrained(
15
  MODEL_NAME,
16
  torch_dtype=torch.float16,
17
+ device_map="auto",
18
+ trust_remote_code=True,
19
  )
20
 
21
  # Request schema
 
50
  @app.get("/")
51
  def root():
52
  return {"message": "Qwen FastAPI running 🚀"}
53
+
54
+ if __name__ == "__main__":
55
+ port = int(os.environ.get("PORT", 7860))
56
+ uvicorn.run("app:app", host="0.0.0.0", port=port)