ajaykumarr committed on
Commit
72e4d27
·
verified ·
1 Parent(s): 4b33e3e

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +24 -0
app.py ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer
3
+ from fastapi import FastAPI, Request
4
+ from pydantic import BaseModel
5
+ import uvicorn
6
+
7
# Application object; the route decorator further down registers on it.
app = FastAPI()

# Hub identifier shared by the tokenizer and the model so the two always
# come from the same checkpoint.
model_name = "meta-llama/Meta-Llama-3.1-405B"
tokenizer = AutoTokenizer.from_pretrained(model_name)
# NOTE(review): no dtype or device arguments are passed here, so the
# library defaults apply. Confirm the host has enough memory for this
# checkpoint before deploying.
model = AutoModelForCausalLM.from_pretrained(model_name)
12
+
13
class Query(BaseModel):
    """Request body accepted by the ``/generate`` endpoint."""

    # Prompt text that is tokenized and handed to the model.
    inputs: str
15
+
16
@app.post("/generate")
async def generate(query: Query):
    """Generate text for the prompt carried in ``query.inputs``.

    The prompt is tokenized into PyTorch tensors, passed to the
    module-level ``model``, and the first returned sequence is decoded
    with special tokens stripped.

    Args:
        query: Request body whose ``inputs`` field holds the prompt text.

    Returns:
        A dict with the single key ``"generated_text"`` mapping to the
        decoded string.
    """
    # Imported locally so the handler does not rely on a change to the
    # file's top-level import block.
    import asyncio

    encoded = tokenizer(query.inputs, return_tensors="pt")

    def _run_generation():
        # Unpack the whole encoding so the attention mask produced by the
        # tokenizer reaches the model, not just the input ids.
        return model.generate(**encoded)

    # model.generate() is a long, blocking call. Running it directly in
    # this coroutine would freeze the event loop (and every other request)
    # until it finishes, so it is handed to the default executor instead.
    loop = asyncio.get_running_loop()
    outputs = await loop.run_in_executor(None, _run_generation)

    response = tokenizer.decode(outputs[0], skip_special_tokens=True)
    return {"generated_text": response}
22
+
23
# Start the server only when this file is executed as a script, not when
# it is imported as a module.
if __name__ == "__main__":
    uvicorn.run(
        app,
        host="0.0.0.0",
        port=8000,
    )