Update server.py
Browse files
server.py
CHANGED
|
@@ -24,14 +24,17 @@ def base():
|
|
| 24 |
|
| 25 |
prefix_prompt="""<s>[INST]Summarize the following transcript[/INST]\n"""
|
| 26 |
suffix_prompt="""\n"""
|
|
|
|
|
|
|
|
|
|
| 27 |
@app.post("/llm")
|
| 28 |
async def main(request: Request):
|
| 29 |
input_json = await request.json()
|
| 30 |
print(input_json)
|
| 31 |
final_prompt = prefix_prompt + str(input_json["prompt"]) + suffix_prompt
|
| 32 |
resp = requests.post(
|
| 33 |
-
|
| 34 |
-
headers={"Authorization": "Api-Key
|
| 35 |
json={'prompt': final_prompt ,'temperature': 0.001, 'max_new_tokens': 100, 'repetition_penalty':1.2},
|
| 36 |
)
|
| 37 |
llm_response = resp.json()
|
|
|
|
| 24 |
|
| 25 |
prefix_prompt="""<s>[INST]Summarize the following transcript[/INST]\n"""
|
| 26 |
suffix_prompt="""\n"""
|
| 27 |
+
import os
|
| 28 |
+
baseten_url = os.getenv("BASETEN_URL")
|
| 29 |
+
baseten_key = os.getenv("BASETEN_KEY")
|
| 30 |
@app.post("/llm")
|
| 31 |
async def main(request: Request):
|
| 32 |
input_json = await request.json()
|
| 33 |
print(input_json)
|
| 34 |
final_prompt = prefix_prompt + str(input_json["prompt"]) + suffix_prompt
|
| 35 |
resp = requests.post(
|
| 36 |
+
baseten_url,
|
| 37 |
+
headers={"Authorization": f"Api-Key {baseten_key}"},
|
| 38 |
json={'prompt': final_prompt ,'temperature': 0.001, 'max_new_tokens': 100, 'repetition_penalty':1.2},
|
| 39 |
)
|
| 40 |
llm_response = resp.json()
|