Spaces:
Runtime error
Runtime error
Feature(MInference): add zeroGPU
Browse files
app.py
CHANGED
|
@@ -73,7 +73,7 @@ if torch.cuda.is_available() and _is_package_available("pycuda"):
|
|
| 73 |
terminators = [tokenizer.eos_token_id, tokenizer.convert_tokens_to_ids("<|eot_id|>")]
|
| 74 |
|
| 75 |
|
| 76 |
-
|
| 77 |
def chat_llama3_8b(
|
| 78 |
message: str, history: list, temperature: float, max_new_tokens: int
|
| 79 |
) -> str:
|
|
|
|
| 73 |
terminators = [tokenizer.eos_token_id, tokenizer.convert_tokens_to_ids("<|eot_id|>")]
|
| 74 |
|
| 75 |
|
| 76 |
+ @spaces.GPU(duration=120)
|
| 77 |
def chat_llama3_8b(
|
| 78 |
message: str, history: list, temperature: float, max_new_tokens: int
|
| 79 |
) -> str:
|