Spaces:

microsoft
/

phi-4-mini

Running

App Files Community

nguyenbh committed on Mar 12

Commit

7fc85f7

1 Parent(s): 692b3f2

Update app

Browse files

Files changed (1) hide show

app.py +19 -19

app.py CHANGED Viewed

@@ -1,20 +1,17 @@
 import os
 import gradio as gr
 from azure.ai.inference import ChatCompletionsClient
 from azure.core.credentials import AzureKeyCredential
 # Azure Inference setup
 url = os.getenv("Azure_Endpoint")
 api_key = AzureKeyCredential(os.getenv("Azure_API_KEY"))
 # Initialize the ChatCompletionsClient
-client = ChatCompletionsClient(
-    endpoint=url,
-    credential=api_key,
-    stream=True
-)
 # Get and print model information (optional)
 try:
@@ -46,32 +43,35 @@ def get_azure_response(message, chat_history, temperature, max_tokens, top_p, pr
     Function to get a response from the Azure Phi-4 model
     """
     # Prepare conversation history in the format expected by Azure
-    messages = [{"role": "system", "content": "You are a helpful AI assistant specialized in financial advice and planning."}]
     # Add conversation history
     for human, assistant in chat_history:
-        messages.append({"role": "user", "content": human})
-        if assistant:  # Only add non-empty assistant messages
-            messages.append({"role": "assistant", "content": assistant})
     # Add the current message
-    messages.append({"role": "user", "content": message})
-    # Prepare the payload
-    payload = {
-        "messages": messages,
         "max_tokens": max_tokens,
         "temperature": temperature,
         "top_p": top_p,
-        "presence_penalty": presence_penalty,
-        "frequency_penalty": frequency_penalty,
-        "stream": True
     }
     # Get response
     try:
         print("Sending request to Azure...")
-        response = client.complete(payload)
         return response
     except Exception as e:
         print(f"Error getting response: {str(e)}")

 import os
 import gradio as gr
 from azure.ai.inference import ChatCompletionsClient
+from azure.ai.inference.models import SystemMessage, UserMessage, AssistantMessage
 from azure.core.credentials import AzureKeyCredential
 # Azure Inference setup
 url = os.getenv("Azure_Endpoint")
 api_key = AzureKeyCredential(os.getenv("Azure_API_KEY"))
+model_name = os.getenv("Azure_Model_Name")
 # Initialize the ChatCompletionsClient
+client = ChatCompletionsClient(endpoint=url, credential=api_key, stream=True)
 # Get and print model information (optional)
 try:
     Function to get a response from the Azure Phi-4 model
     """
     # Prepare conversation history in the format expected by Azure
+    messages=[SystemMessage("You are a helpful AI assistant.")]
     # Add conversation history
     for human, assistant in chat_history:
+        messages.append(UserMessage(human))
+        if assistant:
+            messages.append(AssistantMessage(assistant))
     # Add the current message
+    messages.append(UserMessage(message))
+    # Prepare the model_extras
+    model_extras = {
         "max_tokens": max_tokens,
         "temperature": temperature,
         "top_p": top_p,
+        "presence_penalty": 0,
+        "frequency_penalty": 0,
     }
     # Get response
     try:
         print("Sending request to Azure...")
+        response = client.complete(
+            model=model_name,
+            messages=messages,
+            stream=True,
+            model_extras=model_extras
+        )
         return response
     except Exception as e:
         print(f"Error getting response: {str(e)}")