Spaces:

Intel
/

intel-ai-enterprise-inference

Running

App Files Files Community

Benjamin Consolvo committed on Feb 25

Commit

8fced99

1 Parent(s): cbc7aa1

initial files test

Browse files

Files changed (3) hide show

app.py +73 -0
model_info.json +17 -0
requirements.txt +2 -0

app.py ADDED Viewed

	@@ -0,0 +1,73 @@

+# ©2024 Intel Corporation
+# Permission is granted for recipient to internally use and modify this software for purposes of benchmarking and testing on Intel architectures.
+# This software is provided "AS IS" possibly with faults, bugs or errors; it is not intended for production use, and recipient uses this design at their own risk with no liability to Intel.
+# Intel disclaims all warranties, express or implied, including warranties of merchantability, fitness for a particular purpose, and non-infringement.
+# Recipient agrees that any feedback it provides to Intel about this software is licensed to Intel for any purpose worldwide. No permission is granted to use Intel’s trademarks.
+# The above copyright notice and this permission notice shall be included in all copies or substantial portions of the code.
+# Import necessary libraries
+import streamlit as st
+import os
+from openai import OpenAI
+import json
+working_dir = os.path.dirname(os.path.abspath(__file__))
+endpoint_data = json.load(open(f"{working_dir}/model_info.json"))
+def clear_chat():
+    st.session_state.messages = []
+st.title("Chat Bot")
+# Extract the keys (model names) from the JSON data
+model_names = list(endpoint_data.keys())
+with st.sidebar:
+    modelname = st.selectbox("Select a LLM model (Hosted by DENVR DATAWORKS) ", model_names)
+    st.write(f"You selected: {modelname}")
+    st.button("Start New Chat", on_click=clear_chat)
+endpoint = endpoint_data[modelname]
+api_key=os.environ.get('API_KEY')
+if not api_key:
+    st.info("Please add your OpenAI API key to continue.")
+    st.stop()
+base_url = endpoint
+client = OpenAI(api_key=api_key, base_url=base_url)
+# Extract the model name
+models = client.models.list()
+modelname = models.data[0].id
+if "messages" not in st.session_state:
+    st.session_state.messages = []
+for message in st.session_state.messages:
+    with st.chat_message(message["role"]):
+        st.markdown(message["content"])
+if prompt := st.chat_input("What is up?"):
+    st.session_state.messages.append({"role": "user", "content": prompt})
+    with st.chat_message("user"):
+        st.markdown(prompt)
+    with st.chat_message("assistant"):
+        stream = client.chat.completions.create(
+            model=modelname,
+            messages=[
+                {"role": m["role"], "content": m["content"]}
+                for m in st.session_state.messages
+            ],
+            max_tokens=5000,
+            stream=True,
+        )
+        response = st.write_stream(stream)
+    st.session_state.messages.append({"role": "assistant", "content": response})

model_info.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+    "Meta-Llama-3.1-70B-Instruct": "https://inference-api.cloud.denvrdata.com/Meta-Llama-3.1-70B-Instruct/v1/",
+    "Meta-Llama-3.1-8B-Instruct": "https://inference-api.cloud.denvrdata.com/Meta-Llama-3.1-8B-Instruct/v1/",
+    "CodeLlama-34b-Instruct-hf": "https://inference-api.cloud.denvrdata.com/CodeLlama-34b-Instruct/v1/",
+    "Mistral-7B-Instruct-v0.3": "https://inference-api.cloud.denvrdata.com/Mistral-7B-Instruct/v1/",
+    "Mixtral-8x7B-Instruct-v0.1": "https://inference-api.cloud.denvrdata.com/Mixtral-7B-Instruct/v1/",
+    "DENVR: tiiuae/Falcon3-7B-Instruct": "https://inference-api.cloud.denvrdata.com/Falcon3-7B-Instruct/v1/",
+    "DENVR: meta-Llama-3.3-70B-Instruct": "https://inference-api.cloud.denvrdata.com/Llama-3.3-70B-Instruct/v1/",
+    "DENVR: meta-llama/Meta-Llama-3.1-70B-Instruct": "https://inference-api.cloud.denvrdata.com/Meta-Llama-3.1-70B-Instruct/v1/",
+    "DENVR: meta-llama/Meta-Llama-3.1-8B-Instruct": "https://inference-api.cloud.denvrdata.com/Meta-Llama-3.1-8B-Instruct/v1/",
+    "DENVR: codellama/CodeLlama-34b-Instruct-hf": "https://inference-api.cloud.denvrdata.com/CodeLlama-34b-Instruct/v1/",
+    "DENVR: mistralai/Mistral-7B-Instruct-v0.3": "https://inference-api.cloud.denvrdata.com/Mistral-7B-Instruct/v1/",
+    "DENVR: mistralai/Mixtral-8x7B-Instruct-v0.1": "https://inference-api.cloud.denvrdata.com/Mixtral-7B-Instruct/v1/",
+    "DENVR: tiiuae/Falcon3-7B-Instruct": "https://inference-api.cloud.denvrdata.com/Falcon3-7B-Instruct/v1/",
+    "DENVR: deepseek-ai/DeepSeek-R1-Distill-Llama-8B": "https://inference-api.cloud.denvrdata.com/DeepSeek-R1-Distill-Llama-8B/v1/",
+    "DENVR: deepseek-ai/DeepSeek-R1-Distill-Llama-70B": "https://inference-api.cloud.denvrdata.com/DeepSeek-R1-Distill-Llama-70B/v1"
+}

requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ streamlit
2	+ openai