scratch_chat_assisstance_2

Running

App Files Files Community

WebashalarForML committed on Oct 3

Commit

ffd1ea4

verified ·

1 Parent(s): 4d9fce0

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -80

app.py CHANGED Viewed

@@ -44,9 +44,9 @@ CORS(app)
 # --- LLM setup ---
 # Using a model that's good for coding tasks
 llm = ChatGroq(
-    model=os.getenv("LLM_MODEL", "mixtral-8x7b-32768"), # Changed to a coding-friendly model
-    temperature=0.1, # Slightly less creative than general chat
-    max_tokens=2048, # Increased token limit for code
     api_key=GROQ_API_KEY,
 )
@@ -74,34 +74,31 @@ Rules:
 """
 def extract_json_from_llm_response(raw_response: str) -> dict:
-    # Helper function remains largely the same, adapted for new keys
     default = {
         "assistant_reply": "I'm sorry — I couldn't understand that. Could you please rephrase?",
         "state_updates": {},
         "suggested_tags": [],
     }
-    # ... [JSON parsing logic remains similar] ...
     if not raw_response or not isinstance(raw_response, str):
         return default
     m = re.search(r"```(?:json)?\s*([\s\S]*?)\s*```", raw_response)
     json_string = m.group(1).strip() if m else raw_response
     first = json_string.find('{')
     last = json_string.rfind('}')
-    if first == -1 or last == -1 or first >= last:
-        try:
-            return json.loads(json_string)
-        except Exception:
-            logger.warning("Could not locate JSON braces in LLM output. Falling back to default.")
-            return default
-    candidate = json_string[first:last+1]
     candidate = re.sub(r',\s*(?=[}\]])', '', candidate)
     try:
         parsed = json.loads(candidate)
     except Exception as e:
-        logger.warning("Failed to parse JSON from LLM output: %s", e)
         return default
-    # Validation for new keys
     if isinstance(parsed, dict) and "assistant_reply" in parsed and isinstance(parsed["assistant_reply"], str) and parsed["assistant_reply"].strip():
         parsed.setdefault("state_updates", {})
         parsed.setdefault("suggested_tags", [])
@@ -114,13 +111,10 @@ def extract_json_from_llm_response(raw_response: str) -> dict:
 @app.route("/", methods=["GET"])
 def serve_frontend():
     try:
-        # Assuming you will update frontend.html for the new assistant
         return app.send_static_file("frontend.html")
     except Exception:
         return "<h3>frontend.html not found in static/ — please add your frontend.html there.</h3>", 404
-# UPLOAD routes are removed as they are no longer needed.
 @app.route("/chat", methods=["POST"])
 def chat():
     data = request.get_json(force=True)
@@ -128,36 +122,30 @@ def chat():
         return jsonify({"error": "invalid request body"}), 400
     chat_history: List[Dict[str, str]] = data.get("chat_history") or []
-    # Using 'assistant_state' to clearly separate from old patient_state
     assistant_state: AssistantState = data.get("assistant_state") or {}
-    # Initialize/Clean up state
     state: AssistantState = {
         "conversationSummary": assistant_state.get("conversationSummary", ""),
         "lastUserMessage": "",
-        "language": assistant_state.get("language", "Python"), # Default to Python
         "taggedReplies": assistant_state.get("taggedReplies", []),
     }
-    # Find the last user message
     for msg in reversed(chat_history):
         if msg.get("role") == "user" and msg.get("content"):
             state["lastUserMessage"] = msg["content"]
             break
-    # --- Language Detection (Simple check for common programming languages) ---
     last_msg_lower = state["lastUserMessage"].lower()
     known_languages = ["python", "javascript", "java", "c++", "c#", "go", "ruby", "php", "typescript", "swift"]
-    # A simple regex to detect a language mention in the last message
     lang_match = re.search(r'\b(in|using|for)\s+(' + '|'.join(known_languages) + r')\b', last_msg_lower)
     if lang_match:
         detected_lang = lang_match.group(2).capitalize()
-        if detected_lang != state["language"]:
             logger.info("Detected new language: %s", detected_lang)
             state["language"] = detected_lang
-    # --- LLM Prompt Construction ---
     action_hint = ""
     if state["language"]:
         action_hint = f"Focus your answer on the {state['language']} programming language. If the user asks a conceptual question, use {state['language']} for examples."
@@ -165,7 +153,7 @@ def chat():
         action_hint = "The current language is unknown. Please ask the user to specify the programming language they are working in."
     user_prompt = f"""
-Current State: {json.dumps({"language": state["language"], "summary": state["conversationSummary"]})}
 Last user message: {state["lastUserMessage"]}
 SYSTEM_HINT: {action_hint}
@@ -190,10 +178,8 @@ Return ONLY valid JSON with keys: assistant_reply, state_updates, suggested_tags
         logger.exception("LLM invocation failed")
         return jsonify({"error": "LLM invocation failed", "detail": str(e)}), 500
-    # --- State Update from LLM ---
     updated_state_from_llm = parsed_result.get("state_updates", {})
-    # Update state fields that the LLM is allowed to modify
     if 'conversationSummary' in updated_state_from_llm:
         state["conversationSummary"] = updated_state_from_llm["conversationSummary"]
     if 'language' in updated_state_from_llm:
@@ -203,16 +189,14 @@ Return ONLY valid JSON with keys: assistant_reply, state_updates, suggested_tags
     if not assistant_reply or not isinstance(assistant_reply, str) or not assistant_reply.strip():
         assistant_reply = "I'm here to help with your code! What programming language are you using?"
-    # --- Final Response Payload ---
     response_payload = {
         "assistant_reply": assistant_reply,
         "updated_state": state,
-        "suggested_tags": parsed_result.get("suggested_tags", []), # Pass tags to frontend
     }
     return jsonify(response_payload)
-# --- New Route for Tagging/Bookmarking Replies ---
 @app.route("/tag_reply", methods=["POST"])
 def tag_reply():
     data = request.get_json(force=True)
@@ -226,12 +210,10 @@ def tag_reply():
     if not reply_content or not tags:
         return jsonify({"error": "Missing 'reply' or 'tags' in request"}), 400
-    # Ensure tags is a list of strings
     tags = [str(t).strip() for t in tags if str(t).strip()]
     if not tags:
         return jsonify({"error": "Tags list cannot be empty"}), 400
-    # Clean up state dictionary
     state: AssistantState = {
         "conversationSummary": assistant_state.get("conversationSummary", ""),
         "lastUserMessage": "",
@@ -244,7 +226,6 @@ def tag_reply():
         "tags": tags,
     }
-    # Add the new tagged reply
     state["taggedReplies"].append(new_tagged_reply)
     logger.info("Reply tagged with: %s", tags)
@@ -254,55 +235,10 @@ def tag_reply():
         "updated_state": state,
     }), 200
-# --- Filtering/Search Route for Bookmarked Replies ---
-@app.route("/search_tags", methods=["GET"])
-def search_tags():
-    tag_query = request.args.get("tag")
-    # Using POST for /chat, so we'll pass state in the body
-    # For a simple GET search, we'd need the state to be sent here,
-    # but for simplicity, let's assume the state is passed in a POST body
-    # or fetched/maintained on the frontend and this route is just for logic.
-    # Assuming the frontend sends the current state via a POST request for search
-    if request.method == "GET":
-        return jsonify({"error": "Please use POST and include 'assistant_state' in the body for tag search."}), 405
-    # If using POST, you'd process request.get_json() here to get assistant_state
-    # For now, let's stick to the simpler GET and assume the frontend handles the state.
-    # To demonstrate the filtering logic:
-    # --- DUMMY STATE FOR DEMO ---
-    dummy_state: AssistantState = {
-        "conversationSummary": "",
-        "lastUserMessage": "",
-        "language": "Python",
-        "taggedReplies": [
-            {"reply": "A Python loop example.", "tags": ["Python", "Loop Concept"]},
-            {"reply": "Fix for 'undefined' error in JS.", "tags": ["JavaScript", "Debugging"]},
-            {"reply": "Explanation of Polymorphism.", "tags": ["Java", "OOP"]},
-        ],
-    }
-    if not tag_query:
-        # Return all tagged replies if no query
-        return jsonify({"tag_query": "", "results": dummy_state["taggedReplies"]}), 200
-    tag_query_lower = tag_query.lower()
-    filtered_results = [
-        reply for reply in dummy_state["taggedReplies"]
-        if any(tag_query_lower in tag.lower() for tag in reply["tags"])
-    ]
-    return jsonify({
-        "tag_query": tag_query,
-        "results": filtered_results
-    }), 200
 @app.route("/ping", methods=["GET"])
 def ping():
     """Answer GET /ping with the constant JSON body ``{"status": "ok"}``."""
     health_payload = {"status": "ok"}
     return jsonify(health_payload)
 if __name__ == "__main__":
     port = int(os.getenv("PORT", 7860))
-    app.run(host="0.0.0.0", port=port, debug=True)

 # --- LLM setup ---
 # Using a model that's good for coding tasks
 llm = ChatGroq(
+    model=os.getenv("LLM_MODEL", "meta-llama/llama-4-scout-17b-16e-instruct"), # Use the supported model
+    temperature=0.1,
+    max_tokens=2048,
     api_key=GROQ_API_KEY,
 )
 """
 def extract_json_from_llm_response(raw_response: str) -> dict:
     default = {
         "assistant_reply": "I'm sorry — I couldn't understand that. Could you please rephrase?",
         "state_updates": {},
         "suggested_tags": [],
     }
     if not raw_response or not isinstance(raw_response, str):
         return default
     m = re.search(r"```(?:json)?\s*([\s\S]*?)\s*```", raw_response)
     json_string = m.group(1).strip() if m else raw_response
     first = json_string.find('{')
     last = json_string.rfind('}')
+    if first != -1 and last != -1 and first < last:
+        candidate = json_string[first:last+1]
+    else:
+        candidate = json_string # Fallback to the whole string if braces aren't clear
     candidate = re.sub(r',\s*(?=[}\]])', '', candidate)
     try:
         parsed = json.loads(candidate)
     except Exception as e:
+        logger.warning("Failed to parse JSON from LLM output: %s. Raw candidate: %s", e, candidate)
         return default
     if isinstance(parsed, dict) and "assistant_reply" in parsed and isinstance(parsed["assistant_reply"], str) and parsed["assistant_reply"].strip():
         parsed.setdefault("state_updates", {})
         parsed.setdefault("suggested_tags", [])
 @app.route("/", methods=["GET"])
 def serve_frontend():
     """Serve ``frontend.html`` from the app's static files at the root URL.

     Returns the static-file response, or an HTML notice with status 404
     when sending the file raises any exception.
     """
     try:
         page = app.send_static_file("frontend.html")
     except Exception:
         # Any failure while sending the file is reported to the client as 404.
         missing_notice = "<h3>frontend.html not found in static/ — please add your frontend.html there.</h3>"
         return missing_notice, 404
     return page
 @app.route("/chat", methods=["POST"])
 def chat():
     data = request.get_json(force=True)
         return jsonify({"error": "invalid request body"}), 400
     chat_history: List[Dict[str, str]] = data.get("chat_history") or []
     assistant_state: AssistantState = data.get("assistant_state") or {}
     state: AssistantState = {
         "conversationSummary": assistant_state.get("conversationSummary", ""),
         "lastUserMessage": "",
+        "language": assistant_state.get("language", "Python"),
         "taggedReplies": assistant_state.get("taggedReplies", []),
     }
     for msg in reversed(chat_history):
         if msg.get("role") == "user" and msg.get("content"):
             state["lastUserMessage"] = msg["content"]
             break
     last_msg_lower = state["lastUserMessage"].lower()
     known_languages = ["python", "javascript", "java", "c++", "c#", "go", "ruby", "php", "typescript", "swift"]
     lang_match = re.search(r'\b(in|using|for)\s+(' + '|'.join(known_languages) + r')\b', last_msg_lower)
     if lang_match:
         detected_lang = lang_match.group(2).capitalize()
+        if detected_lang.lower() != state["language"].lower():
             logger.info("Detected new language: %s", detected_lang)
             state["language"] = detected_lang
     action_hint = ""
     if state["language"]:
         action_hint = f"Focus your answer on the {state['language']} programming language. If the user asks a conceptual question, use {state['language']} for examples."
         action_hint = "The current language is unknown. Please ask the user to specify the programming language they are working in."
     user_prompt = f"""
+Current State: {json.dumps({"language": state["language"], "summary": state["conversationSummary"][:200]})}
 Last user message: {state["lastUserMessage"]}
 SYSTEM_HINT: {action_hint}
         logger.exception("LLM invocation failed")
         return jsonify({"error": "LLM invocation failed", "detail": str(e)}), 500
     updated_state_from_llm = parsed_result.get("state_updates", {})
     if 'conversationSummary' in updated_state_from_llm:
         state["conversationSummary"] = updated_state_from_llm["conversationSummary"]
     if 'language' in updated_state_from_llm:
     if not assistant_reply or not isinstance(assistant_reply, str) or not assistant_reply.strip():
         assistant_reply = "I'm here to help with your code! What programming language are you using?"
     response_payload = {
         "assistant_reply": assistant_reply,
         "updated_state": state,
+        "suggested_tags": parsed_result.get("suggested_tags", []),
     }
     return jsonify(response_payload)
 @app.route("/tag_reply", methods=["POST"])
 def tag_reply():
     data = request.get_json(force=True)
     if not reply_content or not tags:
         return jsonify({"error": "Missing 'reply' or 'tags' in request"}), 400
     tags = [str(t).strip() for t in tags if str(t).strip()]
     if not tags:
         return jsonify({"error": "Tags list cannot be empty"}), 400
     state: AssistantState = {
         "conversationSummary": assistant_state.get("conversationSummary", ""),
         "lastUserMessage": "",
         "tags": tags,
     }
     state["taggedReplies"].append(new_tagged_reply)
     logger.info("Reply tagged with: %s", tags)
         "updated_state": state,
     }), 200
 @app.route("/ping", methods=["GET"])
 def ping():
     """Answer GET /ping with the constant JSON body ``{"status": "ok"}``."""
     health_payload = {"status": "ok"}
     return jsonify(health_payload)
 if __name__ == "__main__":
     port = int(os.getenv("PORT", 7860))
+    app.run(host="0.0.0.0", port=port, debug=True)