Spaces: Wonderplex
Commit 237ffdd · Parent(s): a3f9a2a
added parsing error check (#41)
app.py
CHANGED
@@ -16,7 +16,7 @@ from utils import Agent, format_sotopia_prompt, get_starter_prompt, format_bot_m
 from functools import cache
 
 DEPLOYED = os.getenv("DEPLOYED", "true").lower() == "true"
-DEFAULT_MODEL_SELECTION = "cmu-lti/sotopia-pi-mistral-7b-BC_SR"
+DEFAULT_MODEL_SELECTION = "cmu-lti/sotopia-pi-mistral-7b-BC_SR"  # "mistralai/Mistral-7B-Instruct-v0.1"
 
 def prepare_sotopia_info():
     human_agent = Agent(
@@ -59,6 +59,13 @@ def prepare(model_name):
         )
         tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
         model = PeftModel.from_pretrained(model, model_name).to("cuda")
+    elif 'mistralai/Mistral-7B-Instruct-v0.1' in model_name:
+        model = AutoModelForCausalLM.from_pretrained(
+            "mistralai/Mistral-7B-Instruct-v0.1",
+            cache_dir="./.cache",
+            device_map='cuda',
+        )
+        tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
     else:
         raise RuntimeError(f"Model {model_name} not supported")
     return model, tokenizer
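For orientation, the new elif branch slots into prepare() beside the existing adapter path. Below is a minimal reconstruction of the whole function from the hunk's context lines; the opening of the first branch is not shown in the diff, so its condition and call arguments are assumptions, not part of this commit.

from transformers import AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

def prepare(model_name):
    # Assumed first branch: the diff only shows its closing lines, where the
    # PEFT adapter named by model_name is applied on top of the Mistral base.
    if model_name == "cmu-lti/sotopia-pi-mistral-7b-BC_SR":
        model = AutoModelForCausalLM.from_pretrained(
            "mistralai/Mistral-7B-Instruct-v0.1",
            cache_dir="./.cache",
        )
        tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
        model = PeftModel.from_pretrained(model, model_name).to("cuda")
    elif 'mistralai/Mistral-7B-Instruct-v0.1' in model_name:
        # Added by this commit: serve the base instruct model with no adapter.
        model = AutoModelForCausalLM.from_pretrained(
            "mistralai/Mistral-7B-Instruct-v0.1",
            cache_dir="./.cache",
            device_map='cuda',
        )
        tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
    else:
        raise RuntimeError(f"Model {model_name} not supported")
    return model, tokenizer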
@@ -107,13 +114,15 @@ def param_accordion(according_visible=True):
         interactive=True,
         label="Max Tokens",
     )
-
-
-
-
-
+    top_p = gr.Slider(
+        minimum=1,
+        maximum=3,
+        value=1,
+        interactive=True,
+        visible=True,
+        label="Top p",
     )
-    return temperature,
+    return temperature, top_p, max_tokens, model_name
 
 
 def sotopia_info_accordion(human_agent, machine_agent, scenario, accordion_visible=True):
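Worth flagging in the hunk above: top_p drives nucleus sampling, which keeps the smallest set of tokens whose cumulative probability reaches top_p, so meaningful values lie in (0, 1]. With the committed bounds (minimum=1, maximum=3, value=1), the slider can only express the no-op setting or out-of-range values, which sampling backends typically reject or silently ignore. A self-contained illustration of the mechanism (not code from this repo):

import numpy as np

def top_p_filter(probs: np.ndarray, top_p: float) -> np.ndarray:
    # Keep the smallest prefix of the probability-sorted vocabulary whose
    # mass reaches top_p, then renormalize the survivors.
    order = np.argsort(probs)[::-1]            # token ids, most likely first
    sorted_probs = probs[order]
    mass_before = np.cumsum(sorted_probs) - sorted_probs
    keep = np.zeros(probs.shape, dtype=bool)
    keep[order[mass_before < top_p]] = True
    filtered = np.where(keep, probs, 0.0)
    return filtered / filtered.sum()

probs = np.array([0.5, 0.3, 0.2])
print(top_p_filter(probs, 0.7))  # [0.625 0.375 0.   ] -- nucleus is {0.5, 0.3}
print(top_p_filter(probs, 1.0))  # unchanged; any top_p >= 1 keeps every token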
@@ -192,11 +201,20 @@ def chat_tab():
             text_output = tokenizer.decode(
                 output_tokens[0], skip_special_tokens=True
             )
-
+            # import pdb; pdb.set_trace()
+            output = ""
+            for _ in range(5):
+                try:
+                    output = format_bot_message(text_output)
+                    break
+                except Exception as e:
+                    print(e)
+                    print("Retrying...")
+            return output
 
         with gr.Column():
             with gr.Row():
-                temperature,
+                temperature, top_p, max_tokens, model = param_accordion()
                 user_name, bot_name, scenario = sotopia_info_accordion(human_agent, machine_agent, scenario)
 
         instructions = instructions_accordion(instructions)
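The new loop above retries format_bot_message up to five times, but text_output is never regenerated between attempts, so a deterministic parse failure repeats identically and the handler falls through to an empty reply. The same pattern, factored out for clarity (the helper name is mine, not the repo's):

from utils import format_bot_message

def parse_with_fallback(text_output: str, retries: int = 5) -> str:
    output = ""
    for _ in range(retries):
        try:
            output = format_bot_message(text_output)
            break                 # parsed successfully
        except Exception as e:
            print(e)              # same input, so this repeats every attempt
            print("Retrying...")
    return output

Retrying would only become meaningful if generation were re-run inside the loop, e.g. re-sampling output_tokens before each parse attempt.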
@@ -226,7 +244,7 @@ def chat_tab():
                 user_name,
                 bot_name,
                 temperature,
-
+                top_p,
                 max_tokens,
                 model,
             ],
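The list in this last hunk is the inputs argument of a Gradio event binding, so top_p now reaches the chat handler as a per-request parameter. A runnable sketch of that wiring pattern (the handler and component values below are illustrative, not the Space's actual code):

import gradio as gr

def respond(message, temperature, top_p, max_tokens):
    # Stand-in for the Space's chat handler; just echoes its inputs.
    return f"temperature={temperature}, top_p={top_p}, max_tokens={max_tokens}: {message}"

with gr.Blocks() as demo:
    msg = gr.Textbox(label="Message")
    temperature = gr.Slider(0.0, 2.0, value=0.7, label="Temperature")
    top_p = gr.Slider(0.0, 1.0, value=1.0, label="Top p")
    max_tokens = gr.Slider(16, 1024, value=256, step=16, label="Max Tokens")
    reply = gr.Textbox(label="Reply")
    msg.submit(respond, inputs=[msg, temperature, top_p, max_tokens], outputs=reply)

if __name__ == "__main__":
    demo.launch()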
utils.py
CHANGED
@@ -1,5 +1,6 @@
 from typing import List, Tuple
 import ast
+import re
 
 FORMAT_TEMPLATE = """ Your available action types are
 "none action speak non-verbal communication leave".
@@ -49,7 +50,12 @@ def truncate_dialogue_history_to_length(dia_his, surpass_num, tokenizer)
 
 
 def format_bot_message(bot_message) -> str:
-
+    # import pdb; pdb.set_trace()
+    start_idx, end_idx = bot_message.index("{"), bot_message.index("}")
+    if end_idx == -1:
+        bot_message += "'}"
+        end_idx = len(bot_message)
+    json_response = ast.literal_eval(bot_message[start_idx:end_idx+1])
     match json_response["action_type"]:
         case "none":
             return 'did nothing'
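Two notes on the parsing fix above. First, ast.literal_eval is a reasonable tool for the model's single-quoted, Python-style dict payloads, which json.loads would reject. Second, str.index raises ValueError when "}" is absent, so the committed end_idx == -1 repair branch can never execute; that -1 sentinel convention belongs to str.find. A defensive variant under those observations (extract_action is my name, not the repo's):

import ast

def extract_action(bot_message: str) -> dict:
    start_idx = bot_message.find("{")   # find returns -1 on a miss
    end_idx = bot_message.find("}")     # index would raise ValueError instead
    if start_idx == -1:
        raise ValueError("no dict-like payload in bot message")
    if end_idx == -1:
        # Same repair as the commit: close the dangling string and the dict.
        bot_message += "'}"
        end_idx = len(bot_message) - 1
    return ast.literal_eval(bot_message[start_idx:end_idx + 1])

print(extract_action("Agent said: {'action_type': 'speak', 'argument': 'hi"))
# {'action_type': 'speak', 'argument': 'hi'}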