Spaces:

SimpleBerry
/

LLaMA-O1-Supervised-1129-Demo

Running

Di Zhang committed on Dec 2, 2024

Commit

db4b49f

verified ·

1 Parent(s): be02eff

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -37,6 +37,15 @@ def llama_o1_template(data):
     text = template.format(content=data)
     return text
 @spaces.GPU
 def generate_text(message, history, max_tokens=512, temperature=0.9, top_p=0.95):
     input_text = llama_o1_template(message)
@@ -51,7 +60,7 @@ def generate_text(message, history, max_tokens=512, temperature=0.9, top_p=0.95)
         do_sample=True,
     )
-    response = tokenizer.decode(output[0], skip_special_tokens=True)
     yield response
 with gr.Blocks() as demo:

     text = template.format(content=data)
     return text
def format_response(response):
    """Replace structural marker strings in decoded model text with readable ones.

    The father-id / local-id / thought / rating delimiters are removed or
    swapped for short separators, and the rating markers become emoji.

    Args:
        response: Decoded text that may contain the marker strings.

    Returns:
        The text with every listed marker substituted. Text containing none
        of the markers is returned unchanged.
    """
    # Substitutions are applied one after another, in the listed order.
    replacements = (
        ('<start_of_father_id>', ''),
        ('<end_of_father_id><start_of_local_id>', '👉'),
        ('<end_of_local_id><start_of_thought>', ', '),
        ('<end_of_thought><start_of_rating>', ''),
        ('<end_of_rating>', ''),
        ('<positive_rating>', '👍'),
        ('<negative_rating>', '👎'),
    )
    for marker, shown in replacements:
        response = response.replace(marker, shown)
    # Without this return the function would hand None back to callers.
    return response
 @spaces.GPU
 def generate_text(message, history, max_tokens=512, temperature=0.9, top_p=0.95):
     input_text = llama_o1_template(message)
         do_sample=True,
     )
+    response = tokenizer.decode(output[0], skip_special_tokens=False)
     yield response
 with gr.Blocks() as demo: