Spaces:

SimrusDenuvo
/

practic

Runtime error

App Files Files Community

SimrusDenuvo committed on May 14

Commit

42ccf19

verified ·

1 Parent(s): 11dd5a2

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -13

app.py CHANGED Viewed

@@ -1,35 +1,44 @@
-from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 import gradio as gr
-model_name = "cointegrated/rut5-small"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
 def generate_response(prompt):
-    instruction = f"Ответь кратко: {prompt.strip()}"
-    input_ids = tokenizer.encode(instruction, return_tensors="pt", max_length=512, truncation=True)
     output = model.generate(
         input_ids,
-        max_new_tokens=80,
         do_sample=True,
-        top_p=0.9,
-        temperature=0.7,
-        repetition_penalty=1.2,
         eos_token_id=tokenizer.eos_token_id
     )
     response = tokenizer.decode(output[0], skip_special_tokens=True)
-    return response.strip()
 iface = gr.Interface(
     fn=generate_response,
     inputs=gr.Textbox(label="Введите ваш вопрос"),
     outputs=gr.Textbox(label="Ответ модели"),
-    title="Интерфейс ChatGPT",
-    description="Пример взаимодействия с API OpenAI через Hugging Face Space"
 )
 iface.launch()

+from transformers import AutoTokenizer, AutoModelForCausalLM
+import torch
 import gradio as gr
+# Загрузка модели и токенизатора
+model_name = "sberbank-ai/rugpt3medium_based_on_gpt2"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name)
+# Функция генерации ответа
 def generate_response(prompt):
+    instruction = f"Ответь кратко и понятно на вопрос: {prompt.strip()}"
+    input_ids = tokenizer.encode(instruction, return_tensors="pt")
+    # Генерация ответа
     output = model.generate(
         input_ids,
+        max_length=150,
         do_sample=True,
+        top_k=50,
+        top_p=0.95,
+        temperature=0.8,
+        pad_token_id=tokenizer.eos_token_id,
         eos_token_id=tokenizer.eos_token_id
     )
+    # Декодирование и удаление излишней части промпта
     response = tokenizer.decode(output[0], skip_special_tokens=True)
+    # Возвращаем только ответ, без дублирования запроса
+    return response.replace(instruction, "").strip()
+# Интерфейс Gradio
 iface = gr.Interface(
     fn=generate_response,
     inputs=gr.Textbox(label="Введите ваш вопрос"),
     outputs=gr.Textbox(label="Ответ модели"),
+    title="Ответ от ruGPT-3 Medium",
+    description="Генерация ответа с помощью модели Sberbank ruGPT-3 Medium"
 )
+# Запуск интерфейса
 iface.launch()