Update app.py

app.py CHANGED
@@ -36,9 +36,9 @@ def load_model(model_key: str):
 model_cache = {}
 
 def respond(message: str,
-            history: List[List[str]],
+            history: List[Dict[str, str]],
             model_key: str,
-            system_prompt: str) -> Tuple[List[List[str]], str, Dict[str, Any]]:
+            system_prompt: str) -> Tuple[List[Dict[str, str]], str, Dict[str, Any]]:
     """Local chat via the pipeline."""
     try:
         if model_key not in model_cache:
@@ -47,16 +47,11 @@
 
         print(f"🚀 Generating: {model_key}, Msg='{message[:30]}...'")
 
-        #
+        # Chat format (system + history + user)
         messages = []
         if system_prompt.strip():
             messages.append({"role": "system", "content": system_prompt})
-
-        # Convert history from the [["user_msg", "bot_msg"], ...] format
-        for user_msg, bot_msg in history:
-            messages.append({"role": "user", "content": user_msg})
-            messages.append({"role": "assistant", "content": bot_msg})
-
+        messages.extend(history)
         messages.append({"role": "user", "content": message})
 
         # Apply chat template (for instruct models)
@@ -69,26 +64,31 @@
 
         print(f"✅ Reply: {bot_reply[:50]}...")
 
-        new_history = history + [[message, bot_reply]]
-
+        new_history = history + [
+            {"role": "user", "content": message},
+            {"role": "assistant", "content": bot_reply}
+        ]
         return new_history, "", gr.update(value="")
 
     except Exception as e:
         error_msg = f"❌ {model_key}: {str(e)}"
         print(f"💥 {error_msg}")
-        new_history = history + [[message, error_msg]]
+        new_history = history + [
+            {"role": "user", "content": message},
+            {"role": "assistant", "content": error_msg}
+        ]
         return new_history, error_msg, gr.update(value="")
 
 # UI
-with gr.Blocks(title="🚀 Local HF Chat (on a weak CPU!)") as demo:
+with gr.Blocks(title="🚀 Local HF Chat (on a weak CPU!)", theme=gr.themes.Soft()) as demo:
     gr.Markdown("# Local Inference (no API!)\n**Small models**: 1-3 s on CPU. Large ones take a very long time to think. No limits/tokens. Provided as an example.")
 
     with gr.Row():
         model_dropdown = gr.Dropdown(choices=list(MODELS.keys()), value="Qwen2.5-0.5B", label="🧠 Model")
         system_prompt = gr.Textbox(label="📝 System", placeholder="You are a cheerful AI.", lines=2)
 
-    #
-    chatbot = gr.Chatbot(height=500)
+    # Restored type="messages" for the correct history format
+    chatbot = gr.Chatbot(type="messages", height=500, label="Chat")
 
     with gr.Row():
         msg_input = gr.Textbox(placeholder="Hi! (Enter)", show_label=False, lines=1)
@@ -108,9 +108,9 @@ with gr.Blocks(title="🚀 Local HF Chat (on a weak CPU!)"
         return [], "", gr.update(value="")
     clear_btn.click(clear, outputs=[chatbot, status, msg_input])
 
-    def retry(history):
-        if len(history) >= 1:
-            return history[-1][0]
+    def retry(history: List[Dict[str, str]]):
+        if len(history) >= 2 and history[-2]["role"] == "user":
+            return history[-2]["content"]
         return ""
     retry_btn.click(retry, inputs=[chatbot], outputs=[msg_input])
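Note on the change: this commit migrates the chat history from Gradio's legacy pair format to the OpenAI-style messages format, which is why the per-pair conversion loop collapses into a single `messages.extend(history)`. A minimal sketch of the two formats, with illustrative values rather than repo code (`build_messages` is a hypothetical helper mirroring the updated `respond()`):

# Legacy "tuples" history: a list of [user_msg, bot_msg] pairs.
legacy_history = [["Hi!", "Hello! How can I help?"]]

# Messages history, as stored by gr.Chatbot(type="messages"):
# a flat list of {"role", "content"} dicts, already in chat-template shape.
messages_history = [
    {"role": "user", "content": "Hi!"},
    {"role": "assistant", "content": "Hello! How can I help?"},
]

def build_messages(history, system_prompt, message):
    # Same assembly order as the updated respond():
    # system prompt first, then prior turns, then the new user turn.
    messages = []
    if system_prompt.strip():
        messages.append({"role": "system", "content": system_prompt})
    messages.extend(history)  # no per-pair conversion loop needed anymore
    messages.append({"role": "user", "content": message})
    return messages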
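The reworked retry() depends on the same format: after a completed exchange the last two entries are the user turn followed by the assistant turn, so the previous prompt sits at index -2. A quick self-contained check with hypothetical values:

history = [
    {"role": "user", "content": "Tell me a joke"},
    {"role": "assistant", "content": "Why did the tokenizer split up? ..."},
]

def retry(history):
    # Guard against empty or malformed histories before re-sending the prompt.
    if len(history) >= 2 and history[-2]["role"] == "user":
        return history[-2]["content"]
    return ""

assert retry(history) == "Tell me a joke"
assert retry([]) == ""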