Spaces:

AugustLight
/

LLight-3.2-3b-Instruct

Sleeping

App Files Community

AugustLight committed on Oct 26, 2024

Commit

f747916

•

1 Parent(s): 8cc000e

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -43

app.py CHANGED Viewed

@@ -43,55 +43,51 @@ def respond(message, history, system_message, max_new_tokens, temperature, top_p
             model = load_model()
             print("Модель загружена")
-        with gr.Progress() as progress:
-            progress(0, desc="Подготовка контекста...")
-            # Отладочная печать входных параметров
-            print(f"""
-            Входные параметры:
-            - message: {message}
-            - history length: {len(history)}
-            - system_message: {system_message}
-            - max_new_tokens: {max_new_tokens}
-            - temperature: {temperature}
-            - top_p: {top_p}
-            """)
-            # Ограничиваем историю последними 3 сообщениями
-            recent_history = history[-3:] if len(history) > 3 else history
-            context = f"{system_message}\n\n"
-            for user_msg, assistant_msg in recent_history:
-                context += f"User: {user_msg}\nAssistant: {assistant_msg}\n"
-            context += f"User: {message}\nAssistant: "
-            print(f"Генерируем ответ для контекста длиной {len(context)} символов")
-            try:
-                progress(0.3, desc="Генерация ответа...")
-                response = model(
-                    prompt=context,
-                    max_tokens=max_new_tokens,
-                    temperature=temperature,
-                    top_p=top_p,
-                    stop=["User:", "\n\n", "<|endoftext|>"],
-                    echo=False
-                )
-                progress(1, desc="Готово!")
-                generated_text = response['choices'][0]['text']
-                print(f"Ответ сгенерирован успешно, длина: {len(generated_text)}")
-                return generated_text.strip()
-            except Exception as inner_e:
-                print(f"Ошибка при генерации: {str(inner_e)}")
-                print(f"Тип ошибки: {type(inner_e).__name__}")
-                return f"Ошибка при генерации: {str(inner_e)}"
     except KeyboardInterrupt:
         return "Генерация прервана пользователем"
     except Exception as e:
         print(f"Основная ошибка: {str(e)}")
         print(f"Тип ошибки: {type(e).__name__}")
         return f"Произошла ошибка: {str(e)}\nТип ошибки: {type(e).__name__}"
 # Создаем интерфейс с оптимизированными параметрами

             model = load_model()
             print("Модель загружена")
+        # Отладочная печать входных параметров
+        print(f"""
+        Входные параметры:
+        - message: {message}
+        - history length: {len(history)}
+        - system_message: {system_message}
+        - max_new_tokens: {max_new_tokens}
+        - temperature: {temperature}
+        - top_p: {top_p}
+        """)
+        # Ограничиваем историю последними 3 сообщениями
+        recent_history = history[-3:] if len(history) > 3 else history
+        context = f"{system_message}\n\n"
+        for user_msg, assistant_msg in recent_history:
+            context += f"User: {user_msg}\nAssistant: {assistant_msg}\n"
+        context += f"User: {message}\nAssistant: "
+        print(f"Генерируем ответ для контекста длиной {len(context)} символов")
+        try:
+            response = model(
+                prompt=context,
+                max_tokens=max_new_tokens,
+                temperature=temperature,
+                top_p=top_p,
+                stop=["User:", "\n\n", "<|endoftext|>"],
+                echo=False
+            )
+            generated_text = response['choices'][0]['text']
+            print(f"Ответ сгенерирован успешно, длина: {len(generated_text)}")
+            return generated_text.strip()
+        except Exception as inner_e:
+            print(f"Ошибка при генерации: {str(inner_e)}")
+            print(f"Тип ошибки: {type(inner_e).__name__}")
+            return f"Ошибка при генерации: {str(inner_e)}"
     except KeyboardInterrupt:
         return "Генерация прервана пользователем"
     except Exception as e:
         print(f"Основная ошибка: {str(e)}")
         print(f"Тип ошибки: {type(e).__name__}")
+        traceback.print_exc()  # Добавим полный стек ошибки
         return f"Произошла ошибка: {str(e)}\nТип ошибки: {type(e).__name__}"
 # Создаем интерфейс с оптимизированными параметрами