|
|
|
import gradio as gr |
|
from utils.logging_util import logger |
|
from models.cpp_qwen2 import bot |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def generate_query(chatbot, history): |
|
if history and history[-1]["role"] == "user": |
|
gr.Warning('You should generate assistant-response.') |
|
yield None, chatbot, history |
|
else: |
|
chatbot.append(None) |
|
streamer = bot.generate_query(history, stream=True) |
|
for query in streamer: |
|
chatbot[-1] = (query, None) |
|
yield query, chatbot, history |
|
history.append({"role": "user", "content": query}) |
|
yield query, chatbot, history |
|
|
|
|
|
def generate_response(chatbot, history, user_input=None): |
|
""" |
|
auto-mode:query is None |
|
manual-mode:query 是用户输入 |
|
:param chatbot: |
|
:param history: |
|
:return: |
|
""" |
|
if user_input and history[-1]["role"] != "user": |
|
history.append({"role": "user", "content": user_input}) |
|
query = history[-1]["content"] |
|
|
|
if history[-1]["role"] != "user": |
|
gr.Warning('You should generate or type user-input first.') |
|
yield None, chatbot, history |
|
else: |
|
streamer = bot.generate_response(history, stream=True) |
|
for response in streamer: |
|
chatbot[-1] = (query, response) |
|
yield response, chatbot, history |
|
|
|
history.append({"role": "assistant", "content": response}) |
|
print(f"chatbot is {chatbot}") |
|
print(f"history is {history}") |
|
yield response, chatbot, history |
|
|
|
|
|
def generate(chatbot, history): |
|
logger.info(f"chatbot: {chatbot}; history: {history}") |
|
streamer = None |
|
if history[-1]["role"] == "assistant": |
|
streamer = generate_query(chatbot, history) |
|
elif history[-1]["role"] in ["user", "system"]: |
|
streamer = generate_response(chatbot, history) |
|
else: |
|
gr.Warning("bug") |
|
|
|
for out in streamer: |
|
yield out |
|
|
|
|
|
def regenerate(): |
|
""" |
|
删除上一轮,重新生成。 |
|
:return: |
|
""" |
|
pass |
|
|
|
|
|
def reset_user_input(): |
|
return gr.update(value='') |
|
|
|
|
|
def reset_state(system): |
|
return [], [{"role": "system", "content": system}] |
|
|
|
|
|
def set_max_tokens(max_tokens): |
|
bot.generation_kwargs["max_tokens"] = max_tokens |
|
|
|
|
|
def clear_history(): |
|
pass |
|
|
|
|
|
def undo_generate(): |
|
pass |
|
|
|
|
|
|