Tuchuanhuhuhu committed
Commit ab74909
Parent: 3b0ad60

Improve code quality

Files changed (3):
  1. ChuanhuChatbot.py +12 -12
  2. presets.py +9 -1
  3. utils.py +52 -35
ChuanhuChatbot.py CHANGED
@@ -42,13 +42,6 @@ else:
 gr.Chatbot.postprocess = postprocess
 
 with gr.Blocks(css=customCSS) as demo:
-    gr.HTML(title)
-    with gr.Row():
-        with gr.Column(scale=4):
-            keyTxt = gr.Textbox(show_label=False, placeholder=f"在这里输入你的OpenAI API-key...",value=my_api_key, type="password", visible=not HIDE_MY_KEY).style(container=True)
-        with gr.Column(scale=1):
-            use_streaming_checkbox = gr.Checkbox(label="实时传输回答", value=True, visible=enable_streaming_option)
-    chatbot = gr.Chatbot() # .style(color_map=("#1D51EE", "#585A5B"))
     history = gr.State([])
     token_count = gr.State([])
     promptTemplates = gr.State(load_template(get_template_names(plain=True)[0], mode=2))
@@ -56,6 +49,13 @@ with gr.Blocks(css=customCSS) as demo:
     FALSECONSTANT = gr.State(False)
     topic = gr.State("未命名对话历史记录")
 
+    gr.HTML(title)
+    with gr.Row():
+        with gr.Column(scale=4):
+            keyTxt = gr.Textbox(show_label=False, placeholder=f"在这里输入你的OpenAI API-key...",value=my_api_key, type="password", visible=not HIDE_MY_KEY).style(container=False)
+        with gr.Column(scale=1):
+            use_streaming_checkbox = gr.Checkbox(label="实时传输回答", value=True, visible=enable_streaming_option)
+    chatbot = gr.Chatbot() # .style(color_map=("#1D51EE", "#585A5B"))
     with gr.Row():
         with gr.Column(scale=12):
             user_input = gr.Textbox(show_label=False, placeholder="在这里输入").style(
@@ -68,8 +68,9 @@ with gr.Blocks(css=customCSS) as demo:
         delLastBtn = gr.Button("🗑️ 删除最近一条对话")
         reduceTokenBtn = gr.Button("♻️ 总结对话")
     status_display = gr.Markdown("status: ready")
-    systemPromptTxt = gr.Textbox(show_label=True, placeholder=f"在这里输入System Prompt...",
-                                 label="System prompt", value=initial_prompt).style(container=True)
+
+    systemPromptTxt = gr.Textbox(show_label=True, placeholder=f"在这里输入System Prompt...", label="System prompt", value=initial_prompt).style(container=True)
+
     with gr.Accordion(label="加载Prompt模板", open=False):
         with gr.Column():
             with gr.Row():
@@ -100,11 +101,10 @@
     #inputs, top_p, temperature, top_k, repetition_penalty
     with gr.Accordion("参数", open=False):
         top_p = gr.Slider(minimum=-0, maximum=1.0, value=1.0, step=0.05,
-                          interactive=True, label="Top-p (nucleus sampling)",)
+                          interactive=True, label="Top-p (nucleus sampling)",)
         temperature = gr.Slider(minimum=-0, maximum=5.0, value=1.0,
                                 step=0.1, interactive=True, label="Temperature",)
-        #top_k = gr.Slider( minimum=1, maximum=50, value=4, step=1, interactive=True, label="Top-k",)
-        #repetition_penalty = gr.Slider( minimum=0.1, maximum=3.0, value=1.03, step=0.01, interactive=True, label="Repetition Penalty", )
+
     gr.Markdown(description)
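Note on the ChuanhuChatbot.py change: the commit moves the gr.State holders ahead of every visible widget inside the gr.Blocks context, drops the commented-out top_k / repetition_penalty sliders, and switches the API-key textbox from .style(container=True) to .style(container=False). A minimal sketch of the state-first layout pattern, with hypothetical component names (Gradio 3.x API, which this app targets):

import gradio as gr

with gr.Blocks() as demo:
    # Session state first, so every later event handler can bind to it.
    history = gr.State([])        # chat messages for this session
    token_count = gr.State([])    # per-turn token counts

    # Visible layout second.
    with gr.Row():
        with gr.Column(scale=4):
            key_box = gr.Textbox(show_label=False, type="password",
                                 placeholder="OpenAI API key...")
        with gr.Column(scale=1):
            streaming_box = gr.Checkbox(label="Stream responses", value=True)
    chatbot = gr.Chatbot()

if __name__ == "__main__":
    demo.launch()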
 
presets.py CHANGED
@@ -31,9 +31,17 @@ pre code {
 }
 """
 
+summarize_prompt = "请总结以上对话,不超过100字。" # 总结对话时的 prompt
+
+# 错误信息
 standard_error_msg = "☹️发生了错误:" # 错误信息的标准前缀
 error_retrieve_prompt = "请检查网络连接,或者API-Key是否有效。" # 获取对话时发生错误
-summarize_prompt = "请总结以上对话,不超过100字。" # 总结对话时的 prompt
+connection_timeout_prompt = "连接超时,无法获取对话。" # 连接超时
+read_timeout_prompt = "读取超时,无法获取对话。" # 读取超时
+proxy_error_prompt = "代理错误,无法获取对话。" # 代理错误
+ssl_error_prompt = "SSL错误,无法获取对话。" # SSL 错误
+no_apikey_msg = "API key长度不是51位,请检查是否输入正确。" # API key 长度不足 51 位
+
 max_token_streaming = 3500 # 流式对话时的最大 token 数
 timeout_streaming = 15 # 流式对话时的超时时间
 max_token_all = 3500 # 非流式对话时的最大 token 数
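Note on the presets.py change: each failure mode now gets one reusable message fragment, and utils.py assembles a status line as standard prefix + specific cause + generic hint. A sketch of that composition (string values translated here for readability; the real constants are in Chinese):

# What stream_predict now shows when requests raises ConnectTimeout.
standard_error_msg = "☹️ An error occurred: "                   # standard prefix
connection_timeout_prompt = "Connection timed out; could not fetch a reply. "
error_retrieve_prompt = "Check your network connection and your API key."

status_text = standard_error_msg + connection_timeout_prompt + error_retrieve_prompt
print(status_text)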
utils.py CHANGED
@@ -124,37 +124,37 @@ def get_response(openai_api_key, system_prompt, history, temperature, top_p, stream):
     response = requests.post(API_URL, headers=headers, json=payload, stream=True, timeout=timeout)
     return response
 
-def stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, previous_token_count, top_p, temperature):
+def stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, all_token_counts, top_p, temperature):
     def get_return_value():
-        return chatbot, history, status_text, [*previous_token_count, token_counter]
+        return chatbot, history, status_text, all_token_counts
 
     print("实时回答模式")
-    token_counter = 0
     partial_words = ""
     counter = 0
     status_text = "开始实时传输回答……"
     history.append(construct_user(inputs))
+    history.append(construct_assistant(""))
+    chatbot.append((parse_text(inputs), ""))
     user_token_count = 0
-    if len(previous_token_count) == 0:
+    if len(all_token_counts) == 0:
         system_prompt_token_count = count_token(system_prompt)
         user_token_count = count_token(inputs) + system_prompt_token_count
     else:
         user_token_count = count_token(inputs)
+    all_token_counts.append(user_token_count)
     print(f"输入token计数: {user_token_count}")
+    yield get_return_value()
     try:
         response = get_response(openai_api_key, system_prompt, history, temperature, top_p, True)
     except requests.exceptions.ConnectTimeout:
-        history.pop()
-        status_text = standard_error_msg + "连接超时,无法获取对话。" + error_retrieve_prompt
+        status_text = standard_error_msg + connection_timeout_prompt + error_retrieve_prompt
         yield get_return_value()
         return
     except requests.exceptions.ReadTimeout:
-        history.pop()
-        status_text = standard_error_msg + "读取超时,无法获取对话。" + error_retrieve_prompt
+        status_text = standard_error_msg + read_timeout_prompt + error_retrieve_prompt
         yield get_return_value()
         return
 
-    chatbot.append((parse_text(inputs), ""))
     yield get_return_value()
 
     for chunk in tqdm(response.iter_lines()):
@@ -169,13 +169,14 @@ def stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, previous_token_count, top_p, temperature):
                 try:
                     chunk = json.loads(chunk[6:])
                 except json.JSONDecodeError:
+                    print(chunk)
                     status_text = f"JSON解析错误。请重置对话。收到的内容: {chunk}"
                     yield get_return_value()
-                    break
+                    continue
                 # decode each line as response data is in bytes
                 if chunklength > 6 and "delta" in chunk['choices'][0]:
                     finish_reason = chunk['choices'][0]['finish_reason']
-                    status_text = construct_token_message(sum(previous_token_count)+token_counter+user_token_count, stream=True)
+                    status_text = construct_token_message(sum(all_token_counts), stream=True)
                     if finish_reason == "stop":
                         print("生成完毕")
                         yield get_return_value()
@@ -183,60 +184,76 @@ def stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, previous_token_count, top_p, temperature):
                     try:
                         partial_words = partial_words + chunk['choices'][0]["delta"]["content"]
                     except KeyError:
-                        status_text = standard_error_msg + "API回复中找不到内容。很可能是Token计数达到上限了。请重置对话。当前Token计数: " + str(sum(previous_token_count)+token_counter+user_token_count)
+                        status_text = standard_error_msg + "API回复中找不到内容。很可能是Token计数达到上限了。请重置对话。当前Token计数: " + str(sum(all_token_counts))
                         yield get_return_value()
                         break
-                    if token_counter == 0:
-                        history.append(construct_assistant(" " + partial_words))
-                    else:
-                        history[-1] = construct_assistant(partial_words)
+                    history[-1] = construct_assistant(partial_words)
                     chatbot[-1] = (parse_text(inputs), parse_text(partial_words))
-                    token_counter += 1
+                    all_token_counts[-1] += 1
                     yield get_return_value()
 
 
-def predict_all(openai_api_key, system_prompt, history, inputs, chatbot, previous_token_count, top_p, temperature):
+def predict_all(openai_api_key, system_prompt, history, inputs, chatbot, all_token_counts, top_p, temperature):
     print("一次性回答模式")
     history.append(construct_user(inputs))
+    history.append(construct_assistant(""))
+    chatbot.append((parse_text(inputs), ""))
+    all_token_counts.append(count_token(inputs))
     try:
         response = get_response(openai_api_key, system_prompt, history, temperature, top_p, False)
     except requests.exceptions.ConnectTimeout:
         status_text = standard_error_msg + error_retrieve_prompt
-        return chatbot, history, status_text, previous_token_count
+        return chatbot, history, status_text, all_token_counts
+    except requests.exceptions.ProxyError:
+        status_text = standard_error_msg + proxy_error_prompt + error_retrieve_prompt
+    except requests.exceptions.SSLError:
+        status_text = standard_error_msg + ssl_error_prompt + error_retrieve_prompt
+        return chatbot, history, status_text, all_token_counts
     response = json.loads(response.text)
     content = response["choices"][0]["message"]["content"]
-    history.append(construct_assistant(content))
+    history[-1] = construct_assistant(content)
     chatbot.append((parse_text(inputs), parse_text(content)))
     total_token_count = response["usage"]["total_tokens"]
-    previous_token_count.append(total_token_count - sum(previous_token_count))
+    all_token_counts[-1] = total_token_count - sum(all_token_counts)
     status_text = construct_token_message(total_token_count)
     print("生成一次性回答完毕")
-    return chatbot, history, status_text, previous_token_count
+    return chatbot, history, status_text, all_token_counts
 
 
-def predict(openai_api_key, system_prompt, history, inputs, chatbot, token_count, top_p, temperature, stream=False, should_check_token_count = True): # repetition_penalty, top_k
+def predict(openai_api_key, system_prompt, history, inputs, chatbot, all_token_counts, top_p, temperature, stream=False, should_check_token_count = True): # repetition_penalty, top_k
     print("输入为:" +colorama.Fore.BLUE + f"{inputs}" + colorama.Style.RESET_ALL)
+    if len(openai_api_key) != 51:
+        status_text = standard_error_msg + no_apikey_msg
+        print(status_text)
+        history.append(construct_user(inputs))
+        history.append("")
+        chatbot.append((parse_text(inputs), ""))
+        all_token_counts.append(0)
+        yield chatbot, history, status_text, all_token_counts
+        return
+    yield chatbot, history, "开始生成回答……", all_token_counts
     if stream:
         print("使用流式传输")
-        iter = stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, token_count, top_p, temperature)
-        for chatbot, history, status_text, token_count in iter:
-            yield chatbot, history, status_text, token_count
+        iter = stream_predict(openai_api_key, system_prompt, history, inputs, chatbot, all_token_counts, top_p, temperature)
+        for chatbot, history, status_text, all_token_counts in iter:
+            yield chatbot, history, status_text, all_token_counts
     else:
         print("不使用流式传输")
-        chatbot, history, status_text, token_count = predict_all(openai_api_key, system_prompt, history, inputs, chatbot, token_count, top_p, temperature)
-        yield chatbot, history, status_text, token_count
-    print(f"传输完毕。当前token计数为{token_count}")
-    print("回答为:" +colorama.Fore.BLUE + f"{history[-1]['content']}" + colorama.Style.RESET_ALL)
+        chatbot, history, status_text, all_token_counts = predict_all(openai_api_key, system_prompt, history, inputs, chatbot, all_token_counts, top_p, temperature)
+        yield chatbot, history, status_text, all_token_counts
+    print(f"传输完毕。当前token计数为{all_token_counts}")
+    if len(history) > 1 and history[-1]['content'] != inputs:
+        print("回答为:" +colorama.Fore.BLUE + f"{history[-1]['content']}" + colorama.Style.RESET_ALL)
     if stream:
         max_token = max_token_streaming
     else:
         max_token = max_token_all
-    if sum(token_count) > max_token and should_check_token_count:
-        print(f"精简token中{token_count}/{max_token}")
-        iter = reduce_token_size(openai_api_key, system_prompt, history, chatbot, token_count, top_p, temperature, stream=False, hidden=True)
-        for chatbot, history, status_text, token_count in iter:
+    if sum(all_token_counts) > max_token and should_check_token_count:
+        print(f"精简token中{all_token_counts}/{max_token}")
+        iter = reduce_token_size(openai_api_key, system_prompt, history, chatbot, all_token_counts, top_p, temperature, stream=False, hidden=True)
+        for chatbot, history, status_text, all_token_counts in iter:
             status_text = f"Token 达到上限,已自动降低Token计数至 {status_text}"
-            yield chatbot, history, status_text, token_count
+            yield chatbot, history, status_text, all_token_counts
 
 
 def retry(openai_api_key, system_prompt, history, chatbot, token_count, top_p, temperature, stream=False):
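Note on the stream_predict hunks: the chat completions endpoint streams server-sent events, one "data: "-prefixed line per delta, which is why the code slices chunk[6:] and only trusts parsed chunks when chunklength > 6. A standalone sketch of that parsing (API_URL, headers, and payload below are illustrative placeholders, not the project's exact values):

import json
import requests

API_URL = "https://api.openai.com/v1/chat/completions"
headers = {"Authorization": "Bearer sk-..."}          # placeholder key
payload = {"model": "gpt-3.5-turbo", "stream": True,
           "messages": [{"role": "user", "content": "Hello"}]}

response = requests.post(API_URL, headers=headers, json=payload,
                         stream=True, timeout=15)
for raw in response.iter_lines():        # one SSE line per streamed delta
    if not raw:
        continue                         # skip keep-alive blank lines
    if raw == b"data: [DONE]":           # sentinel that closes the stream
        break
    event = json.loads(raw[6:])          # strip the 6-byte "data: " prefix
    delta = event["choices"][0].get("delta", {})
    print(delta.get("content", ""), end="", flush=True)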
 
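Note on the token bookkeeping: replacing previous_token_count plus a separate token_counter with a single all_token_counts list gives one entry per conversation turn, so sum(all_token_counts) is always the running total that construct_token_message displays. A sketch of that invariant with hypothetical numbers (count_token and the API's usage field supply the real values):

all_token_counts = []

# Streaming turn: record the prompt's token count up front, then bump the
# last entry once per received delta as a rough completion estimate.
all_token_counts.append(42)              # count_token(inputs) for this turn
for _ in range(10):                      # ten streamed chunks arrive
    all_token_counts[-1] += 1            # as stream_predict does per chunk

# Non-streaming turn: the API reports usage.total_tokens for the whole
# conversation, so this turn's share is the total minus what is recorded.
total_token_count = 180                  # response["usage"]["total_tokens"]
all_token_counts.append(total_token_count - sum(all_token_counts))

assert sum(all_token_counts) == total_token_count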