Spaces:

JohnSmith9982
/

ChuanhuChatGPT_Beta

Runtime error

App Files Files Community

JohnSmith9982 committed on Apr 13, 2023

Commit

7b5a1c0

•

1 Parent(s): cecb277

Upload 38 files

Browse files

Files changed (29) hide show

CITATION.cff +20 -0
ChuanhuChatbot.py +159 -128
Dockerfile +2 -1
README.md +105 -13
assets/custom.css +125 -31
assets/custom.js +208 -54
config_example.json +31 -0
configs/ds_config_chatbot.json +17 -0
modules/__init__.py +0 -0
modules/__pycache__/__init__.cpython-311.pyc +0 -0
modules/__pycache__/__init__.cpython-39.pyc +0 -0
modules/__pycache__/base_model.cpython-311.pyc +0 -0
modules/__pycache__/base_model.cpython-39.pyc +0 -0
modules/__pycache__/config.cpython-311.pyc +0 -0
modules/__pycache__/config.cpython-39.pyc +0 -0
modules/__pycache__/llama_func.cpython-311.pyc +0 -0
modules/__pycache__/models.cpython-311.pyc +0 -0
modules/base_model.py +547 -0
modules/config.py +55 -34
modules/llama_func.py +75 -46
modules/models.py +586 -0
modules/overwrites.py +55 -17
modules/presets.py +82 -49
modules/shared.py +3 -3
modules/utils.py +115 -118
requirements.txt +1 -0
requirements_advanced.txt +7 -0
run_Linux.sh +8 -2
run_macOS.command +8 -2

CITATION.cff ADDED Viewed

	@@ -0,0 +1,20 @@

+cff-version: 1.2.0
+title: ChuanhuChatGPT
+message: >-
+  If you use this software, please cite it using these
+  metadata.
+type: software
+authors:
+  - given-names: Chuanhu
+    orcid: https://orcid.org/0000-0001-8954-8598
+  - given-names: MZhao
+    orcid: https://orcid.org/0000-0003-2298-6213
+  - given-names: Keldos
+    orcid: https://orcid.org/0009-0005-0357-272X
+repository-code: 'https://github.com/GaiZhenbiao/ChuanhuChatGPT'
+url: 'https://github.com/GaiZhenbiao/ChuanhuChatGPT'
+abstract: Provides a light and easy-to-use interface for the ChatGPT API
+license: GPL-3.0
+commit: bd0034c37e5af6a90bd9c2f7dd073f6cd27c61af
+version: '20230405'
+date-released: '2023-04-05'

ChuanhuChatbot.py CHANGED Viewed

@@ -10,31 +10,32 @@ from modules.config import *
 from modules.utils import *
 from modules.presets import *
 from modules.overwrites import *
-from modules.chat_func import *
-from modules.openai_func import get_usage
 gr.Chatbot.postprocess = postprocess
 PromptHelper.compact_text_chunks = compact_text_chunks
 with open("assets/custom.css", "r", encoding="utf-8") as f:
     customCSS = f.read()
 with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
     user_name = gr.State("")
-    history = gr.State([])
-    token_count = gr.State([])
     promptTemplates = gr.State(load_template(get_template_names(plain=True)[0], mode=2))
-    user_api_key = gr.State(my_api_key)
     user_question = gr.State("")
-    outputing = gr.State(False)
     topic = gr.State("未命名对话历史记录")
     with gr.Row():
-        with gr.Column():
-            gr.HTML(title)
-            user_info = gr.Markdown(value="", elem_id="user_info")
-        gr.HTML('<center><a href="https://huggingface.co/spaces/JohnSmith9982/ChuanhuChatGPT?duplicate=true"><img src="https://bit.ly/3gLdBN6" alt="Duplicate Space"></a></center>')
         status_display = gr.Markdown(get_geoip(), elem_id="status_display")
         # https://github.com/gradio-app/gradio/pull/3296
         def create_greeting(request: gr.Request):
@@ -50,14 +51,14 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
             with gr.Row():
                 chatbot = gr.Chatbot(elem_id="chuanhu_chatbot").style(height="100%")
             with gr.Row():
-                with gr.Column(scale=12):
                     user_input = gr.Textbox(
                         elem_id="user_input_tb",
                         show_label=False, placeholder="在这里输入"
                     ).style(container=False)
-                with gr.Column(min_width=70, scale=1):
-                    submitBtn = gr.Button("发送", variant="primary")
-                    cancelBtn = gr.Button("取消", variant="secondary", visible=False)
             with gr.Row():
                 emptyBtn = gr.Button(
                     "🧹 新的对话",
@@ -65,37 +66,41 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
                 retryBtn = gr.Button("🔄 重新生成")
                 delFirstBtn = gr.Button("🗑️ 删除最旧对话")
                 delLastBtn = gr.Button("🗑️ 删除最新对话")
-                reduceTokenBtn = gr.Button("♻️ 总结对话")
         with gr.Column():
             with gr.Column(min_width=50, scale=1):
-                with gr.Tab(label="ChatGPT"):
                     keyTxt = gr.Textbox(
                         show_label=True,
                         placeholder=f"OpenAI API-key...",
-                        value=hide_middle_chars(my_api_key),
                         type="password",
                         visible=not HIDE_MY_KEY,
                         label="API-Key",
                     )
                     if multi_api_key:
-                        usageTxt = gr.Markdown("多账号模式已开启，无需输入key，可直接开始对话", elem_id="usage_display")
                     else:
-                        usageTxt = gr.Markdown("**发送消息** 或 **提交key** 以显示额度", elem_id="usage_display")
                     model_select_dropdown = gr.Dropdown(
-                        label="选择模型", choices=MODELS, multiselect=False, value=MODELS[0]
                     )
-                    use_streaming_checkbox = gr.Checkbox(
-                        label="实时传输回答", value=True, visible=enable_streaming_option
                     )
-                    use_websearch_checkbox = gr.Checkbox(label="使用在线搜索", value=False)
                     language_select_dropdown = gr.Dropdown(
                         label="选择回复语言（针对搜索&索引功能）",
                         choices=REPLY_LANGUAGES,
                         multiselect=False,
                         value=REPLY_LANGUAGES[0],
                     )
-                    index_files = gr.Files(label="上传索引文件", type="file", multiple=True)
                     two_column = gr.Checkbox(label="双栏pdf", value=advance_docs["pdf"].get("two_column", False))
                     # TODO: 公式ocr
                     # formula_ocr = gr.Checkbox(label="识别公式", value=advance_docs["pdf"].get("formula_ocr", False))
@@ -105,7 +110,7 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
                         show_label=True,
                         placeholder=f"在这里输入System Prompt...",
                         label="System prompt",
-                        value=initial_prompt,
                         lines=10,
                     ).style(container=False)
                     with gr.Accordion(label="加载Prompt模板", open=True):
@@ -161,27 +166,87 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
                 with gr.Tab(label="高级"):
                     gr.Markdown("# ⚠️ 务必谨慎更改 ⚠️\n\n如果无法使用请恢复默认设置")
-                    default_btn = gr.Button("🔙 恢复默认设置")
                     with gr.Accordion("参数", open=False):
-                        top_p = gr.Slider(
                             minimum=-0,
                             maximum=1.0,
                             value=1.0,
                             step=0.05,
                             interactive=True,
-                            label="Top-p",
                         )
-                        temperature = gr.Slider(
-                            minimum=-0,
                             maximum=2.0,
-                            value=1.0,
-                            step=0.1,
                             interactive=True,
-                            label="Temperature",
                         )
-                    with gr.Accordion("网络设置", open=False, visible=False):
                         # 优先展示自定义的api_host
                         apihostTxt = gr.Textbox(
                             show_label=True,
@@ -199,27 +264,22 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
                             lines=2,
                         )
                         changeProxyBtn = gr.Button("🔄 设置代理地址")
-    gr.Markdown(description)
-    gr.HTML(footer.format(versions=versions_html()), elem_id="footer")
     chatgpt_predict_args = dict(
         fn=predict,
         inputs=[
-            user_api_key,
-            systemPromptTxt,
-            history,
             user_question,
             chatbot,
-            token_count,
-            top_p,
-            temperature,
             use_streaming_checkbox,
-            model_select_dropdown,
             use_websearch_checkbox,
             index_files,
             language_select_dropdown,
         ],
-        outputs=[chatbot, history, status_display, token_count],
         show_progress=True,
     )
@@ -243,12 +303,18 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
     )
     get_usage_args = dict(
-        fn=get_usage, inputs=[user_api_key], outputs=[usageTxt], show_progress=False
     )
     # Chatbot
-    cancelBtn.click(cancel_outputing, [], [])
     user_input.submit(**transfer_input_args).then(**chatgpt_predict_args).then(**end_outputing_args)
     user_input.submit(**get_usage_args)
@@ -256,9 +322,12 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
     submitBtn.click(**transfer_input_args).then(**chatgpt_predict_args).then(**end_outputing_args)
     submitBtn.click(**get_usage_args)
     emptyBtn.click(
-        reset_state,
-        outputs=[chatbot, history, token_count, status_display],
         show_progress=True,
     )
     emptyBtn.click(**reset_textbox_args)
@@ -266,61 +335,42 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
     retryBtn.click(**start_outputing_args).then(
         retry,
         [
-            user_api_key,
-            systemPromptTxt,
-            history,
             chatbot,
-            token_count,
-            top_p,
-            temperature,
             use_streaming_checkbox,
-            model_select_dropdown,
             language_select_dropdown,
         ],
-        [chatbot, history, status_display, token_count],
         show_progress=True,
     ).then(**end_outputing_args)
     retryBtn.click(**get_usage_args)
     delFirstBtn.click(
         delete_first_conversation,
-        [history, token_count],
-        [history, token_count, status_display],
     )
     delLastBtn.click(
         delete_last_conversation,
-        [chatbot, history, token_count],
-        [chatbot, history, token_count, status_display],
-        show_progress=True,
     )
-    reduceTokenBtn.click(
-        reduce_token_size,
-        [
-            user_api_key,
-            systemPromptTxt,
-            history,
-            chatbot,
-            token_count,
-            top_p,
-            temperature,
-            gr.State(sum(token_count.value[-4:])),
-            model_select_dropdown,
-            language_select_dropdown,
-        ],
-        [chatbot, history, status_display, token_count],
-        show_progress=True,
-    )
-    reduceTokenBtn.click(**get_usage_args)
     two_column.change(update_doc_config, [two_column], None)
-    # ChatGPT
-    keyTxt.change(submit_key, keyTxt, [user_api_key, status_display]).then(**get_usage_args)
     keyTxt.submit(**get_usage_args)
     # Template
     templateRefreshBtn.click(get_template_names, None, [templateFileSelectDropdown])
     templateFileSelectDropdown.change(
         load_template,
@@ -338,31 +388,33 @@ with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
     # S&L
     saveHistoryBtn.click(
         save_chat_history,
-        [saveFileName, systemPromptTxt, history, chatbot, user_name],
         downloadFile,
         show_progress=True,
     )
     saveHistoryBtn.click(get_history_names, [gr.State(False), user_name], [historyFileSelectDropdown])
     exportMarkdownBtn.click(
         export_markdown,
-        [saveFileName, systemPromptTxt, history, chatbot, user_name],
         downloadFile,
         show_progress=True,
     )
     historyRefreshBtn.click(get_history_names, [gr.State(False), user_name], [historyFileSelectDropdown])
-    historyFileSelectDropdown.change(
-        load_chat_history,
-        [historyFileSelectDropdown, systemPromptTxt, history, chatbot, user_name],
-        [saveFileName, systemPromptTxt, history, chatbot],
-        show_progress=True,
-    )
-    downloadFile.change(
-        load_chat_history,
-        [downloadFile, systemPromptTxt, history, chatbot, user_name],
-        [saveFileName, systemPromptTxt, history, chatbot],
-    )
     # Advanced
     default_btn.click(
         reset_default, [], [apihostTxt, proxyTxt, status_display], show_progress=True
     )
@@ -389,35 +441,14 @@ demo.title = "川虎ChatGPT 🚀"
 if __name__ == "__main__":
     reload_javascript()
-    # if running in Docker
-    if dockerflag:
-        if authflag:
-            demo.queue(concurrency_count=CONCURRENT_COUNT).launch(
-                server_name="0.0.0.0",
-                server_port=7860,
-                auth=auth_list,
-                favicon_path="./assets/favicon.ico",
-            )
-        else:
-            demo.queue(concurrency_count=CONCURRENT_COUNT).launch(
-                server_name="0.0.0.0",
-                server_port=7860,
-                share=False,
-                favicon_path="./assets/favicon.ico",
-            )
-    # if not running in Docker
-    else:
-        if authflag:
-            demo.queue(concurrency_count=CONCURRENT_COUNT).launch(
-                share=False,
-                auth=auth_list,
-                favicon_path="./assets/favicon.ico",
-                inbrowser=True,
-            )
-        else:
-            demo.queue(concurrency_count=CONCURRENT_COUNT).launch(
-                share=False, favicon_path="./assets/favicon.ico", inbrowser=True
-            )  # 改为 share=True 可以创建公开分享链接
-        # demo.queue(concurrency_count=CONCURRENT_COUNT).launch(server_name="0.0.0.0", server_port=7860, share=False) # 可自定义端口
-        # demo.queue(concurrency_count=CONCURRENT_COUNT).launch(server_name="0.0.0.0", server_port=7860,auth=("在这里填写用户名", "在这里填写密码")) # 可设置用户名与密码
-        # demo.queue(concurrency_count=CONCURRENT_COUNT).launch(auth=("在这里填写用户名", "在这里填写密码")) # 适合Nginx反向代理

 from modules.utils import *
 from modules.presets import *
 from modules.overwrites import *
+from modules.models import get_model
+gr.Chatbot._postprocess_chat_messages = postprocess_chat_messages
 gr.Chatbot.postprocess = postprocess
 PromptHelper.compact_text_chunks = compact_text_chunks
 with open("assets/custom.css", "r", encoding="utf-8") as f:
     customCSS = f.read()
+def create_new_model():
+    return get_model(model_name = MODELS[DEFAULT_MODEL], access_key = my_api_key)[0]
 with gr.Blocks(css=customCSS, theme=small_and_beautiful_theme) as demo:
     user_name = gr.State("")
     promptTemplates = gr.State(load_template(get_template_names(plain=True)[0], mode=2))
     user_question = gr.State("")
+    user_api_key = gr.State(my_api_key)
+    current_model = gr.State(create_new_model)
     topic = gr.State("未命名对话历史记录")
     with gr.Row():
+        gr.HTML(CHUANHU_TITLE, elem_id="app_title")
         status_display = gr.Markdown(get_geoip(), elem_id="status_display")
+    with gr.Row(elem_id="float_display"):
+        user_info = gr.Markdown(value="getting user info...", elem_id="user_info")
         # https://github.com/gradio-app/gradio/pull/3296
         def create_greeting(request: gr.Request):
             with gr.Row():
                 chatbot = gr.Chatbot(elem_id="chuanhu_chatbot").style(height="100%")
             with gr.Row():
+                with gr.Column(min_width=225, scale=12):
                     user_input = gr.Textbox(
                         elem_id="user_input_tb",
                         show_label=False, placeholder="在这里输入"
                     ).style(container=False)
+                with gr.Column(min_width=42, scale=1):
+                    submitBtn = gr.Button(value="", variant="primary", elem_id="submit_btn")
+                    cancelBtn = gr.Button(value="", variant="secondary", visible=False, elem_id="cancel_btn")
             with gr.Row():
                 emptyBtn = gr.Button(
                     "🧹 新的对话",
                 retryBtn = gr.Button("🔄 重新生成")
                 delFirstBtn = gr.Button("🗑️ 删除最旧对话")
                 delLastBtn = gr.Button("🗑️ 删除最新对话")
         with gr.Column():
             with gr.Column(min_width=50, scale=1):
+                with gr.Tab(label="模型"):
                     keyTxt = gr.Textbox(
                         show_label=True,
                         placeholder=f"OpenAI API-key...",
+                        value=hide_middle_chars(user_api_key.value),
                         type="password",
                         visible=not HIDE_MY_KEY,
                         label="API-Key",
                     )
                     if multi_api_key:
+                        usageTxt = gr.Markdown("多账号模式已开启，无需输入key，可直接开始对话", elem_id="usage_display", elem_classes="insert_block")
                     else:
+                        usageTxt = gr.Markdown("**发送消息** 或 **提交key** 以显示额度", elem_id="usage_display", elem_classes="insert_block")
                     model_select_dropdown = gr.Dropdown(
+                        label="选择模型", choices=MODELS, multiselect=False, value=MODELS[DEFAULT_MODEL], interactive=True
                     )
+                    lora_select_dropdown = gr.Dropdown(
+                        label="选择LoRA模型", choices=[], multiselect=False, interactive=True, visible=False
                     )
+                    with gr.Row():
+                        use_streaming_checkbox = gr.Checkbox(
+                            label="实时传输回答", value=True, visible=ENABLE_STREAMING_OPTION
+                        )
+                        single_turn_checkbox = gr.Checkbox(label="单轮对话", value=False)
+                        use_websearch_checkbox = gr.Checkbox(label="使用在线搜索", value=False)
                     language_select_dropdown = gr.Dropdown(
                         label="选择回复语言（针对搜索&索引功能）",
                         choices=REPLY_LANGUAGES,
                         multiselect=False,
                         value=REPLY_LANGUAGES[0],
                     )
+                    index_files = gr.Files(label="上传索引文件", type="file")
                     two_column = gr.Checkbox(label="双栏pdf", value=advance_docs["pdf"].get("two_column", False))
                     # TODO: 公式ocr
                     # formula_ocr = gr.Checkbox(label="识别公式", value=advance_docs["pdf"].get("formula_ocr", False))
                         show_label=True,
                         placeholder=f"在这里输入System Prompt...",
                         label="System prompt",
+                        value=INITIAL_SYSTEM_PROMPT,
                         lines=10,
                     ).style(container=False)
                     with gr.Accordion(label="加载Prompt模板", open=True):
                 with gr.Tab(label="高级"):
                     gr.Markdown("# ⚠️ 务必谨慎更改 ⚠️\n\n如果无法使用请恢复默认设置")
+                    gr.HTML(APPEARANCE_SWITCHER, elem_classes="insert_block")
                     with gr.Accordion("参数", open=False):
+                        temperature_slider = gr.Slider(
+                            minimum=-0,
+                            maximum=2.0,
+                            value=1.0,
+                            step=0.1,
+                            interactive=True,
+                            label="temperature",
+                        )
+                        top_p_slider = gr.Slider(
                             minimum=-0,
                             maximum=1.0,
                             value=1.0,
                             step=0.05,
                             interactive=True,
+                            label="top-p",
                         )
+                        n_choices_slider = gr.Slider(
+                            minimum=1,
+                            maximum=10,
+                            value=1,
+                            step=1,
+                            interactive=True,
+                            label="n choices",
+                        )
+                        stop_sequence_txt = gr.Textbox(
+                            show_label=True,
+                            placeholder=f"在这里输入停止符，用英文逗号隔开...",
+                            label="stop",
+                            value="",
+                            lines=1,
+                        )
+                        max_context_length_slider = gr.Slider(
+                            minimum=1,
+                            maximum=32768,
+                            value=2000,
+                            step=1,
+                            interactive=True,
+                            label="max context",
+                        )
+                        max_generation_slider = gr.Slider(
+                            minimum=1,
+                            maximum=32768,
+                            value=1000,
+                            step=1,
+                            interactive=True,
+                            label="max generations",
+                        )
+                        presence_penalty_slider = gr.Slider(
+                            minimum=-2.0,
                             maximum=2.0,
+                            value=0.0,
+                            step=0.01,
                             interactive=True,
+                            label="presence penalty",
+                        )
+                        frequency_penalty_slider = gr.Slider(
+                            minimum=-2.0,
+                            maximum=2.0,
+                            value=0.0,
+                            step=0.01,
+                            interactive=True,
+                            label="frequency penalty",
+                        )
+                        logit_bias_txt = gr.Textbox(
+                            show_label=True,
+                            placeholder=f"word:likelihood",
+                            label="logit bias",
+                            value="",
+                            lines=1,
+                        )
+                        user_identifier_txt = gr.Textbox(
+                            show_label=True,
+                            placeholder=f"用于定位滥用行为",
+                            label="用户名",
+                            value=user_name.value,
+                            lines=1,
                         )
+                    with gr.Accordion("网络设置", open=False):
                         # 优先展示自定义的api_host
                         apihostTxt = gr.Textbox(
                             show_label=True,
                             lines=2,
                         )
                         changeProxyBtn = gr.Button("🔄 设置代理地址")
+                        default_btn = gr.Button("🔙 恢复默认设置")
+    gr.Markdown(CHUANHU_DESCRIPTION)
+    gr.HTML(FOOTER.format(versions=versions_html()), elem_id="footer")
     chatgpt_predict_args = dict(
         fn=predict,
         inputs=[
+            current_model,
             user_question,
             chatbot,
             use_streaming_checkbox,
             use_websearch_checkbox,
             index_files,
             language_select_dropdown,
         ],
+        outputs=[chatbot, status_display],
         show_progress=True,
     )
     )
     get_usage_args = dict(
+        fn=billing_info, inputs=[current_model], outputs=[usageTxt], show_progress=False
+    )
+    load_history_from_file_args = dict(
+        fn=load_chat_history,
+        inputs=[current_model, historyFileSelectDropdown, chatbot, user_name],
+        outputs=[saveFileName, systemPromptTxt, chatbot]
     )
     # Chatbot
+    cancelBtn.click(interrupt, [current_model], [])
     user_input.submit(**transfer_input_args).then(**chatgpt_predict_args).then(**end_outputing_args)
     user_input.submit(**get_usage_args)
     submitBtn.click(**transfer_input_args).then(**chatgpt_predict_args).then(**end_outputing_args)
     submitBtn.click(**get_usage_args)
+    index_files.change(handle_file_upload, [current_model, index_files, chatbot], [index_files, chatbot, status_display])
     emptyBtn.click(
+        reset,
+        inputs=[current_model],
+        outputs=[chatbot, status_display],
         show_progress=True,
     )
     emptyBtn.click(**reset_textbox_args)
     retryBtn.click(**start_outputing_args).then(
         retry,
         [
+            current_model,
             chatbot,
             use_streaming_checkbox,
+            use_websearch_checkbox,
+            index_files,
             language_select_dropdown,
         ],
+        [chatbot, status_display],
         show_progress=True,
     ).then(**end_outputing_args)
     retryBtn.click(**get_usage_args)
     delFirstBtn.click(
         delete_first_conversation,
+        [current_model],
+        [status_display],
     )
     delLastBtn.click(
         delete_last_conversation,
+        [current_model, chatbot],
+        [chatbot, status_display],
+        show_progress=False
     )
     two_column.change(update_doc_config, [two_column], None)
+    # LLM Models
+    keyTxt.change(set_key, [current_model, keyTxt], [user_api_key, status_display]).then(**get_usage_args)
     keyTxt.submit(**get_usage_args)
+    single_turn_checkbox.change(set_single_turn, [current_model, single_turn_checkbox], None)
+    model_select_dropdown.change(get_model, [model_select_dropdown, lora_select_dropdown, user_api_key, temperature_slider, top_p_slider, systemPromptTxt], [current_model, status_display, lora_select_dropdown], show_progress=True)
+    lora_select_dropdown.change(get_model, [model_select_dropdown, lora_select_dropdown, user_api_key, temperature_slider, top_p_slider, systemPromptTxt], [current_model, status_display], show_progress=True)
     # Template
+    systemPromptTxt.change(set_system_prompt, [current_model, systemPromptTxt], None)
     templateRefreshBtn.click(get_template_names, None, [templateFileSelectDropdown])
     templateFileSelectDropdown.change(
         load_template,
     # S&L
     saveHistoryBtn.click(
         save_chat_history,
+        [current_model, saveFileName, chatbot, user_name],
         downloadFile,
         show_progress=True,
     )
     saveHistoryBtn.click(get_history_names, [gr.State(False), user_name], [historyFileSelectDropdown])
     exportMarkdownBtn.click(
         export_markdown,
+        [current_model, saveFileName, chatbot, user_name],
         downloadFile,
         show_progress=True,
     )
     historyRefreshBtn.click(get_history_names, [gr.State(False), user_name], [historyFileSelectDropdown])
+    historyFileSelectDropdown.change(**load_history_from_file_args)
+    downloadFile.change(**load_history_from_file_args)
     # Advanced
+    max_context_length_slider.change(set_token_upper_limit, [current_model, max_context_length_slider], None)
+    temperature_slider.change(set_temperature, [current_model, temperature_slider], None)
+    top_p_slider.change(set_top_p, [current_model, top_p_slider], None)
+    n_choices_slider.change(set_n_choices, [current_model, n_choices_slider], None)
+    stop_sequence_txt.change(set_stop_sequence, [current_model, stop_sequence_txt], None)
+    max_generation_slider.change(set_max_tokens, [current_model, max_generation_slider], None)
+    presence_penalty_slider.change(set_presence_penalty, [current_model, presence_penalty_slider], None)
+    frequency_penalty_slider.change(set_frequency_penalty, [current_model, frequency_penalty_slider], None)
+    logit_bias_txt.change(set_logit_bias, [current_model, logit_bias_txt], None)
+    user_identifier_txt.change(set_user_identifier, [current_model, user_identifier_txt], None)
     default_btn.click(
         reset_default, [], [apihostTxt, proxyTxt, status_display], show_progress=True
     )
 if __name__ == "__main__":
     reload_javascript()
+    demo.queue(concurrency_count=CONCURRENT_COUNT).launch(
+        server_name=server_name,
+        server_port=server_port,
+        share=share,
+        auth=auth_list if authflag else None,
+        favicon_path="./assets/favicon.ico",
+        inbrowser=not dockerflag, # 禁止在docker下开启inbrowser
+    )
+    # demo.queue(concurrency_count=CONCURRENT_COUNT).launch(server_name="0.0.0.0", server_port=7860, share=False) # 可自定义端口
+    # demo.queue(concurrency_count=CONCURRENT_COUNT).launch(server_name="0.0.0.0", server_port=7860,auth=("在这里填写用户名", "在这里填写密码")) # 可设置用户名与密码
+    # demo.queue(concurrency_count=CONCURRENT_COUNT).launch(auth=("在这里填写用户名", "在这里填写密码")) # 适合Nginx反向代理

Dockerfile CHANGED Viewed

@@ -1,7 +1,9 @@
 FROM python:3.9 as builder
 RUN apt-get update && apt-get install -y build-essential
 COPY requirements.txt .
 RUN pip install --user -r requirements.txt
 FROM python:3.9
 MAINTAINER iskoldt
@@ -9,6 +11,5 @@ COPY --from=builder /root/.local /root/.local
 ENV PATH=/root/.local/bin:$PATH
 COPY . /app
 WORKDIR /app
-ENV my_api_key empty
 ENV dockerrun yes
 CMD ["python3", "-u", "ChuanhuChatbot.py", "2>&1", "|", "tee", "/var/log/application.log"]

 FROM python:3.9 as builder
 RUN apt-get update && apt-get install -y build-essential
 COPY requirements.txt .
+COPY requirements_advanced.txt .
 RUN pip install --user -r requirements.txt
+# RUN pip install --user -r requirements_advanced.txt
 FROM python:3.9
 MAINTAINER iskoldt
 ENV PATH=/root/.local/bin:$PATH
 COPY . /app
 WORKDIR /app
 ENV dockerrun yes
 CMD ["python3", "-u", "ChuanhuChatbot.py", "2>&1", "|", "tee", "/var/log/application.log"]

README.md CHANGED Viewed

@@ -1,13 +1,105 @@
----
-title: ChuanhuChatGPT
-emoji: 🐯
-colorFrom: green
-colorTo: red
-sdk: gradio
-sdk_version: 3.24.1
-app_file: ChuanhuChatbot.py
-pinned: false
-license: gpl-3.0
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

+<h1 align="center">川虎 Chat 🐯 Chuanhu Chat</h1>
+<div align="center">
+  <a href="https://github.com/GaiZhenBiao/ChuanhuChatGPT">
+    <img src="https://user-images.githubusercontent.com/70903329/227087087-93b37d64-7dc3-4738-a518-c1cf05591c8a.png" alt="Logo" height="156">
+  </a>
+  <p align="center">
+    <h3>为ChatGPT/ChatGLM/LLaMA等多种LLM提供了一个轻快好用的Web图形界面</h3>
+    <p align="center">
+      <a href="https://github.com/GaiZhenbiao/ChuanhuChatGPT/blob/main/LICENSE">
+        <img alt="License" src="https://img.shields.io/github/license/GaiZhenbiao/ChuanhuChatGPT" />
+      </a>
+      <a href="https://gradio.app/">
+        <img alt="Base: Gradio" src="https://img.shields.io/badge/Base-Gradio-fb7d1a?style=flat" />
+      </a>
+      <a href="https://t.me/tkdifferent">
+        <img alt="Telegram Group" src="https://img.shields.io/badge/Telegram-Group-blue.svg?logo=telegram" />
+      </a>
+      <p>
+        实时回复 / 无限对话 / 保存对话 / 预设Prompt集 / 联网搜索 / 根据文件回答 <br />
+        渲染LaTeX / 渲染表格 / 代码高亮 / 自动亮暗色切换 / 自适应界面 / “小而美”的体验 <br />
+        自定义api-Host / 多参数可调 / 多API Key均衡负载 / 多用户显示 / 适配GPT-4 / 支持本地部署LLM
+      </p>
+      <a href="https://www.bilibili.com/video/BV1mo4y1r7eE"><strong>视频教程</strong></a>
+        ·
+      <a href="https://www.bilibili.com/video/BV1184y1w7aP"><strong>2.0介绍视频</strong></a>
+	||
+      <a href="https://huggingface.co/spaces/JohnSmith9982/ChuanhuChatGPT"><strong>在线体验</strong></a>
+      	·
+      <a href="https://huggingface.co/login?next=%2Fspaces%2FJohnSmith9982%2FChuanhuChatGPT%3Fduplicate%3Dtrue"><strong>一键部署</strong></a>
+    </p>
+    <p align="center">
+      <img alt="Animation Demo" src="https://user-images.githubusercontent.com/51039745/226255695-6b17ff1f-ea8d-464f-b69b-a7b6b68fffe8.gif" />
+    </p>
+  </p>
+</div>
+## 目录
+|[使用技巧](#使用技巧)|[安装方式](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/使用教程)|[常见问题](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/常见问题)| [给作者买可乐🥤](#捐款) |
+|  ----  | ----  | ----  | --- |
+## 使用技巧
+- 使用System Prompt可以很有效地设定前提条件。
+- 使用Prompt模板功能时，选择Prompt模板集合文件，然后从下拉菜单中选择想要的prompt。
+- 如果回答不满意，可以使用`重新生成`按钮再试一次
+- 对于长对话，可以使用`优化Tokens`按钮减少Tokens占用。
+- 输入框支持换行，按`shift enter`即可。
+- 可以在输入框按上下箭头在输入历史之间切换
+- 部署到服务器：将程序最后一句改成`demo.launch(server_name="0.0.0.0", server_port=<你的端口号>)`。
+- 获取公共链接：将程序最后一句改成`demo.launch(share=True)`。注意程序必须在运行，才能通过公共链接访问。
+- 在Hugging Face上使用：建议在右上角 **复制Space** 再使用，这样App反应可能会快一点。
+## 安装方式、使用方式
+请查看[本项目的wiki页面](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/使用教程)。
+## 疑难杂症解决
+在遇到各种问题查阅相关信息前，您可以先尝试手动拉取本项目的最新更改并更新 gradio，然后重试。步骤为：
+1. 点击网页上的 `Download ZIP` 下载最新代码，或
+   ```shell
+   git pull https://github.com/GaiZhenbiao/ChuanhuChatGPT.git main -f
+   ```
+2. 尝试再次安装依赖（可能本项目引入了新的依赖）
+   ```
+   pip install -r requirements.txt
+   ```
+3. 更新gradio
+   ```
+   pip install gradio --upgrade --force-reinstall
+   ```
+很多时候，这样就可以解决问题。
+如果问题仍然存在，请查阅该页面：[常见问题](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/常见问题)
+该页面列出了**几乎所有**您可能遇到的各种问题，包括如何配置代理，以及遇到问题后您该采取的措施，**请务必认真阅读**。
+## 了解更多
+若需了解更多信息，请查看我们的 [wiki](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki)：
+- [想要做出贡献？](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/贡献指南)
+- [项目更新情况？](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/更新日志)
+- [二次开发许可？](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/使用许可)
+- [如何引用项目？](https://github.com/GaiZhenbiao/ChuanhuChatGPT/wiki/使用许可#如何引用该项目)
+## Starchart
+[![Star History Chart](https://api.star-history.com/svg?repos=GaiZhenbiao/ChuanhuChatGPT&type=Date)](https://star-history.com/#GaiZhenbiao/ChuanhuChatGPT&Date)
+## Contributors
+<a href="https://github.com/GaiZhenbiao/ChuanhuChatGPT/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=GaiZhenbiao/ChuanhuChatGPT" />
+</a>
+## 捐款
+🐯如果觉得这个软件对你有所帮助，欢迎请作者喝可乐、喝咖啡～
+<img width="250" alt="image" src="https://user-images.githubusercontent.com/51039745/226920291-e8ec0b0a-400f-4c20-ac13-dafac0c3aeeb.JPG">

assets/custom.css CHANGED Viewed

@@ -3,14 +3,18 @@
     --chatbot-color-dark: #121111;
 }
 /* 覆盖gradio的页脚信息QAQ */
 footer {
     display: none !important;
 }
-#footer{
     text-align: center;
 }
-#footer div{
     display: inline-block;
 }
 #footer .versions{
@@ -18,16 +22,34 @@ footer {
     opacity: 0.85;
 }
-/* user_info */
 #user_info {
     white-space: nowrap;
-    margin-top: -1.3em !important;
-    padding-left: 112px !important;
 }
 #user_info p {
-    font-size: .85em;
-    font-family: monospace;
-    color: var(--body-text-color-subdued);
 }
 /* status_display */
@@ -43,14 +65,18 @@ footer {
     color: var(--body-text-color-subdued);
 }
-#chuanhu_chatbot, #status_display {
     transition: all 0.6s;
 }
 /* usage_display */
-#usage_display {
     position: relative;
     margin: 0;
     box-shadow: var(--block-shadow);
     border-width: var(--block-border-width);
     border-color: var(--block-border-color);
@@ -62,7 +88,6 @@ footer {
 }
 #usage_display p, #usage_display span {
     margin: 0;
-    padding: .5em 1em;
     font-size: .85em;
     color: var(--body-text-color-subdued);
 }
@@ -74,7 +99,7 @@ footer {
     overflow: hidden;
 }
 .progress {
-    background-color: var(--block-title-background-fill);;
     height: 100%;
     border-radius: 10px;
     text-align: right;
@@ -88,38 +113,107 @@ footer {
     padding-right: 10px;
     line-height: 20px;
 }
 /* list */
 ol:not(.options), ul:not(.options) {
     padding-inline-start: 2em !important;
 }
-/* 亮色 */
-@media (prefers-color-scheme: light) {
     #chuanhu_chatbot {
-        background-color: var(--chatbot-color-light) !important;
-        color: #000000 !important;
     }
-    [data-testid = "bot"] {
-        background-color: #FFFFFF !important;
-    }
-    [data-testid = "user"] {
-        background-color: #95EC69 !important;
     }
 }
-/* 暗色 */
-@media (prefers-color-scheme: dark) {
     #chuanhu_chatbot {
-        background-color: var(--chatbot-color-dark) !important;
-        color: #FFFFFF !important;
     }
-    [data-testid = "bot"] {
-        background-color: #2C2C2C !important;
     }
-    [data-testid = "user"] {
-        background-color: #26B561 !important;
     }
-    body {
-        background-color: var(--neutral-950) !important;
     }
 }
 /* 对话气泡 */

     --chatbot-color-dark: #121111;
 }
+#app_title {
+    margin-top: 6px;
+    white-space: nowrap;
+}
 /* 覆盖gradio的页脚信息QAQ */
 footer {
     display: none !important;
 }
+#footer {
     text-align: center;
 }
+#footer div {
     display: inline-block;
 }
 #footer .versions{
     opacity: 0.85;
 }
+#float_display {
+    position: absolute;
+    max-height: 30px;
+}
+/* user_info */
 #user_info {
     white-space: nowrap;
+    position: absolute; left: 8em; top: .2em;
+    z-index: var(--layer-2);
+    box-shadow: var(--block-shadow);
+    border: none; border-radius: var(--block-label-radius);
+    background: var(--color-accent);
+    padding: var(--block-label-padding);
+    font-size: var(--block-label-text-size); line-height: var(--line-sm);
+    width: auto; min-height: 30px!important;
+    opacity: 1;
+    transition: opacity 0.3s ease-in-out;
+}
+#user_info .wrap {
+    opacity: 0;
 }
 #user_info p {
+    color: white;
+    font-weight: var(--block-label-text-weight);
+}
+#user_info.hideK {
+    opacity: 0;
+    transition: opacity 1s ease-in-out;
 }
 /* status_display */
     color: var(--body-text-color-subdued);
 }
+#status_display {
     transition: all 0.6s;
 }
+#chuanhu_chatbot {
+    transition: height 0.3s ease;
+}
 /* usage_display */
+.insert_block {
     position: relative;
     margin: 0;
+    padding: .5em 1em;
     box-shadow: var(--block-shadow);
     border-width: var(--block-border-width);
     border-color: var(--block-border-color);
 }
 #usage_display p, #usage_display span {
     margin: 0;
     font-size: .85em;
     color: var(--body-text-color-subdued);
 }
     overflow: hidden;
 }
 .progress {
+    background-color: var(--block-title-background-fill);
     height: 100%;
     border-radius: 10px;
     text-align: right;
     padding-right: 10px;
     line-height: 20px;
 }
+.apSwitch {
+    top: 2px;
+    display: inline-block;
+    height: 24px;
+    position: relative;
+    width: 48px;
+    border-radius: 12px;
+}
+.apSwitch input {
+    display: none !important;
+}
+.apSlider {
+    background-color: var(--block-label-background-fill);
+    bottom: 0;
+    cursor: pointer;
+    left: 0;
+    position: absolute;
+    right: 0;
+    top: 0;
+    transition: .4s;
+    font-size: 18px;
+    border-radius: 12px;
+}
+.apSlider::before {
+    bottom: -1.5px;
+    left: 1px;
+    position: absolute;
+    transition: .4s;
+    content: "🌞";
+}
+input:checked + .apSlider {
+    background-color: var(--block-label-background-fill);
+}
+input:checked + .apSlider::before {
+    transform: translateX(23px);
+    content:"🌚";
+}
+#submit_btn, #cancel_btn {
+    height: 42px !important;
+}
+#submit_btn::before {
+    content: url("data:image/svg+xml, %3Csvg width='21px' height='20px' viewBox='0 0 21 20' version='1.1' xmlns='http://www.w3.org/2000/svg' xmlns:xlink='http://www.w3.org/1999/xlink'%3E %3Cg id='page' stroke='none' stroke-width='1' fill='none' fill-rule='evenodd'%3E %3Cg id='send' transform='translate(0.435849, 0.088463)' fill='%23FFFFFF' fill-rule='nonzero'%3E %3Cpath d='M0.579148261,0.0428666046 C0.301105539,-0.0961547561 -0.036517765,0.122307382 0.0032026237,0.420210298 L1.4927172,18.1553639 C1.5125774,18.4334066 1.79062012,18.5922882 2.04880264,18.4929872 L8.24518329,15.8913017 L11.6412765,19.7441794 C11.8597387,19.9825018 12.2370824,19.8832008 12.3165231,19.5852979 L13.9450591,13.4882182 L19.7839562,11.0255541 C20.0619989,10.8865327 20.0818591,10.4694687 19.7839562,10.3105871 L0.579148261,0.0428666046 Z M11.6138902,17.0883151 L9.85385903,14.7195502 L0.718169621,0.618812241 L12.69945,12.9346347 L11.6138902,17.0883151 Z' id='shape'%3E%3C/path%3E %3C/g%3E %3C/g%3E %3C/svg%3E");
+    height: 21px;
+}
+#cancel_btn::before {
+    content: url("data:image/svg+xml,%3Csvg width='21px' height='21px' viewBox='0 0 21 21' version='1.1' xmlns='http://www.w3.org/2000/svg' xmlns:xlink='http://www.w3.org/1999/xlink'%3E %3Cg id='pg' stroke='none' stroke-width='1' fill='none' fill-rule='evenodd'%3E %3Cpath d='M10.2072007,20.088463 C11.5727865,20.088463 12.8594566,19.8259823 14.067211,19.3010209 C15.2749653,18.7760595 16.3386126,18.0538087 17.2581528,17.1342685 C18.177693,16.2147282 18.8982283,15.1527965 19.4197586,13.9484733 C19.9412889,12.7441501 20.202054,11.4557644 20.202054,10.0833163 C20.202054,8.71773046 19.9395733,7.43106036 19.4146119,6.22330603 C18.8896505,5.01555169 18.1673997,3.95018885 17.2478595,3.0272175 C16.3283192,2.10424615 15.2646719,1.3837109 14.0569176,0.865611739 C12.8491633,0.34751258 11.5624932,0.088463 10.1969073,0.088463 C8.83132146,0.088463 7.54636692,0.34751258 6.34204371,0.865611739 C5.1377205,1.3837109 4.07407321,2.10424615 3.15110186,3.0272175 C2.22813051,3.95018885 1.5058797,5.01555169 0.984349419,6.22330603 C0.46281914,7.43106036 0.202054,8.71773046 0.202054,10.0833163 C0.202054,11.4557644 0.4645347,12.7441501 0.9894961,13.9484733 C1.5144575,15.1527965 2.23670831,16.2147282 3.15624854,17.1342685 C4.07578877,18.0538087 5.1377205,18.7760595 6.34204371,19.3010209 C7.54636692,19.8259823 8.83475258,20.088463 10.2072007,20.088463 Z M10.2072007,18.2562448 C9.07493099,18.2562448 8.01471483,18.0452309 7.0265522,17.6232031 C6.03838956,17.2011753 5.17031614,16.6161693 4.42233192,15.8681851 C3.6743477,15.1202009 3.09105726,14.2521274 2.67246059,13.2639648 C2.25386392,12.2758022 2.04456558,11.215586 2.04456558,10.0833163 C2.04456558,8.95104663 2.25386392,7.89083047 2.67246059,6.90266784 C3.09105726,5.9145052 3.6743477,5.04643178 4.42233192,4.29844756 C5.17031614,3.55046334 6.036674,2.9671729 7.02140552,2.54857623 C8.00613703,2.12997956 9.06463763,1.92068122 10.1969073,1.92068122 C11.329177,1.92068122 12.3911087,2.12997956 13.3827025,2.54857623 C14.3742962,2.9671729 
15.2440852,3.55046334 15.9920694,4.29844756 C16.7400537,5.04643178 17.3233441,5.9145052 17.7419408,6.90266784 C18.1605374,7.89083047 18.3698358,8.95104663 18.3698358,10.0833163 C18.3698358,11.215586 18.1605374,12.2758022 17.7419408,13.2639648 C17.3233441,14.2521274 16.7400537,15.1202009 15.9920694,15.8681851 C15.2440852,16.6161693 14.3760118,17.2011753 13.3878492,17.6232031 C12.3996865,18.0452309 11.3394704,18.2562448 10.2072007,18.2562448 Z M7.65444721,13.6242324 L12.7496608,13.6242324 C13.0584616,13.6242324 13.3003556,13.5384544 13.4753427,13.3668984 C13.6503299,13.1953424 13.7378234,12.9585951 13.7378234,12.6566565 L13.7378234,7.49968276 C13.7378234,7.19774418 13.6503299,6.96099688 13.4753427,6.78944087 C13.3003556,6.61788486 13.0584616,6.53210685 12.7496608,6.53210685 L7.65444721,6.53210685 C7.33878414,6.53210685 7.09345904,6.61788486 6.91847191,6.78944087 C6.74348478,6.96099688 6.65599121,7.19774418 6.65599121,7.49968276 L6.65599121,12.6566565 C6.65599121,12.9585951 6.74348478,13.1953424 6.91847191,13.3668984 C7.09345904,13.5384544 7.33878414,13.6242324 7.65444721,13.6242324 Z' id='shape' fill='%23FF3B30' fill-rule='nonzero'%3E%3C/path%3E %3C/g%3E %3C/svg%3E");
+    height: 21px;
+}
 /* list */
 ol:not(.options), ul:not(.options) {
     padding-inline-start: 2em !important;
 }
+/* 亮色（默认） */
+#chuanhu_chatbot {
+    background-color: var(--chatbot-color-light) !important;
+    color: #000000 !important;
+}
+[data-testid = "bot"] {
+    background-color: #FFFFFF !important;
+}
+[data-testid = "user"] {
+    background-color: #95EC69 !important;
+}
+/* 暗色 */
+.dark #chuanhu_chatbot {
+    background-color: var(--chatbot-color-dark) !important;
+    color: #FFFFFF !important;
+}
+.dark [data-testid = "bot"] {
+    background-color: #2C2C2C !important;
+}
+.dark [data-testid = "user"] {
+    background-color: #26B561 !important;
+}
+/* 屏幕宽度大于等于500px的设备 */
+/* update on 2023.4.8: 高度的细致调整已写入JavaScript */
+@media screen and (min-width: 500px) {
     #chuanhu_chatbot {
+        height: calc(100vh - 200px);
     }
+    #chuanhu_chatbot .wrap {
+        max-height: calc(100vh - 200px - var(--line-sm)*1rem - 2*var(--block-label-margin) );
     }
 }
+/* 屏幕宽度小于500px的设备 */
+@media screen and (max-width: 499px) {
     #chuanhu_chatbot {
+        height: calc(100vh - 140px);
     }
+    #chuanhu_chatbot .wrap {
+        max-height: calc(100vh - 140px - var(--line-sm)*1rem - 2*var(--block-label-margin) );
     }
+    [data-testid = "bot"] {
+        max-width: 98% !important;
     }
+    #app_title h1{
+        letter-spacing: -1px; font-size: 22px;
     }
 }
 /* 对话气泡 */

assets/custom.js CHANGED Viewed

@@ -1,70 +1,224 @@
 // custom javascript here
 const MAX_HISTORY_LENGTH = 32;
 var key_down_history = [];
 var currentIndex = -1;
 var user_input_ta;
 var ga = document.getElementsByTagName("gradio-app");
 var targetNode = ga[0];
-var observer = new MutationObserver(function(mutations) {
     for (var i = 0; i < mutations.length; i++) {
-        if (mutations[i].addedNodes.length) {
-          var user_input_tb = document.getElementById('user_input_tb');
-          if (user_input_tb) {
-            // 监听到user_input_tb被添加到DOM树中
-            // 这里可以编写元素加载完成后需要执行的代码
-            user_input_ta = user_input_tb.querySelector("textarea");
-            if (user_input_ta){
-                observer.disconnect(); // 停止监听
-                // 在 textarea 上监听 keydown 事件
-                user_input_ta.addEventListener("keydown", function (event) {
-                    var value = user_input_ta.value.trim();
-                    // 判断按下的是否为方向键
-                    if (event.code === 'ArrowUp' || event.code === 'ArrowDown') {
-                        // 如果按下的是方向键，且输入框中有内容，且历史记录中没有该内容，则不执行操作
-                        if(value && key_down_history.indexOf(value) === -1)
-                            return;
-                        // 对于需要响应的动作，阻止默认行为。
-                        event.preventDefault();
-                        var length = key_down_history.length;
-                        if(length === 0) {
-                            currentIndex = -1; // 如果历史记录为空，直接将当前选中的记录重置
-                            return;
-                        }
-                        if (currentIndex === -1) {
-                            currentIndex = length;
-                        }
-                        if (event.code === 'ArrowUp' && currentIndex > 0) {
-                            currentIndex--;
-                            user_input_ta.value = key_down_history[currentIndex];
-                        } else if (event.code === 'ArrowDown' && currentIndex < length - 1) {
-                            currentIndex++;
-                            user_input_ta.value = key_down_history[currentIndex];
-                        }
-                        user_input_ta.selectionStart = user_input_ta.value.length;
-                        user_input_ta.selectionEnd = user_input_ta.value.length;
-                        const input_event = new InputEvent("input", {bubbles: true, cancelable: true});
-                        user_input_ta.dispatchEvent(input_event);
-                    }else if(event.code === "Enter") {
-                        if (value) {
-                            currentIndex = -1;
-                            if(key_down_history.indexOf(value) === -1){
-                                key_down_history.push(value);
-                                if (key_down_history.length > MAX_HISTORY_LENGTH) {
-                                    key_down_history.shift();
-                                }
-                            }
                         }
                     }
-                });
-                break;
             }
-          }
         }
-      }
-});
-// 监听目标节点的子节点列表是否发生变化
-observer.observe(targetNode, { childList: true ,  subtree: true });

 // custom javascript here
+// Input-history state used by selectHistory(): once the history grows past
+// MAX_HISTORY_LENGTH entries, the oldest entry is dropped.
 const MAX_HISTORY_LENGTH = 32;
 var key_down_history = [];
+// Index into key_down_history of the entry currently shown; -1 means none is selected.
 var currentIndex = -1;
 var user_input_ta;
+// DOM references. They start as null and are filled in by gradioLoaded()
+// (user_input_ta by selectHistory()) once the elements exist.
+var gradioContainer = null;
+var user_input_ta = null;
+var user_input_tb = null;
+var userInfoDiv = null;
+var appTitleDiv = null;
+var chatbot = null;
+var apSwitch = null;
+// Root <gradio-app> element; the MutationObserver below watches it.
 var ga = document.getElementsByTagName("gradio-app");
 var targetNode = ga[0];
+// True when this window is not the top-level window (the page is embedded in a frame).
+var isInIframe = (window.self !== window.top);
+// gradio 页面加载好了么??? 我能动你的元素了么??
+function gradioLoaded(mutations) {
     for (var i = 0; i < mutations.length; i++) {
+        if (mutations[i].addedNodes.length) {
+            gradioContainer = document.querySelector(".gradio-container");
+            user_input_tb = document.getElementById('user_input_tb');
+            userInfoDiv = document.getElementById("user_info");
+            appTitleDiv = document.getElementById("app_title");
+            chatbot = document.querySelector('#chuanhu_chatbot');
+            apSwitch = document.querySelector('.apSwitch input[type="checkbox"]');
+            if (gradioContainer && apSwitch) {  // gradioCainter 加载出来了没?
+                adjustDarkMode();
+            }
+            if (user_input_tb) {  // user_input_tb 加载出来了没?
+                selectHistory();
+            }
+            if (userInfoDiv && appTitleDiv) {  // userInfoDiv 和 appTitleDiv 加载出来了没?
+                setTimeout(showOrHideUserInfo(), 2000);
+            }
+            if (chatbot) {  // chatbot 加载出来了没?
+                setChatbotHeight()
+            }
+        }
+    }
+}
+// Attach input-history navigation to the chat textarea inside user_input_tb.
+// ArrowUp / ArrowDown step through key_down_history; Enter records the
+// current (trimmed) text as a new history entry. Once the textarea is found
+// the MutationObserver is disconnected.
+function selectHistory() {
+    user_input_ta = user_input_tb.querySelector("textarea");
+    if (user_input_ta) {
+        observer.disconnect(); // stop observing
+        // Listen for keydown events on the textarea
+        user_input_ta.addEventListener("keydown", function (event) {
+            var value = user_input_ta.value.trim();
+            // Check whether an arrow key was pressed
+            if (event.code === 'ArrowUp' || event.code === 'ArrowDown') {
+                // If an arrow key was pressed while the box holds text that is not in the history, do nothing
+                if (value && key_down_history.indexOf(value) === -1)
+                    return;
+                // For the actions we do handle, suppress the default behavior.
+                event.preventDefault();
+                var length = key_down_history.length;
+                if (length === 0) {
+                    currentIndex = -1; // history is empty: just reset the current selection
+                    return;
+                }
+                if (currentIndex === -1) {
+                    currentIndex = length;
+                }
+                if (event.code === 'ArrowUp' && currentIndex > 0) {
+                    currentIndex--;
+                    user_input_ta.value = key_down_history[currentIndex];
+                } else if (event.code === 'ArrowDown' && currentIndex < length - 1) {
+                    currentIndex++;
+                    user_input_ta.value = key_down_history[currentIndex];
+                }
+                // Move the caret to the end of the text
+                user_input_ta.selectionStart = user_input_ta.value.length;
+                user_input_ta.selectionEnd = user_input_ta.value.length;
+                // Dispatch an "input" event on the textarea after changing its value programmatically
+                const input_event = new InputEvent("input", { bubbles: true, cancelable: true });
+                user_input_ta.dispatchEvent(input_event);
+            } else if (event.code === "Enter") {
+                if (value) {
+                    currentIndex = -1;
+                    // Store each distinct entry once; drop the oldest when over the limit
+                    if (key_down_history.indexOf(value) === -1) {
+                        key_down_history.push(value);
+                        if (key_down_history.length > MAX_HISTORY_LENGTH) {
+                            key_down_history.shift();
                         }
                     }
+                }
             }
+        });
+    }
+}
+function toggleUserInfoVisibility(shouldHide) {
+    if (userInfoDiv) {
+        if (shouldHide) {
+            userInfoDiv.classList.add("hideK");
+        } else {
+            userInfoDiv.classList.remove("hideK");
         }
+    }
+}
+function showOrHideUserInfo() {
+    var sendBtn = document.getElementById("submit_btn");
+    // Bind mouse/touch events to show/hide user info
+    appTitleDiv.addEventListener("mouseenter", function () {
+        toggleUserInfoVisibility(false);
+    });
+    userInfoDiv.addEventListener("mouseenter", function () {
+        toggleUserInfoVisibility(false);
+    });
+    sendBtn.addEventListener("mouseenter", function () {
+        toggleUserInfoVisibility(false);
+    });
+    appTitleDiv.addEventListener("mouseleave", function () {
+        toggleUserInfoVisibility(true);
+    });
+    userInfoDiv.addEventListener("mouseleave", function () {
+        toggleUserInfoVisibility(true);
+    });
+    sendBtn.addEventListener("mouseleave", function () {
+        toggleUserInfoVisibility(true);
+    });
+    appTitleDiv.ontouchstart = function () {
+        toggleUserInfoVisibility(false);
+    };
+    userInfoDiv.ontouchstart = function () {
+        toggleUserInfoVisibility(false);
+    };
+    sendBtn.ontouchstart = function () {
+        toggleUserInfoVisibility(false);
+    };
+    appTitleDiv.ontouchend = function () {
+        setTimeout(function () {
+            toggleUserInfoVisibility(true);
+        }, 3000);
+    };
+    userInfoDiv.ontouchend = function () {
+        setTimeout(function () {
+            toggleUserInfoVisibility(true);
+        }, 3000);
+    };
+    sendBtn.ontouchend = function () {
+        setTimeout(function () {
+            toggleUserInfoVisibility(true);
+        }, 3000); // Delay 1 second to hide user info
+    };
+    // Hide user info after 2 second
+    setTimeout(function () {
+        toggleUserInfoVisibility(true);
+    }, 2000);
+}
+function toggleDarkMode(isEnabled) {
+    if (isEnabled) {
+        gradioContainer.classList.add("dark");
+        document.body.style.setProperty("background-color", "var(--neutral-950)", "important");
+    } else {
+        gradioContainer.classList.remove("dark");
+        document.body.style.backgroundColor = "";
+    }
+}
+function adjustDarkMode() {
+    const darkModeQuery = window.matchMedia("(prefers-color-scheme: dark)");
+    // 根据当前颜色模式设置初始状态
+    apSwitch.checked = darkModeQuery.matches;
+    toggleDarkMode(darkModeQuery.matches);
+    // 监听颜色模式变化
+    darkModeQuery.addEventListener("change", (e) => {
+        apSwitch.checked = e.matches;
+        toggleDarkMode(e.matches);
+    });
+    // apSwitch = document.querySelector('.apSwitch input[type="checkbox"]');
+    apSwitch.addEventListener("change", (e) => {
+        toggleDarkMode(e.target.checked);
+    });
+}
+function setChatbotHeight() {
+    const screenWidth = window.innerWidth;
+    const statusDisplay = document.querySelector('#status_display');
+    const statusDisplayHeight = statusDisplay ? statusDisplay.offsetHeight : 0;
+    const wrap = chatbot.querySelector('.wrap');
+    const vh = window.innerHeight * 0.01;
+    document.documentElement.style.setProperty('--vh', `${vh}px`);
+    if (isInIframe) {
+        chatbot.style.height = `700px`;
+        wrap.style.maxHeight = `calc(700px - var(--line-sm) * 1rem - 2 * var(--block-label-margin))`
+    } else {
+        if (screenWidth <= 320) {
+            chatbot.style.height = `calc(var(--vh, 1vh) * 100 - ${statusDisplayHeight + 150}px)`;
+            wrap.style.maxHeight = `calc(var(--vh, 1vh) * 100 - ${statusDisplayHeight + 150}px - var(--line-sm) * 1rem - 2 * var(--block-label-margin))`;
+        } else if (screenWidth <= 499) {
+            chatbot.style.height = `calc(var(--vh, 1vh) * 100 - ${statusDisplayHeight + 100}px)`;
+            wrap.style.maxHeight = `calc(var(--vh, 1vh) * 100 - ${statusDisplayHeight + 100}px - var(--line-sm) * 1rem - 2 * var(--block-label-margin))`;
+        } else {
+            chatbot.style.height = `calc(var(--vh, 1vh) * 100 - ${statusDisplayHeight + 160}px)`;
+            wrap.style.maxHeight = `calc(var(--vh, 1vh) * 100 - ${statusDisplayHeight + 160}px - var(--line-sm) * 1rem - 2 * var(--block-label-margin))`;
+        }
+    }
+}
+// Watch for DOM changes inside <gradio-app>; every mutation batch is handed
+// to gradioLoaded(), which picks up the elements as they appear.
+var observer = new MutationObserver(function (mutations) {
+    gradioLoaded(mutations);
+});
+observer.observe(targetNode, { childList: true, subtree: true });
+// Watch for page-level changes
+window.addEventListener("DOMContentLoaded", function () {
+    // Re-evaluate whether the page is embedded in a frame
+    isInIframe = (window.self !== window.top);
+});
+// Recompute the chatbot height whenever the window is resized or scrolled
+window.addEventListener('resize', setChatbotHeight);
+window.addEventListener('scroll', setChatbotHeight);
+// NOTE(review): adjustDarkMode() registers a "change" listener on this same
+// media query itself; confirm this extra registration is needed.
+window.matchMedia("(prefers-color-scheme: dark)").addEventListener("change", adjustDarkMode);

config_example.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+    // 你的OpenAI API Key，一般必填，
+    // 若缺省填为 "openai_api_key": "" 则必须再在图形界面中填入API Key
+    "openai_api_key": "",
+    // 如果使用代理，请取消注释下面的两行，并替换代理URL
+    // "https_proxy": "http://127.0.0.1:1079",
+    // "http_proxy": "http://127.0.0.1:1079",
+    "users": [], // 用户列表，[[用户名1, 密码1], [用户名2, 密码2], ...]
+    "local_embedding": false, //是否在本地编制索引
+    "default_model": "gpt-3.5-turbo", // 默认模型
+    "advance_docs": {
+        "pdf": {
+            // 是否认为PDF是双栏的
+            "two_column": false,
+            // 是否使用OCR识别PDF中的公式
+            "formula_ocr": true
+        }
+    },
+    // 是否多个API Key轮换使用
+    "multi_api_key": false,
+    "api_key_list": [
+        "sk-xxxxxxxxxxxxxxxxxxxxxxxx1",
+        "sk-xxxxxxxxxxxxxxxxxxxxxxxx2",
+        "sk-xxxxxxxxxxxxxxxxxxxxxxxx3"
+    ],
+    // 如果使用自定义端口、自定义ip，请取消注释并替换对应内容
+    // "server_name": "0.0.0.0",
+    // "server_port": 7860,
+    // 如果要share到gradio，设置为true
+    // "share": false,
+}

configs/ds_config_chatbot.json ADDED Viewed

	@@ -0,0 +1,17 @@

+{
+    "fp16": {
+        "enabled": false
+    },
+    "bf16": {
+        "enabled": true
+    },
+    "comms_logger": {
+        "enabled": false,
+        "verbose": false,
+        "prof_all": false,
+        "debug": false
+    },
+    "steps_per_print": 20000000000000000,
+    "train_micro_batch_size_per_gpu": 1,
+    "wall_clock_breakdown": false
+}

modules/__init__.py ADDED Viewed

File without changes

modules/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (172 Bytes). View file

modules/__pycache__/__init__.cpython-39.pyc ADDED Viewed

Binary file (154 Bytes). View file

modules/__pycache__/base_model.cpython-311.pyc ADDED Viewed

Binary file (26.7 kB). View file

modules/__pycache__/base_model.cpython-39.pyc ADDED Viewed

Binary file (15.8 kB). View file

modules/__pycache__/config.cpython-311.pyc ADDED Viewed

Binary file (7.87 kB). View file

modules/__pycache__/config.cpython-39.pyc CHANGED Viewed

Binary files a/modules/__pycache__/config.cpython-39.pyc and b/modules/__pycache__/config.cpython-39.pyc differ

modules/__pycache__/llama_func.cpython-311.pyc ADDED Viewed

Binary file (9.28 kB). View file

modules/__pycache__/models.cpython-311.pyc ADDED Viewed

Binary file (30.6 kB). View file

modules/base_model.py ADDED Viewed

	@@ -0,0 +1,547 @@

+from __future__ import annotations
+from typing import TYPE_CHECKING, List
+import logging
+import json
+import commentjson as cjson
+import os
+import sys
+import requests
+import urllib3
+import traceback
+from tqdm import tqdm
+import colorama
+from duckduckgo_search import ddg
+import asyncio
+import aiohttp
+from enum import Enum
+from .presets import *
+from .llama_func import *
+from .utils import *
+from . import shared
+from .config import retrieve_proxy
+class ModelType(Enum):
+    Unknown = -1
+    OpenAI = 0
+    ChatGLM = 1
+    LLaMA = 2
+    XMBot = 3
+    @classmethod
+    def get_type(cls, model_name: str):
+        model_type = None
+        model_name_lower = model_name.lower()
+        if "gpt" in model_name_lower:
+            model_type = ModelType.OpenAI
+        elif "chatglm" in model_name_lower:
+            model_type = ModelType.ChatGLM
+        elif "llama" in model_name_lower or "alpaca" in model_name_lower:
+            model_type = ModelType.LLaMA
+        elif "xmbot" in model_name_lower:
+            model_type = ModelType.XMBot
+        else:
+            model_type = ModelType.Unknown
+        return model_type
+class BaseLLMModel:
+    def __init__(
+        self,
+        model_name,
+        system_prompt="",
+        temperature=1.0,
+        top_p=1.0,
+        n_choices=1,
+        stop=None,
+        max_generation_token=None,
+        presence_penalty=0,
+        frequency_penalty=0,
+        logit_bias=None,
+        user="",
+    ) -> None:
+        self.history = []
+        self.all_token_counts = []
+        self.model_name = model_name
+        self.model_type = ModelType.get_type(model_name)
+        try:
+            self.token_upper_limit = MODEL_TOKEN_LIMIT[model_name]
+        except KeyError:
+            self.token_upper_limit = DEFAULT_TOKEN_LIMIT
+        self.interrupted = False
+        self.system_prompt = system_prompt
+        self.api_key = None
+        self.need_api_key = False
+        self.single_turn = False
+        self.temperature = temperature
+        self.top_p = top_p
+        self.n_choices = n_choices
+        self.stop_sequence = stop
+        self.max_generation_token = None
+        self.presence_penalty = presence_penalty
+        self.frequency_penalty = frequency_penalty
+        self.logit_bias = logit_bias
+        self.user_identifier = user
+    def get_answer_stream_iter(self):
+        """stream predict, need to be implemented
+        conversations are stored in self.history, with the most recent question, in OpenAI format
+        should return a generator, each time give the next word (str) in the answer
+        """
+        logging.warning("stream predict not implemented, using at once predict instead")
+        response, _ = self.get_answer_at_once()
+        yield response
+    def get_answer_at_once(self):
+        """predict at once, need to be implemented
+        conversations are stored in self.history, with the most recent question, in OpenAI format
+        Should return:
+        the answer (str)
+        total token count (int)
+        """
+        logging.warning("at once predict not implemented, using stream predict instead")
+        response_iter = self.get_answer_stream_iter()
+        count = 0
+        for response in response_iter:
+            count += 1
+        return response, sum(self.all_token_counts) + count
+    def billing_info(self):
+        """get billing infomation, inplement if needed"""
+        logging.warning("billing info not implemented, using default")
+        return BILLING_NOT_APPLICABLE_MSG
+    def count_token(self, user_input):
+        """get token count from input, implement if needed"""
+        logging.warning("token count not implemented, using default")
+        return len(user_input)
+    def stream_next_chatbot(self, inputs, chatbot, fake_input=None, display_append=""):
+        def get_return_value():
+            return chatbot, status_text
+        status_text = "开始实时传输回答……"
+        if fake_input:
+            chatbot.append((fake_input, ""))
+        else:
+            chatbot.append((inputs, ""))
+        user_token_count = self.count_token(inputs)
+        self.all_token_counts.append(user_token_count)
+        logging.debug(f"输入token计数: {user_token_count}")
+        stream_iter = self.get_answer_stream_iter()
+        for partial_text in stream_iter:
+            chatbot[-1] = (chatbot[-1][0], partial_text + display_append)
+            self.all_token_counts[-1] += 1
+            status_text = self.token_message()
+            yield get_return_value()
+            if self.interrupted:
+                self.recover()
+                break
+        self.history.append(construct_assistant(partial_text))
+    def next_chatbot_at_once(self, inputs, chatbot, fake_input=None, display_append=""):
+        if fake_input:
+            chatbot.append((fake_input, ""))
+        else:
+            chatbot.append((inputs, ""))
+        if fake_input is not None:
+            user_token_count = self.count_token(fake_input)
+        else:
+            user_token_count = self.count_token(inputs)
+        self.all_token_counts.append(user_token_count)
+        ai_reply, total_token_count = self.get_answer_at_once()
+        self.history.append(construct_assistant(ai_reply))
+        if fake_input is not None:
+            self.history[-2] = construct_user(fake_input)
+        chatbot[-1] = (chatbot[-1][0], ai_reply + display_append)
+        if fake_input is not None:
+            self.all_token_counts[-1] += count_token(construct_assistant(ai_reply))
+        else:
+            self.all_token_counts[-1] = total_token_count - sum(self.all_token_counts)
+        status_text = self.token_message()
+        return chatbot, status_text
+    def handle_file_upload(self, files, chatbot):
+        """if the model accepts multi modal input, implement this function"""
+        status = gr.Markdown.update()
+        if files:
+            construct_index(self.api_key, file_src=files)
+            status = "索引构建完成"
+        return gr.Files.update(), chatbot, status
+    def prepare_inputs(self, real_inputs, use_websearch, files, reply_language, chatbot):
+        """Wrap the user's query with retrieved context before it is sent to the model.
+
+        When ``files`` is truthy, the query is matched against an index built
+        from those files. Otherwise, when ``use_websearch`` is truthy, web
+        search results are used. In both cases the query is substituted into
+        a prompt template and ``limited_context`` becomes True.
+
+        Returns:
+            A 5-tuple ``(limited_context, fake_inputs, display_append,
+            real_inputs, chatbot)``. ``fake_inputs`` is the untouched user
+            query, ``display_append`` is the reference text to show after the
+            answer ("" when nothing was retrieved), and ``real_inputs`` is the
+            prompt that will actually be sent.
+
+        Raises:
+            AssertionError: if ``construct_index`` returns None.
+        """
+        fake_inputs = real_inputs
+        limited_context = False
+        display_append = ""
+        if files:
+            # Imported lazily so the heavy retrieval stack is only loaded on demand.
+            from llama_index.indices.vector_store.base_query import GPTVectorStoreIndexQuery
+            from llama_index.indices.query.schema import QueryBundle
+            from langchain.embeddings.huggingface import HuggingFaceEmbeddings
+            from llama_index import (
+                ServiceContext,
+                LangchainEmbedding,
+                OpenAIEmbedding,
+            )
+            limited_context = True
+            logging.info("加载索引中……")
+            index = construct_index(self.api_key, file_src=files)
+            assert index is not None, "获取索引失败"
+            logging.info("索引获取成功，生成回答中……")
+            if local_embedding or self.model_type != ModelType.OpenAI:
+                embed_model = LangchainEmbedding(HuggingFaceEmbeddings())
+            else:
+                embed_model = OpenAIEmbedding()
+            with retrieve_proxy():
+                prompt_helper = PromptHelper(
+                    max_input_size=4096,
+                    num_output=5,
+                    max_chunk_overlap=20,
+                    chunk_size_limit=600,
+                )
+                service_context = ServiceContext.from_defaults(
+                    prompt_helper=prompt_helper, embed_model=embed_model
+                )
+                query_object = GPTVectorStoreIndexQuery(
+                    index.index_struct,
+                    service_context=service_context,
+                    similarity_top_k=5,
+                    vector_store=index._vector_store,
+                    docstore=index._docstore,
+                )
+                nodes = query_object.retrieve(QueryBundle(real_inputs))
+            reference_results = [n.node.text for n in nodes]
+            reference_results = add_source_numbers(reference_results, use_source=False)
+            display_append = "\n\n" + "".join(add_details(reference_results))
+            real_inputs = (
+                replace_today(PROMPT_TEMPLATE)
+                .replace("{query_str}", real_inputs)
+                .replace("{context_str}", "\n\n".join(reference_results))
+                .replace("{reply_language}", reply_language)
+            )
+        elif use_websearch:
+            limited_context = True
+            search_results = ddg(real_inputs, max_results=5)
+            reference_results = []
+            link_lines = []
+            for idx, result in enumerate(search_results):
+                logging.debug(f"搜索结果{idx + 1}：{result}")
+                domain_name = urllib3.util.parse_url(result["href"]).host
+                reference_results.append([result["body"], result["href"]])
+                link_lines.append(
+                    f"{idx+1}. [{domain_name}]({result['href']})\n"
+                )
+            reference_results = add_source_numbers(reference_results)
+            display_append = "\n\n" + "".join(link_lines)
+            real_inputs = (
+                replace_today(WEBSEARCH_PTOMPT_TEMPLATE)
+                .replace("{query}", real_inputs)
+                .replace("{web_results}", "\n\n".join(reference_results))
+                .replace("{reply_language}", reply_language)
+            )
+        return limited_context, fake_inputs, display_append, real_inputs, chatbot
+    def predict(
+        self,
+        inputs,
+        chatbot,
+        stream=False,
+        use_websearch=False,
+        files=None,
+        reply_language="中文",
+        should_check_token_count=True,
+    ):  # repetition_penalty, top_k
+        """Generate a reply to ``inputs``, yielding ``(chatbot, status_text)`` updates.
+
+        This is a generator. It first lets ``prepare_inputs`` wrap the query
+        with file or web-search context, validates the API key and the input,
+        then delegates to ``stream_next_chatbot`` or ``next_chatbot_at_once``
+        depending on ``stream``. Afterwards it trims ``self.history`` and
+        ``self.all_token_counts`` when the token budget is exceeded.
+
+        Exceptions raised while generating the answer are printed and surfaced
+        through ``status_text`` instead of propagating.
+        """
+        status_text = "开始生成回答……"
+        logging.info(
+            "输入为：" + colorama.Fore.BLUE + f"{inputs}" + colorama.Style.RESET_ALL
+        )
+        if should_check_token_count:
+            # Show the question immediately with an empty answer placeholder.
+            yield chatbot + [(inputs, "")], status_text
+        if reply_language == "跟随问题语言（不稳定）":
+            reply_language = "the same language as the question, such as English, 中文, 日本語, Español, Français, or Deutsch."
+        # From here on ``inputs`` is the prompt sent to the model, while
+        # ``fake_inputs`` keeps the text the user actually typed.
+        limited_context, fake_inputs, display_append, inputs, chatbot = self.prepare_inputs(real_inputs=inputs, use_websearch=use_websearch, files=files, reply_language=reply_language, chatbot=chatbot)
+        yield chatbot + [(fake_inputs, "")], status_text
+        if (
+            self.need_api_key and
+            self.api_key is None
+            and not shared.state.multi_api_key
+        ):
+            # An API key is required but none is configured: report and stop.
+            status_text = STANDARD_ERROR_MSG + NO_APIKEY_MSG
+            logging.info(status_text)
+            chatbot.append((inputs, ""))
+            if len(self.history) == 0:
+                self.history.append(construct_user(inputs))
+                self.history.append("")
+                self.all_token_counts.append(0)
+            else:
+                self.history[-2] = construct_user(inputs)
+            yield chatbot + [(inputs, "")], status_text
+            return
+        elif len(inputs.strip()) == 0:
+            # Nothing but whitespace was submitted.
+            status_text = STANDARD_ERROR_MSG + NO_INPUT_MSG
+            logging.info(status_text)
+            yield chatbot + [(inputs, "")], status_text
+            return
+        if self.single_turn:
+            # Single-turn mode: every request starts from an empty context.
+            self.history = []
+            self.all_token_counts = []
+        self.history.append(construct_user(inputs))
+        try:
+            if stream:
+                logging.debug("使用流式传输")
+                iter = self.stream_next_chatbot(
+                    inputs,
+                    chatbot,
+                    fake_input=fake_inputs,
+                    display_append=display_append,
+                )
+                for chatbot, status_text in iter:
+                    yield chatbot, status_text
+            else:
+                logging.debug("不使用流式传输")
+                chatbot, status_text = self.next_chatbot_at_once(
+                    inputs,
+                    chatbot,
+                    fake_input=fake_inputs,
+                    display_append=display_append,
+                )
+                yield chatbot, status_text
+        except Exception as e:
+            # Surface the failure in the status line rather than crashing the UI.
+            traceback.print_exc()
+            status_text = STANDARD_ERROR_MSG + str(e)
+            yield chatbot, status_text
+        # Log the answer only when the last history entry is not the prompt itself.
+        if len(self.history) > 1 and self.history[-1]["content"] != inputs:
+            logging.info(
+                "回答为："
+                + colorama.Fore.BLUE
+                + f"{self.history[-1]['content']}"
+                + colorama.Style.RESET_ALL
+            )
+        if limited_context:
+            # Retrieval-augmented turns do not carry over any conversation context.
+            # self.history = self.history[-4:]
+            # self.all_token_counts = self.all_token_counts[-2:]
+            self.history = []
+            self.all_token_counts = []
+        max_token = self.token_upper_limit - TOKEN_OFFSET
+        if sum(self.all_token_counts) > max_token and should_check_token_count:
+            count = 0
+            # Drop the oldest rounds (two history entries and one token count each)
+            # until the total is within the reduced budget.
+            while (
+                sum(self.all_token_counts)
+                > self.token_upper_limit * REDUCE_TOKEN_FACTOR
+                and sum(self.all_token_counts) > 0
+            ):
+                count += 1
+                del self.all_token_counts[0]
+                del self.history[:2]
+            # NOTE(review): this logs the previous status_text, not the message
+            # built on the next line - confirm whether the order is intended.
+            logging.info(status_text)
+            status_text = f"为了防止token超限，模型忘记了早期的 {count} 轮对话"
+            yield chatbot, status_text
+    def retry(
+        self,
+        chatbot,
+        stream=False,
+        use_websearch=False,
+        files=None,
+        reply_language="中文",
+    ):
+        """Discard the last question/answer pair and ask the same question again.
+
+        This is a generator that re-yields every ``(chatbot, status_text)``
+        update produced by ``predict``. When fewer than two history entries
+        exist there is nothing to retry, and a single error status is yielded.
+        """
+        logging.debug("重试中……")
+        if len(self.history) < 2:
+            yield chatbot, f"{STANDARD_ERROR_MSG}上下文是空的"
+            return
+        inputs = self.history[-2]["content"]
+        del self.history[-2:]
+        # The token counts can be empty even when history is not (for example
+        # after a history file was loaded), so only pop when there is an entry.
+        if self.all_token_counts:
+            self.all_token_counts.pop()
+        yield from self.predict(
+            inputs,
+            chatbot,
+            stream=stream,
+            use_websearch=use_websearch,
+            files=files,
+            reply_language=reply_language,
+        )
+        logging.debug("重试完毕")
+    # def reduce_token_size(self, chatbot):
+    #     logging.info("开始减少token数量……")
+    #     chatbot, status_text = self.next_chatbot_at_once(
+    #         summarize_prompt,
+    #         chatbot
+    #     )
+    #     max_token_count = self.token_upper_limit * REDUCE_TOKEN_FACTOR
+    #     num_chat = find_n(self.all_token_counts, max_token_count)
+    #     logging.info(f"previous_token_count: {self.all_token_counts}, keeping {num_chat} chats")
+    #     chatbot = chatbot[:-1]
+    #     self.history = self.history[-2*num_chat:] if num_chat > 0 else []
+    #     self.all_token_counts = self.all_token_counts[-num_chat:] if num_chat > 0 else []
+    #     msg = f"保留了最近{num_chat}轮对话"
+    #     logging.info(msg)
+    #     logging.info("减少token数量完毕")
+    #     return chatbot, msg + "，" + self.token_message(self.all_token_counts if len(self.all_token_counts) > 0 else [0])
+    def interrupt(self):
+        """Set the ``interrupted`` flag on this model."""
+        self.interrupted = True
+    def recover(self):
+        """Clear the ``interrupted`` flag on this model."""
+        self.interrupted = False
+    def set_token_upper_limit(self, new_upper_limit):
+        """Store a new token upper limit and print the new value."""
+        self.token_upper_limit = new_upper_limit
+        print(f"token上限设置为{new_upper_limit}")
+    def set_temperature(self, new_temperature):
+        """Store ``new_temperature`` as the sampling temperature."""
+        self.temperature = new_temperature
+    def set_top_p(self, new_top_p):
+        """Store ``new_top_p`` as the ``top_p`` setting."""
+        self.top_p = new_top_p
+    def set_n_choices(self, new_n_choices):
+        """Store ``new_n_choices`` as the ``n_choices`` setting."""
+        self.n_choices = new_n_choices
+    def set_stop_sequence(self, new_stop_sequence: str):
+        """Split a comma-separated string and store the pieces as the stop sequences."""
+        self.stop_sequence = new_stop_sequence.split(",")
+    def set_max_tokens(self, new_max_tokens):
+        """Store ``new_max_tokens`` as ``max_generation_token``."""
+        self.max_generation_token = new_max_tokens
+    def set_presence_penalty(self, new_presence_penalty):
+        """Store ``new_presence_penalty`` as the presence penalty."""
+        self.presence_penalty = new_presence_penalty
+    def set_frequency_penalty(self, new_frequency_penalty):
+        """Store ``new_frequency_penalty`` as the frequency penalty."""
+        self.frequency_penalty = new_frequency_penalty
+    def set_logit_bias(self, logit_bias):
+        """Parse whitespace-separated ``word:bias`` entries into a token-to-bias map.
+
+        Each word is encoded with the ``cl100k_base`` encoding and every
+        resulting token is mapped to the float bias. Entries whose word part
+        is empty are ignored. The map is stored on ``self.logit_bias``.
+        """
+        encoding = tiktoken.get_encoding("cl100k_base")
+        token_bias = {}
+        for entry in logit_bias.split():
+            word, bias_amount = entry.split(":")
+            if not word:
+                continue
+            token_bias.update(
+                {token: float(bias_amount) for token in encoding.encode(word)}
+            )
+        self.logit_bias = token_bias
+    def set_user_identifier(self, new_user_identifier):
+        """Store ``new_user_identifier`` as the user identifier."""
+        self.user_identifier = new_user_identifier
+    def set_system_prompt(self, new_system_prompt):
+        """Store ``new_system_prompt`` as the system prompt."""
+        self.system_prompt = new_system_prompt
+    def set_key(self, new_access_key):
+        """Store the stripped API key and log a masked confirmation.
+
+        Returns:
+            ``(new_access_key, msg)``: the key exactly as passed in, and the
+            confirmation message that was logged.
+        """
+        stripped_key = new_access_key.strip()
+        self.api_key = stripped_key
+        msg = f"API密钥更改为了{hide_middle_chars(stripped_key)}"
+        logging.info(msg)
+        return new_access_key, msg
+    def set_single_turn(self, new_single_turn):
+        """Store ``new_single_turn`` as the single-turn flag."""
+        self.single_turn = new_single_turn
+    def reset(self):
+        """Clear the history, token counts and interrupt flag.
+
+        Returns:
+            ``([], status)`` where ``status`` is the token message for a
+            single zero count.
+        """
+        self.history, self.all_token_counts = [], []
+        self.interrupted = False
+        status = self.token_message([0])
+        return [], status
+    def delete_first_conversation(self):
+        """Remove the oldest question/answer pair and its token count.
+
+        Returns:
+            The token status message computed after the removal.
+        """
+        if self.history:
+            del self.history[:2]
+            # History can be populated while the token counts are still empty
+            # (for example after a history file was loaded); do not crash then.
+            if self.all_token_counts:
+                del self.all_token_counts[0]
+        return self.token_message()
+    def delete_last_conversation(self, chatbot):
+        """Remove the most recent round from the chatbot, history and token counts.
+
+        When the last chatbot entry contains the standard error marker, only
+        that chatbot entry is removed, leaving history and token counts alone.
+
+        Returns:
+            ``(chatbot, msg)`` where ``msg`` describes what was deleted.
+        """
+        if len(chatbot) > 0 and STANDARD_ERROR_MSG in chatbot[-1][1]:
+            msg = "由于包含报错信息，只删除chatbot记录"
+            chatbot.pop()
+            return chatbot, msg
+        # Slice deletion drops up to two entries and is safe on short lists.
+        del self.history[-2:]
+        if len(chatbot) > 0:
+            chatbot.pop()
+        if len(self.all_token_counts) > 0:
+            self.all_token_counts.pop()
+        msg = "删除了一组对话"
+        return chatbot, msg
+    def token_message(self, token_lst=None):
+        """Format the current token count and the cumulative consumption.
+
+        Args:
+            token_lst: per-round token counts; defaults to
+                ``self.all_token_counts`` when None.
+
+        Returns:
+            A status string holding the sum of ``token_lst`` and the sum of
+            all of its prefix sums.
+        """
+        if token_lst is None:
+            token_lst = self.all_token_counts
+        # One pass: ``running`` is the prefix sum, ``consumed`` adds up every prefix.
+        running = 0
+        consumed = 0
+        for round_tokens in token_lst:
+            running += round_tokens
+            consumed += running
+        return f"Token 计数: {running}，本次对话累计消耗了 {consumed} tokens"
+    def save_chat_history(self, filename, chatbot, user_name):
+        """Save the conversation via ``save_file`` under a ``.json`` file name.
+
+        Returns None without saving when ``filename`` is an empty string;
+        otherwise returns whatever ``save_file`` returns.
+        """
+        if filename == "":
+            return None
+        target = filename if filename.endswith(".json") else filename + ".json"
+        return save_file(target, self.system_prompt, self.history, chatbot, user_name)
+    def export_markdown(self, filename, chatbot, user_name):
+        """Save the conversation via ``save_file`` under a ``.md`` file name.
+
+        Returns None without saving when ``filename`` is an empty string;
+        otherwise returns whatever ``save_file`` returns.
+        """
+        if filename == "":
+            return None
+        target = filename if filename.endswith(".md") else filename + ".md"
+        return save_file(target, self.system_prompt, self.history, chatbot, user_name)
+    def load_chat_history(self, filename, chatbot, user_name):
+        """Load a saved conversation from ``HISTORY_DIR/<user_name>/<filename>``.
+
+        Old-format files, whose history is a flat list of strings, are
+        converted to alternating user/assistant messages. On success
+        ``self.history`` is replaced with the loaded history.
+
+        Args:
+            filename: a file name string, or an object whose ``.name``
+                attribute holds it.
+            chatbot: the current chatbot contents, returned unchanged when
+                the file does not exist.
+            user_name: sub-directory of ``HISTORY_DIR`` to read from.
+
+        Returns:
+            ``(filename, system_prompt, chatbot)`` taken from the file, or the
+            current values when the file is missing.
+        """
+        logging.debug(f"{user_name} 加载对话历史中……")
+        if not isinstance(filename, str):
+            filename = filename.name
+        try:
+            with open(os.path.join(HISTORY_DIR, user_name, filename), "r") as f:
+                json_s = json.load(f)
+            try:
+                if isinstance(json_s["history"][0], str):
+                    logging.info("历史记录格式为旧版，正在转换……")
+                    new_history = [
+                        construct_user(item) if index % 2 == 0 else construct_assistant(item)
+                        for index, item in enumerate(json_s["history"])
+                    ]
+                    json_s["history"] = new_history
+                    logging.info(new_history)
+            except Exception:
+                # There is no conversation history to convert. Catching Exception
+                # rather than everything lets KeyboardInterrupt/SystemExit through.
+                pass
+            logging.debug(f"{user_name} 加载对话历史完毕")
+            self.history = json_s["history"]
+            return filename, json_s["system"], json_s["chatbot"]
+        except FileNotFoundError:
+            logging.warning(f"{user_name} 没有找到对话历史文件，不执行任何操作")
+            return filename, self.system_prompt, chatbot

modules/config.py CHANGED Viewed

@@ -3,9 +3,10 @@ from contextlib import contextmanager
 import os
 import logging
 import sys
-import json
 from . import shared
 __all__ = [
@@ -18,6 +19,9 @@ __all__ = [
     "advance_docs",
     "update_doc_config",
     "multi_api_key",
 ]
 # 添加一个统一的config文件，避免文件过多造成的疑惑（优先级最低）
@@ -28,6 +32,30 @@ if os.path.exists("config.json"):
 else:
     config = {}
 ## 处理docker if we are running in Docker
 dockerflag = config.get("dockerflag", False)
 if os.environ.get("dockerrun") == "yes":
@@ -54,35 +82,6 @@ api_host = os.environ.get("api_host", config.get("api_host", ""))
 if api_host:
     shared.state.set_api_host(api_host)
-if dockerflag:
-    if my_api_key == "empty":
-        logging.error("Please give a api key!")
-        sys.exit(1)
-    # auth
-    username = os.environ.get("USERNAME")
-    password = os.environ.get("PASSWORD")
-    if not (isinstance(username, type(None)) or isinstance(password, type(None))):
-        auth_list.append((os.environ.get("USERNAME"), os.environ.get("PASSWORD")))
-        authflag = True
-else:
-    if (
-        not my_api_key
-        and os.path.exists("api_key.txt")
-        and os.path.getsize("api_key.txt")
-    ):
-        with open("api_key.txt", "r") as f:
-            my_api_key = f.read().strip()
-    if os.path.exists("auth.json"):
-        authflag = True
-        with open("auth.json", "r", encoding='utf-8') as f:
-            auth = json.load(f)
-            for _ in auth:
-                if auth[_]["username"] and auth[_]["password"]:
-                    auth_list.append((auth[_]["username"], auth[_]["password"]))
-                else:
-                    logging.error("请检查auth.json文件中的用户名和密码！")
-                    sys.exit(1)
 @contextmanager
 def retrieve_openai_api(api_key = None):
     old_api_key = os.environ.get("OPENAI_API_KEY", "")
@@ -111,6 +110,8 @@ https_proxy = os.environ.get("HTTPS_PROXY", https_proxy)
 os.environ["HTTP_PROXY"] = ""
 os.environ["HTTPS_PROXY"] = ""
 @contextmanager
 def retrieve_proxy(proxy=None):
     """
@@ -137,9 +138,29 @@ advance_docs = defaultdict(lambda: defaultdict(dict))
 advance_docs.update(config.get("advance_docs", {}))
 def update_doc_config(two_column_pdf):
     global advance_docs
-    if two_column_pdf:
-        advance_docs["pdf"]["two_column"] = True
     else:
-        advance_docs["pdf"]["two_column"] = False
-    logging.info(f"更新后的文件参数为：{advance_docs}")

 import os
 import logging
 import sys
+import commentjson as json
 from . import shared
+from . import presets
 __all__ = [
     "advance_docs",
     "update_doc_config",
     "multi_api_key",
+    "server_name",
+    "server_port",
+    "share",
 ]
 # 添加一个统一的config文件，避免文件过多造成的疑惑（优先级最低）
 else:
     config = {}
+# Migrate the legacy api_key.txt into config.json: copy the key into the
+# in-memory config, rename the old file, then rewrite config.json.
+if os.path.exists("api_key.txt"):
+    logging.info("检测到api_key.txt文件，正在进行迁移...")
+    with open("api_key.txt", "r") as f:
+        config["openai_api_key"] = f.read().strip()
+    os.rename("api_key.txt", "api_key(deprecated).txt")
+    with open("config.json", "w", encoding='utf-8') as f:
+        json.dump(config, f, indent=4)
+# Migrate the legacy auth.json the same way: collect (username, password)
+# pairs into config["users"], rename the old file, then rewrite config.json.
+if os.path.exists("auth.json"):
+    logging.info("检测到auth.json文件，正在进行迁移...")
+    auth_list = []
+    with open("auth.json", "r", encoding='utf-8') as f:
+            auth = json.load(f)
+            for _ in auth:
+                if auth[_]["username"] and auth[_]["password"]:
+                    auth_list.append((auth[_]["username"], auth[_]["password"]))
+                else:
+                    # An entry with an empty username or password aborts start-up.
+                    logging.error("请检查auth.json文件中的用户名和密码！")
+                    sys.exit(1)
+    config["users"] = auth_list
+    os.rename("auth.json", "auth(deprecated).json")
+    with open("config.json", "w", encoding='utf-8') as f:
+        json.dump(config, f, indent=4)
 ## 处理docker if we are running in Docker
 dockerflag = config.get("dockerflag", False)
 if os.environ.get("dockerrun") == "yes":
 if api_host:
     shared.state.set_api_host(api_host)
 @contextmanager
 def retrieve_openai_api(api_key = None):
     old_api_key = os.environ.get("OPENAI_API_KEY", "")
 os.environ["HTTP_PROXY"] = ""
 os.environ["HTTPS_PROXY"] = ""
+local_embedding = config.get("local_embedding", False) # 是否使用本地embedding
 @contextmanager
 def retrieve_proxy(proxy=None):
     """
 advance_docs.update(config.get("advance_docs", {}))
 def update_doc_config(two_column_pdf):
     global advance_docs
+    advance_docs["pdf"]["two_column"] = two_column_pdf
+    logging.info(f"更新后的文件参数为：{advance_docs}")
+## Handle the gradio.launch parameters
+server_name = config.get("server_name", None)
+server_port = config.get("server_port", None)
+# Without an explicit server_name, listen on all interfaces inside Docker
+# and on localhost otherwise.
+if server_name is None:
+    if dockerflag:
+        server_name = "0.0.0.0"
     else:
+        server_name = "127.0.0.1"
+# Without an explicit server_port, Docker runs use 7860; other runs keep None.
+if server_port is None:
+    if dockerflag:
+        server_port = 7860
+assert server_port is None or type(server_port) == int, "要求port设置为int类型"
+# Set the default model
+default_model = config.get("default_model", "")
+try:
+    presets.DEFAULT_MODEL = presets.MODELS.index(default_model)
+except ValueError:
+    # The configured name is not in presets.MODELS; keep the preset default.
+    pass
+share = config.get("share", False)

modules/llama_func.py CHANGED Viewed

@@ -15,6 +15,8 @@ from tqdm import tqdm
 from modules.presets import *
 from modules.utils import *
 def get_index_name(file_src):
     file_paths = [x.name for x in file_src]
@@ -28,6 +30,7 @@ def get_index_name(file_src):
     return md5_hash.hexdigest()
 def block_split(text):
     blocks = []
     while len(text) > 0:
@@ -35,6 +38,7 @@ def block_split(text):
         text = text[1000:]
     return blocks
 def get_documents(file_src):
     documents = []
     logging.debug("Loading documents...")
@@ -44,37 +48,45 @@ def get_documents(file_src):
         filename = os.path.basename(filepath)
         file_type = os.path.splitext(filepath)[1]
         logging.info(f"loading file: {filename}")
-        if file_type == ".pdf":
-            logging.debug("Loading PDF...")
-            try:
-                from modules.pdf_func import parse_pdf
-                from modules.config import advance_docs
-                two_column = advance_docs["pdf"].get("two_column", False)
-                pdftext = parse_pdf(filepath, two_column).text
-            except:
-                pdftext = ""
-                with open(filepath, 'rb') as pdfFileObj:
-                    pdfReader = PyPDF2.PdfReader(pdfFileObj)
-                    for page in tqdm(pdfReader.pages):
-                        pdftext += page.extract_text()
-            text_raw = pdftext
-        elif file_type == ".docx":
-            logging.debug("Loading Word...")
-            DocxReader = download_loader("DocxReader")
-            loader = DocxReader()
-            text_raw = loader.load_data(file=filepath)[0].text
-        elif file_type == ".epub":
-            logging.debug("Loading EPUB...")
-            EpubReader = download_loader("EpubReader")
-            loader = EpubReader()
-            text_raw = loader.load_data(file=filepath)[0].text
-        elif file_type == ".xlsx":
-            logging.debug("Loading Excel...")
-            text_raw = excel_to_string(filepath)
-        else:
-            logging.debug("Loading text file...")
-            with open(filepath, "r", encoding="utf-8") as f:
-                text_raw = f.read()
         text = add_space(text_raw)
         # text = block_split(text)
         # documents += text
@@ -84,27 +96,36 @@ def get_documents(file_src):
 def construct_index(
-        api_key,
-        file_src,
-        max_input_size=4096,
-        num_outputs=5,
-        max_chunk_overlap=20,
-        chunk_size_limit=600,
-        embedding_limit=None,
-        separator=" "
 ):
     from langchain.chat_models import ChatOpenAI
-    from llama_index import GPTSimpleVectorIndex, ServiceContext
-    os.environ["OPENAI_API_KEY"] = api_key
     chunk_size_limit = None if chunk_size_limit == 0 else chunk_size_limit
     embedding_limit = None if embedding_limit == 0 else embedding_limit
     separator = " " if separator == "" else separator
-    llm_predictor = LLMPredictor(
-        llm=ChatOpenAI(model_name="gpt-3.5-turbo-0301", openai_api_key=api_key)
     )
-    prompt_helper = PromptHelper(max_input_size = max_input_size, num_output = num_outputs, max_chunk_overlap = max_chunk_overlap, embedding_limit=embedding_limit, chunk_size_limit=600, separator=separator)
     index_name = get_index_name(file_src)
     if os.path.exists(f"./index/{index_name}.json"):
         logging.info("找到了缓存的索引文件，加载中……")
@@ -112,11 +133,19 @@ def construct_index(
     else:
         try:
             documents = get_documents(file_src)
             logging.info("构建索引中……")
             with retrieve_proxy():
-                service_context = ServiceContext.from_defaults(llm_predictor=llm_predictor, prompt_helper=prompt_helper, chunk_size_limit=chunk_size_limit)
                 index = GPTSimpleVectorIndex.from_documents(
-                    documents,  service_context=service_context
                 )
             logging.debug("索引构建完成！")
             os.makedirs("./index", exist_ok=True)

 from modules.presets import *
 from modules.utils import *
+from modules.config import local_embedding
 def get_index_name(file_src):
     file_paths = [x.name for x in file_src]
     return md5_hash.hexdigest()
 def block_split(text):
     blocks = []
     while len(text) > 0:
         text = text[1000:]
     return blocks
 def get_documents(file_src):
     documents = []
     logging.debug("Loading documents...")
         filename = os.path.basename(filepath)
         file_type = os.path.splitext(filepath)[1]
         logging.info(f"loading file: {filename}")
+        try:
+            if file_type == ".pdf":
+                logging.debug("Loading PDF...")
+                try:
+                    from modules.pdf_func import parse_pdf
+                    from modules.config import advance_docs
+                    two_column = advance_docs["pdf"].get("two_column", False)
+                    pdftext = parse_pdf(filepath, two_column).text
+                except:
+                    pdftext = ""
+                    with open(filepath, "rb") as pdfFileObj:
+                        pdfReader = PyPDF2.PdfReader(pdfFileObj)
+                        for page in tqdm(pdfReader.pages):
+                            pdftext += page.extract_text()
+                text_raw = pdftext
+            elif file_type == ".docx":
+                logging.debug("Loading Word...")
+                DocxReader = download_loader("DocxReader")
+                loader = DocxReader()
+                text_raw = loader.load_data(file=filepath)[0].text
+            elif file_type == ".epub":
+                logging.debug("Loading EPUB...")
+                EpubReader = download_loader("EpubReader")
+                loader = EpubReader()
+                text_raw = loader.load_data(file=filepath)[0].text
+            elif file_type == ".xlsx":
+                logging.debug("Loading Excel...")
+                text_list = excel_to_string(filepath)
+                for elem in text_list:
+                    documents.append(Document(elem))
+                continue
+            else:
+                logging.debug("Loading text file...")
+                with open(filepath, "r", encoding="utf-8") as f:
+                    text_raw = f.read()
+        except Exception as e:
+            logging.error(f"Error loading file: {filename}")
+            pass
         text = add_space(text_raw)
         # text = block_split(text)
         # documents += text
 def construct_index(
+    api_key,
+    file_src,
+    max_input_size=4096,
+    num_outputs=5,
+    max_chunk_overlap=20,
+    chunk_size_limit=600,
+    embedding_limit=None,
+    separator=" ",
 ):
     from langchain.chat_models import ChatOpenAI
+    from langchain.embeddings.huggingface import HuggingFaceEmbeddings
+    from llama_index import GPTSimpleVectorIndex, ServiceContext, LangchainEmbedding, OpenAIEmbedding
+    if api_key:
+        os.environ["OPENAI_API_KEY"] = api_key
+    else:
+        # 由于一个依赖的愚蠢的设计，这里必须要有一个API KEY
+        os.environ["OPENAI_API_KEY"] = "sk-xxxxxxx"
     chunk_size_limit = None if chunk_size_limit == 0 else chunk_size_limit
     embedding_limit = None if embedding_limit == 0 else embedding_limit
     separator = " " if separator == "" else separator
+    prompt_helper = PromptHelper(
+        max_input_size=max_input_size,
+        num_output=num_outputs,
+        max_chunk_overlap=max_chunk_overlap,
+        embedding_limit=embedding_limit,
+        chunk_size_limit=600,
+        separator=separator,
     )
     index_name = get_index_name(file_src)
     if os.path.exists(f"./index/{index_name}.json"):
         logging.info("找到了缓存的索引文件，加载中……")
     else:
         try:
             documents = get_documents(file_src)
+            if local_embedding:
+                embed_model = LangchainEmbedding(HuggingFaceEmbeddings())
+            else:
+                embed_model = OpenAIEmbedding()
             logging.info("构建索引中……")
             with retrieve_proxy():
+                service_context = ServiceContext.from_defaults(
+                    prompt_helper=prompt_helper,
+                    chunk_size_limit=chunk_size_limit,
+                    embed_model=embed_model,
+                )
                 index = GPTSimpleVectorIndex.from_documents(
+                    documents, service_context=service_context
                 )
             logging.debug("索引构建完成！")
             os.makedirs("./index", exist_ok=True)

modules/models.py ADDED Viewed

	@@ -0,0 +1,586 @@

+from __future__ import annotations
+from typing import TYPE_CHECKING, List
+import logging
+import json
+import commentjson as cjson
+import os
+import sys
+import requests
+import urllib3
+import platform
+from tqdm import tqdm
+import colorama
+from duckduckgo_search import ddg
+import asyncio
+import aiohttp
+from enum import Enum
+import uuid
+from .presets import *
+from .llama_func import *
+from .utils import *
+from . import shared
+from .config import retrieve_proxy
+from modules import config
+from .base_model import BaseLLMModel, ModelType
+class OpenAIClient(BaseLLMModel):
+    def __init__(
+        self,
+        model_name,
+        api_key,
+        system_prompt=INITIAL_SYSTEM_PROMPT,
+        temperature=1.0,
+        top_p=1.0,
+    ) -> None:
+        """Initialise the base model, then record the API key and build the headers."""
+        base_settings = dict(
+            model_name=model_name,
+            temperature=temperature,
+            top_p=top_p,
+            system_prompt=system_prompt,
+        )
+        super().__init__(**base_settings)
+        self.api_key = api_key
+        self.need_api_key = True
+        self._refresh_header()
+    def get_answer_stream_iter(self):
+        """Yield the progressively accumulated answer text of a streaming request.
+
+        When ``_get_response`` returns None, a single standard error message
+        is yielded instead.
+        """
+        response = self._get_response(stream=True)
+        if response is None:
+            yield STANDARD_ERROR_MSG + GENERAL_ERROR_MSG
+            return
+        accumulated = ""
+        for piece in self._decode_chat_response(response):
+            accumulated += piece
+            yield accumulated
+    def get_answer_at_once(self):
+        """Request a complete (non-streaming) answer.
+
+        Returns:
+            ``(content, total_token_count)`` read from the first choice and
+            the usage section of the JSON response.
+
+        Raises:
+            RuntimeError: if ``_get_response`` returned None, meaning the
+                request itself failed.
+        """
+        response = self._get_response()
+        if response is None:
+            # Fail with a readable message instead of an AttributeError on ``.text``.
+            raise RuntimeError(GENERAL_ERROR_MSG)
+        response = json.loads(response.text)
+        content = response["choices"][0]["message"]["content"]
+        total_token_count = response["usage"]["total_tokens"]
+        return content, total_token_count
+    def count_token(self, user_input):
+        """Count the tokens of ``user_input`` wrapped as a user message.
+
+        The system prompt's tokens are added when a system prompt is set and
+        no token counts have been recorded yet.
+        """
+        total = count_token(construct_user(user_input))
+        if self.system_prompt is None or len(self.all_token_counts) != 0:
+            return total
+        return total + count_token(construct_system(self.system_prompt))
+    def billing_info(self):
+        """Return a Markdown string with this month's API spend, or an error message."""
+        try:
+            now = datetime.datetime.now()
+            month_end = get_last_day_of_month(now).strftime("%Y-%m-%d")
+            month_start = now.replace(day=1).strftime("%Y-%m-%d")
+            usage_url = (
+                f"{shared.state.usage_api_url}"
+                f"?start_date={month_start}&end_date={month_end}"
+            )
+            try:
+                usage_data = self._get_billing_data(usage_url)
+            except Exception as e:
+                logging.error("获取API使用情况失败:" + str(e))
+                return "**获取API使用情况失败**"
+            # ``total_usage`` is divided by 100 before being shown as dollars.
+            spent = f"{usage_data['total_usage'] / 100:.5f}"
+            return f"**本月使用金额** \u3000 ${spent}"
+        except requests.exceptions.ConnectTimeout:
+            return STANDARD_ERROR_MSG + CONNECTION_TIMEOUT_MSG + ERROR_RETRIEVE_MSG
+        except requests.exceptions.ReadTimeout:
+            return STANDARD_ERROR_MSG + READ_TIMEOUT_MSG + ERROR_RETRIEVE_MSG
+        except Exception as e:
+            logging.error("获取API使用情况失败:" + str(e))
+            return STANDARD_ERROR_MSG + ERROR_RETRIEVE_MSG
+    def set_token_upper_limit(self, new_upper_limit):
+        """Ignore the request; this client does not change its token upper limit here."""
+        return None
+    def set_key(self, new_access_key):
+        """Store the stripped API key, rebuild the headers and log a masked confirmation.
+
+        Returns:
+            The confirmation message that was logged.
+        """
+        self.api_key = new_access_key.strip()
+        self._refresh_header()
+        masked_key = hide_middle_chars(self.api_key)
+        msg = f"API密钥更改为了{masked_key}"
+        logging.info(msg)
+        return msg
+    @shared.state.switching_api_key  # this decorator has no effect unless multi-account mode is enabled
+    def _get_response(self, stream=False):
+        """POST the conversation to the chat-completion endpoint.
+
+        The payload is built from the current history (prefixed with the
+        system prompt when one is set) and the sampling settings. Optional
+        settings are only included when they are not None.
+
+        Args:
+            stream: whether to request a streaming response; this also
+                selects which timeout constant is used.
+
+        Returns:
+            The ``requests`` response object, or None when sending the
+            request raised an exception (the error is logged).
+        """
+        openai_api_key = self.api_key
+        system_prompt = self.system_prompt
+        history = self.history
+        logging.debug(colorama.Fore.YELLOW +
+                      f"{history}" + colorama.Fore.RESET)
+        headers = {
+            "Content-Type": "application/json",
+            "Authorization": f"Bearer {openai_api_key}",
+        }
+        if system_prompt is not None:
+            history = [construct_system(system_prompt), *history]
+        payload = {
+            "model": self.model_name,
+            "messages": history,
+            "temperature": self.temperature,
+            "top_p": self.top_p,
+            "n": self.n_choices,
+            "stream": stream,
+            "presence_penalty": self.presence_penalty,
+            "frequency_penalty": self.frequency_penalty,
+        }
+        if self.max_generation_token is not None:
+            payload["max_tokens"] = self.max_generation_token
+        if self.stop_sequence is not None:
+            payload["stop"] = self.stop_sequence
+        if self.logit_bias is not None:
+            payload["logit_bias"] = self.logit_bias
+        if self.user_identifier is not None:
+            payload["user"] = self.user_identifier
+        timeout = TIMEOUT_STREAMING if stream else TIMEOUT_ALL
+        # Requests always go to shared.state.completion_url; log it when it
+        # differs from the default endpoint (a custom api-host is configured).
+        if shared.state.completion_url != COMPLETION_URL:
+            logging.info(f"使用自定义API URL: {shared.state.completion_url}")
+        with retrieve_proxy():
+            try:
+                response = requests.post(
+                    shared.state.completion_url,
+                    headers=headers,
+                    json=payload,
+                    stream=stream,
+                    timeout=timeout,
+                )
+            except Exception as e:
+                # Callers treat None as "request failed"; keep that contract but
+                # record the cause, and let KeyboardInterrupt/SystemExit through.
+                logging.error("请求API失败:" + str(e))
+                return None
+        return response
+    def _refresh_header(self):
+        self.headers = {
+            "Content-Type": "application/json",
+            "Authorization": f"Bearer {self.api_key}",
+        }
+    def _get_billing_data(self, billing_url):
+        with retrieve_proxy():
+            response = requests.get(
+                billing_url,
+                headers=self.headers,
+                timeout=TIMEOUT_ALL,
+            )
+        if response.status_code == 200:
+            data = response.json()
+            return data
+        else:
+            raise Exception(
+                f"API request failed with status code {response.status_code}: {response.text}"
+            )
+    def _decode_chat_response(self, response):
+        error_msg = ""
+        for chunk in response.iter_lines():
+            if chunk:
+                chunk = chunk.decode()
+                chunk_length = len(chunk)
+                try:
+                    chunk = json.loads(chunk[6:])
+                except json.JSONDecodeError:
+                    print(f"JSON解析错误,收到的内容: {chunk}")
+                    error_msg += chunk
+                    continue
+                if chunk_length > 6 and "delta" in chunk["choices"][0]:
+                    if chunk["choices"][0]["finish_reason"] == "stop":
+                        break
+                    try:
+                        yield chunk["choices"][0]["delta"]["content"]
+                    except Exception as e:
+                        # logging.error(f"Error: {e}")
+                        continue
+        if error_msg:
+            raise Exception(error_msg)
+class ChatGLM_Client(BaseLLMModel):
+    def __init__(self, model_name) -> None:
+        super().__init__(model_name=model_name)
+        from transformers import AutoTokenizer, AutoModel
+        import torch
+        global CHATGLM_TOKENIZER, CHATGLM_MODEL
+        if CHATGLM_TOKENIZER is None or CHATGLM_MODEL is None:
+            system_name = platform.system()
+            model_path = None
+            if os.path.exists("models"):
+                model_dirs = os.listdir("models")
+                if model_name in model_dirs:
+                    model_path = f"models/{model_name}"
+            if model_path is not None:
+                model_source = model_path
+            else:
+                model_source = f"THUDM/{model_name}"
+            CHATGLM_TOKENIZER = AutoTokenizer.from_pretrained(
+                model_source, trust_remote_code=True
+            )
+            quantified = False
+            if "int4" in model_name:
+                quantified = True
+            if quantified:
+                model = AutoModel.from_pretrained(
+                    model_source, trust_remote_code=True
+                ).half()
+            else:
+                model = AutoModel.from_pretrained(
+                    model_source, trust_remote_code=True
+                ).half()
+            if torch.cuda.is_available():
+                # run on CUDA
+                logging.info("CUDA is available, using CUDA")
+                model = model.cuda()
+            # mps加速还存在一些问题，暂时不使用
+            elif system_name == "Darwin" and model_path is not None and not quantified:
+                logging.info("Running on macOS, using MPS")
+                # running on macOS and model already downloaded
+                model = model.to("mps")
+            else:
+                logging.info("GPU is not available, using CPU")
+            model = model.eval()
+            CHATGLM_MODEL = model
+    def _get_glm_style_input(self):
+        history = [x["content"] for x in self.history]
+        query = history.pop()
+        logging.debug(colorama.Fore.YELLOW +
+                      f"{history}" + colorama.Fore.RESET)
+        assert (
+            len(history) % 2 == 0
+        ), f"History should be even length. current history is: {history}"
+        history = [[history[i], history[i + 1]]
+                   for i in range(0, len(history), 2)]
+        return history, query
+    def get_answer_at_once(self):
+        history, query = self._get_glm_style_input()
+        response, _ = CHATGLM_MODEL.chat(
+            CHATGLM_TOKENIZER, query, history=history)
+        return response, len(response)
+    def get_answer_stream_iter(self):
+        history, query = self._get_glm_style_input()
+        for response, history in CHATGLM_MODEL.stream_chat(
+            CHATGLM_TOKENIZER,
+            query,
+            history,
+            max_length=self.token_upper_limit,
+            top_p=self.top_p,
+            temperature=self.temperature,
+        ):
+            yield response
+class LLaMA_Client(BaseLLMModel):
+    def __init__(
+        self,
+        model_name,
+        lora_path=None,
+    ) -> None:
+        super().__init__(model_name=model_name)
+        from lmflow.datasets.dataset import Dataset
+        from lmflow.pipeline.auto_pipeline import AutoPipeline
+        from lmflow.models.auto_model import AutoModel
+        from lmflow.args import ModelArguments, DatasetArguments, InferencerArguments
+        self.max_generation_token = 1000
+        self.end_string = "\n\n"
+        # We don't need input data
+        data_args = DatasetArguments(dataset_path=None)
+        self.dataset = Dataset(data_args)
+        self.system_prompt = ""
+        global LLAMA_MODEL, LLAMA_INFERENCER
+        if LLAMA_MODEL is None or LLAMA_INFERENCER is None:
+            model_path = None
+            if os.path.exists("models"):
+                model_dirs = os.listdir("models")
+                if model_name in model_dirs:
+                    model_path = f"models/{model_name}"
+            if model_path is not None:
+                model_source = model_path
+            else:
+                model_source = f"decapoda-research/{model_name}"
+                # raise Exception(f"models目录下没有这个模型: {model_name}")
+            if lora_path is not None:
+                lora_path = f"lora/{lora_path}"
+            model_args = ModelArguments(model_name_or_path=model_source, lora_model_path=lora_path, model_type=None, config_overrides=None, config_name=None, tokenizer_name=None, cache_dir=None,
+                                        use_fast_tokenizer=True, model_revision='main', use_auth_token=False, torch_dtype=None, use_lora=False, lora_r=8, lora_alpha=32, lora_dropout=0.1, use_ram_optimized_load=True)
+            pipeline_args = InferencerArguments(
+                local_rank=0, random_seed=1, deepspeed='configs/ds_config_chatbot.json', mixed_precision='bf16')
+            with open(pipeline_args.deepspeed, "r") as f:
+                ds_config = json.load(f)
+            LLAMA_MODEL = AutoModel.get_model(
+                model_args,
+                tune_strategy="none",
+                ds_config=ds_config,
+            )
+            LLAMA_INFERENCER = AutoPipeline.get_pipeline(
+                pipeline_name="inferencer",
+                model_args=model_args,
+                data_args=data_args,
+                pipeline_args=pipeline_args,
+            )
+        # Chats
+        # model_name = model_args.model_name_or_path
+        # if model_args.lora_model_path is not None:
+        #     model_name += f" + {model_args.lora_model_path}"
+        # context = (
+        #     "You are a helpful assistant who follows the given instructions"
+        #     " unconditionally."
+        # )
+    def _get_llama_style_input(self):
+        history = []
+        instruction = ""
+        if self.system_prompt:
+            instruction = (f"Instruction: {self.system_prompt}\n")
+        for x in self.history:
+            if x["role"] == "user":
+                history.append(f"{instruction}Input: {x['content']}")
+            else:
+                history.append(f"Output: {x['content']}")
+        context = "\n\n".join(history)
+        context += "\n\nOutput: "
+        return context
+    def get_answer_at_once(self):
+        context = self._get_llama_style_input()
+        input_dataset = self.dataset.from_dict(
+            {"type": "text_only", "instances": [{"text": context}]}
+        )
+        output_dataset = LLAMA_INFERENCER.inference(
+            model=LLAMA_MODEL,
+            dataset=input_dataset,
+            max_new_tokens=self.max_generation_token,
+            temperature=self.temperature,
+        )
+        response = output_dataset.to_dict()["instances"][0]["text"]
+        return response, len(response)
+    def get_answer_stream_iter(self):
+        context = self._get_llama_style_input()
+        partial_text = ""
+        step = 1
+        for _ in range(0, self.max_generation_token, step):
+            input_dataset = self.dataset.from_dict(
+                {"type": "text_only", "instances": [
+                    {"text": context + partial_text}]}
+            )
+            output_dataset = LLAMA_INFERENCER.inference(
+                model=LLAMA_MODEL,
+                dataset=input_dataset,
+                max_new_tokens=step,
+                temperature=self.temperature,
+            )
+            response = output_dataset.to_dict()["instances"][0]["text"]
+            if response == "" or response == self.end_string:
+                break
+            partial_text += response
+            yield partial_text
+class XMBot_Client(BaseLLMModel):
+    def __init__(self, api_key):
+        super().__init__(model_name="xmbot")
+        self.api_key = api_key
+        self.session_id = None
+        self.reset()
+        self.image_bytes = None
+        self.image_path = None
+        self.xm_history = []
+        self.url = "https://xmbot.net/web"
+    def reset(self):
+        self.session_id = str(uuid.uuid4())
+        return [], "已重置"
+    def try_read_image(self, filepath):
+        import base64
+        def is_image_file(filepath):
+            # 判断文件是否为图片
+            valid_image_extensions = [".jpg", ".jpeg", ".png", ".bmp", ".gif", ".tiff"]
+            file_extension = os.path.splitext(filepath)[1].lower()
+            return file_extension in valid_image_extensions
+        def read_image_as_bytes(filepath):
+            # 读取图片文件并返回比特流
+            with open(filepath, "rb") as f:
+                image_bytes = f.read()
+            return image_bytes
+        if is_image_file(filepath):
+            logging.info(f"读取图片文件: {filepath}")
+            image_bytes = read_image_as_bytes(filepath)
+            base64_encoded_image = base64.b64encode(image_bytes).decode()
+            self.image_bytes = base64_encoded_image
+            self.image_path = filepath
+        else:
+            self.image_bytes = None
+            self.image_path = None
+    def prepare_inputs(self, real_inputs, use_websearch, files, reply_language, chatbot):
+        fake_inputs = real_inputs
+        display_append = ""
+        limited_context = False
+        return limited_context, fake_inputs, display_append, real_inputs, chatbot
+    def handle_file_upload(self, files, chatbot):
+        """if the model accepts multi modal input, implement this function"""
+        if files:
+            for file in files:
+                if file.name:
+                    logging.info(f"尝试读取图像: {file.name}")
+                    self.try_read_image(file.name)
+            if self.image_path is not None:
+                chatbot = chatbot + [((self.image_path,), None)]
+            if self.image_bytes is not None:
+                logging.info("使用图片作为输入")
+                conv_id = str(uuid.uuid4())
+                data = {
+                    "user_id": self.api_key,
+                    "session_id": self.session_id,
+                    "uuid": conv_id,
+                    "data_type": "imgbase64",
+                    "data": self.image_bytes
+                }
+                response = requests.post(self.url, json=data)
+                response = json.loads(response.text)
+                logging.info(f"图片回复: {response['data']}")
+        return None, chatbot, None
+    def get_answer_at_once(self):
+        question = self.history[-1]["content"]
+        conv_id = str(uuid.uuid4())
+        data = {
+            "user_id": self.api_key,
+            "session_id": self.session_id,
+            "uuid": conv_id,
+            "data_type": "text",
+            "data": question
+        }
+        response = requests.post(self.url, json=data)
+        response = json.loads(response.text)
+        return response["data"], len(response["data"])
+def get_model(
+    model_name,
+    lora_model_path=None,
+    access_key=None,
+    temperature=None,
+    top_p=None,
+    system_prompt=None,
+) -> BaseLLMModel:
+    msg = f"模型设置为了： {model_name}"
+    model_type = ModelType.get_type(model_name)
+    lora_selector_visibility = False
+    lora_choices = []
+    dont_change_lora_selector = False
+    if model_type != ModelType.OpenAI:
+        config.local_embedding = True
+    # del current_model.model
+    model = None
+    try:
+        if model_type == ModelType.OpenAI:
+            logging.info(f"正在加载OpenAI模型: {model_name}")
+            model = OpenAIClient(
+                model_name=model_name,
+                api_key=access_key,
+                system_prompt=system_prompt,
+                temperature=temperature,
+                top_p=top_p,
+            )
+        elif model_type == ModelType.ChatGLM:
+            logging.info(f"正在加载ChatGLM模型: {model_name}")
+            model = ChatGLM_Client(model_name)
+        elif model_type == ModelType.LLaMA and lora_model_path == "":
+            msg = f"现在请为 {model_name} 选择LoRA模型"
+            logging.info(msg)
+            lora_selector_visibility = True
+            if os.path.isdir("lora"):
+                lora_choices = get_file_names(
+                    "lora", plain=True, filetypes=[""])
+            lora_choices = ["No LoRA"] + lora_choices
+        elif model_type == ModelType.LLaMA and lora_model_path != "":
+            logging.info(f"正在加载LLaMA模型: {model_name} + {lora_model_path}")
+            dont_change_lora_selector = True
+            if lora_model_path == "No LoRA":
+                lora_model_path = None
+                msg += " + No LoRA"
+            else:
+                msg += f" + {lora_model_path}"
+            model = LLaMA_Client(model_name, lora_model_path)
+        elif model_type == ModelType.XMBot:
+            model = XMBot_Client(api_key=access_key)
+        elif model_type == ModelType.Unknown:
+            raise ValueError(f"未知模型: {model_name}")
+        logging.info(msg)
+    except Exception as e:
+        logging.error(e)
+        msg = f"{STANDARD_ERROR_MSG}: {e}"
+    if dont_change_lora_selector:
+        return model, msg
+    else:
+        return model, msg, gr.Dropdown.update(choices=lora_choices, visible=lora_selector_visibility)
+if __name__ == "__main__":
+    with open("config.json", "r") as f:
+        openai_api_key = cjson.load(f)["openai_api_key"]
+    # set logging level to debug
+    logging.basicConfig(level=logging.DEBUG)
+    # client = ModelManager(model_name="gpt-3.5-turbo", access_key=openai_api_key)
+    client = get_model(model_name="chatglm-6b-int4")
+    chatbot = []
+    stream = False
+    # 测试账单功能
+    logging.info(colorama.Back.GREEN + "测试账单功能" + colorama.Back.RESET)
+    logging.info(client.billing_info())
+    # 测试问答
+    logging.info(colorama.Back.GREEN + "测试问答" + colorama.Back.RESET)
+    question = "巴黎是中国的首都吗？"
+    for i in client.predict(inputs=question, chatbot=chatbot, stream=stream):
+        logging.info(i)
+    logging.info(f"测试问答后history : {client.history}")
+    # 测试记忆力
+    logging.info(colorama.Back.GREEN + "测试记忆力" + colorama.Back.RESET)
+    question = "我刚刚问了你什么问题？"
+    for i in client.predict(inputs=question, chatbot=chatbot, stream=stream):
+        logging.info(i)
+    logging.info(f"测试记忆力后history : {client.history}")
+    # 测试重试功能
+    logging.info(colorama.Back.GREEN + "测试重试功能" + colorama.Back.RESET)
+    for i in client.retry(chatbot=chatbot, stream=stream):
+        logging.info(i)
+    logging.info(f"重试后history : {client.history}")
+    # # 测试总结功能
+    # print(colorama.Back.GREEN + "测试总结功能" + colorama.Back.RESET)
+    # chatbot, msg = client.reduce_token_size(chatbot=chatbot)
+    # print(chatbot, msg)
+    # print(f"总结后history: {client.history}")

modules/overwrites.py CHANGED Viewed

@@ -4,6 +4,7 @@ import logging
 from llama_index import Prompt
 from typing import List, Tuple
 import mdtex2html
 from modules.presets import *
 from modules.llama_func import *
@@ -20,23 +21,60 @@ def compact_text_chunks(self, prompt: Prompt, text_chunks: List[str]) -> List[st
 def postprocess(
-    self, y: List[Tuple[str | None, str | None]]
-) -> List[Tuple[str | None, str | None]]:
-    """
-    Parameters:
-        y: List of tuples representing the message and response pairs. Each message and response should be a string, which may be in Markdown format.
-    Returns:
-        List of tuples representing the message and response. Each message and response will be a string of HTML.
-    """
-    if y is None or y == []:
-        return []
-    user, bot = y[-1]
-    if not detect_converted_mark(user):
-        user = convert_asis(user)
-    if not detect_converted_mark(bot):
-        bot = convert_mdtext(bot)
-    y[-1] = (user, bot)
-    return y
 with open("./assets/custom.js", "r", encoding="utf-8") as f, open("./assets/Kelpy-Codos.js", "r", encoding="utf-8") as f2:
     customJS = f.read()

 from llama_index import Prompt
 from typing import List, Tuple
 import mdtex2html
+from gradio_client import utils as client_utils
 from modules.presets import *
 from modules.llama_func import *
 def postprocess(
+        self,
+        y: List[List[str | Tuple[str] | Tuple[str, str] | None] | Tuple],
+    ) -> List[List[str | Dict | None]]:
+        """
+        Parameters:
+            y: List of lists representing the message and response pairs. Each message and response should be a string, which may be in Markdown format.  It can also be a tuple whose first element is a string filepath or URL to an image/video/audio, and second (optional) element is the alt text, in which case the media file is displayed. It can also be None, in which case that message is not displayed.
+        Returns:
+            List of lists representing the message and response. Each message and response will be a string of HTML, or a dictionary with media information. Or None if the message is not to be displayed.
+        """
+        if y is None:
+            return []
+        processed_messages = []
+        for message_pair in y:
+            assert isinstance(
+                message_pair, (tuple, list)
+            ), f"Expected a list of lists or list of tuples. Received: {message_pair}"
+            assert (
+                len(message_pair) == 2
+            ), f"Expected a list of lists of length 2 or list of tuples of length 2. Received: {message_pair}"
+            processed_messages.append(
+                [
+                    self._postprocess_chat_messages(message_pair[0], "user"),
+                    self._postprocess_chat_messages(message_pair[1], "bot"),
+                ]
+            )
+        return processed_messages
+def postprocess_chat_messages(
+        self, chat_message: str | Tuple | List | None, message_type: str
+    ) -> str | Dict | None:
+        if chat_message is None:
+            return None
+        elif isinstance(chat_message, (tuple, list)):
+            filepath = chat_message[0]
+            mime_type = client_utils.get_mimetype(filepath)
+            filepath = self.make_temp_copy_if_needed(filepath)
+            return {
+                "name": filepath,
+                "mime_type": mime_type,
+                "alt_text": chat_message[1] if len(chat_message) > 1 else None,
+                "data": None,  # These last two fields are filled in by the frontend
+                "is_file": True,
+            }
+        elif isinstance(chat_message, str):
+            if message_type == "bot":
+                if not detect_converted_mark(chat_message):
+                    chat_message = convert_mdtext(chat_message)
+            elif message_type == "user":
+                if not detect_converted_mark(chat_message):
+                    chat_message = convert_asis(chat_message)
+            return chat_message
+        else:
+            raise ValueError(f"Invalid message for Chatbot component: {chat_message}")
 with open("./assets/custom.js", "r", encoding="utf-8") as f, open("./assets/Kelpy-Codos.js", "r", encoding="utf-8") as f2:
     customJS = f.read()

modules/presets.py CHANGED Viewed

@@ -1,89 +1,122 @@
 # -*- coding:utf-8 -*-
-import gradio as gr
 from pathlib import Path
 # ChatGPT 设置
-initial_prompt = "You are a helpful assistant."
 API_HOST = "api.openai.com"
 COMPLETION_URL = "https://api.openai.com/v1/chat/completions"
 BALANCE_API_URL="https://api.openai.com/dashboard/billing/credit_grants"
 USAGE_API_URL="https://api.openai.com/dashboard/billing/usage"
 HISTORY_DIR = Path("history")
 TEMPLATES_DIR = "templates"
 # 错误信息
-standard_error_msg = "☹️发生了错误："  # 错误信息的标准前缀
-error_retrieve_prompt = "请检查网络连接，或者API-Key是否有效。"  # 获取对话时发生错误
-connection_timeout_prompt = "连接超时，无法获取对话。"  # 连接超时
-read_timeout_prompt = "读取超时，无法获取对话。"  # 读取超时
-proxy_error_prompt = "代理错误，无法获取对话。"  # 代理错误
-ssl_error_prompt = "SSL错误，无法获取对话。"  # SSL 错误
-no_apikey_msg = "API key长度不是51位，请检查是否输入正确。"  # API key 长度不足 51 位
-no_input_msg = "请输入对话内容。"  # 未输入对话内容
-timeout_streaming = 10  # 流式对话时的超时时间
-timeout_all = 200  # 非流式对话时的超时时间
-enable_streaming_option = True  # 是否启用选择选择是否实时显示回答的勾选框
 HIDE_MY_KEY = False  # 如果你想在UI中隐藏你的 API 密钥，将此值设置为 True
 CONCURRENT_COUNT = 100 # 允许同时使用的用户数量
 SIM_K = 5
 INDEX_QUERY_TEMPRATURE = 1.0
-title = """<h1 align="left" style="min-width:200px; margin-top:6px; white-space: nowrap;">川虎ChatGPT 🚀</h1>"""
-description = """\
 <div align="center" style="margin:16px 0">
 由Bilibili [土川虎虎虎](https://space.bilibili.com/29125536) 和 [明昭MZhao](https://space.bilibili.com/24807452)开发
-访问川虎ChatGPT的 [GitHub项目](https://github.com/GaiZhenbiao/ChuanhuChatGPT) 下载最新版脚本
-此App使用 `gpt-3.5-turbo` 大语言模型
 </div>
 """
-footer = """\
-<div class="versions">{versions}</div>
 """
-summarize_prompt = "你是谁？我们刚才聊了什么？"  # 总结对话时的 prompt
-MODELS = [
     "gpt-3.5-turbo",
     "gpt-3.5-turbo-0301",
     "gpt-4",
     "gpt-4-0314",
     "gpt-4-32k",
     "gpt-4-32k-0314",
-]  # 可选的模型
-MODEL_SOFT_TOKEN_LIMIT = {
-    "gpt-3.5-turbo": {
-        "streaming": 3500,
-        "all": 3500
-    },
-    "gpt-3.5-turbo-0301": {
-        "streaming": 3500,
-        "all": 3500
-    },
-    "gpt-4": {
-        "streaming": 7500,
-        "all": 7500
-    },
-    "gpt-4-0314": {
-        "streaming": 7500,
-        "all": 7500
-    },
-    "gpt-4-32k": {
-        "streaming": 31000,
-        "all": 31000
-    },
-    "gpt-4-32k-0314": {
-        "streaming": 31000,
-        "all": 31000
-    }
 }
 REPLY_LANGUAGES = [
     "简体中文",
     "繁體中文",

 # -*- coding:utf-8 -*-
+import os
 from pathlib import Path
+import gradio as gr
+CHATGLM_MODEL = None
+CHATGLM_TOKENIZER = None
+LLAMA_MODEL = None
+LLAMA_INFERENCER = None
 # ChatGPT 设置
+INITIAL_SYSTEM_PROMPT = "You are a helpful assistant."
 API_HOST = "api.openai.com"
 COMPLETION_URL = "https://api.openai.com/v1/chat/completions"
 BALANCE_API_URL="https://api.openai.com/dashboard/billing/credit_grants"
 USAGE_API_URL="https://api.openai.com/dashboard/billing/usage"
 HISTORY_DIR = Path("history")
+HISTORY_DIR = "history"
 TEMPLATES_DIR = "templates"
 # 错误信息
+STANDARD_ERROR_MSG = "☹️发生了错误："  # standard prefix for error messages
+GENERAL_ERROR_MSG = "获取对话时发生错误，请查看后台日志"
+ERROR_RETRIEVE_MSG = "请检查网络连接，或者API-Key是否有效。"
+CONNECTION_TIMEOUT_MSG = "连接超时，无法获取对话。"  # connection timed out
+READ_TIMEOUT_MSG = "读取超时，无法获取对话。"  # read timed out
+PROXY_ERROR_MSG = "代理错误，无法获取对话。"  # proxy error
+SSL_ERROR_PROMPT = "SSL错误，无法获取对话。"  # SSL error
+NO_APIKEY_MSG = "API key为空，请检查是否输入正确。"  # the API key is empty
+NO_INPUT_MSG = "请输入对话内容。"  # no conversation content was entered
+BILLING_NOT_APPLICABLE_MSG = "账单信息不适用" # billing info returned by locally run models
+TIMEOUT_STREAMING = 60  # timeout for streaming conversations
+TIMEOUT_ALL = 200  # timeout for non-streaming conversations
+ENABLE_STREAMING_OPTION = True  # whether to show the checkbox for choosing real-time display of answers
 HIDE_MY_KEY = False  # 如果你想在UI中隐藏你的 API 密钥，将此值设置为 True
 CONCURRENT_COUNT = 100 # 允许同时使用的用户数量
 SIM_K = 5
 INDEX_QUERY_TEMPRATURE = 1.0
+CHUANHU_TITLE = """<h1 align="left">川虎Chat 🚀</h1>"""
+CHUANHU_DESCRIPTION = """\
 <div align="center" style="margin:16px 0">
 由Bilibili [土川虎虎虎](https://space.bilibili.com/29125536) 和 [明昭MZhao](https://space.bilibili.com/24807452)开发
+访问川虎Chat的 [GitHub项目](https://github.com/GaiZhenbiao/ChuanhuChatGPT) 下载最新版脚本
 </div>
 """
+FOOTER = """<div class="versions">{versions}</div>"""
+APPEARANCE_SWITCHER = """
+<div style="display: flex; justify-content: space-between;">
+<span style="margin-top: 4px !important;">切换亮暗色主题</span>
+<span><label class="apSwitch" for="checkbox">
+    <input type="checkbox" id="checkbox">
+    <div class="apSlider"></div>
+</label></span>
+</div>
 """
+SUMMARIZE_PROMPT = "你是谁？我们刚才聊了什么？"  # 总结对话时的 prompt
+ONLINE_MODELS = [
     "gpt-3.5-turbo",
     "gpt-3.5-turbo-0301",
     "gpt-4",
     "gpt-4-0314",
     "gpt-4-32k",
     "gpt-4-32k-0314",
+    "xmbot",
+]
+LOCAL_MODELS = [
+    "chatglm-6b",
+    "chatglm-6b-int4",
+    "chatglm-6b-int4-qe",
+    "llama-7b-hf",
+    "llama-7b-hf-int4",
+    "llama-7b-hf-int8",
+    "llama-13b-hf",
+    "llama-13b-hf-int4",
+    "llama-30b-hf",
+    "llama-30b-hf-int4",
+    "llama-65b-hf"
+]
+if os.environ.get('HIDE_LOCAL_MODELS', 'false') == 'true':
+    MODELS = ONLINE_MODELS
+else:
+    MODELS = ONLINE_MODELS + LOCAL_MODELS
+DEFAULT_MODEL = 0
+os.makedirs("models", exist_ok=True)
+os.makedirs("lora", exist_ok=True)
+os.makedirs("history", exist_ok=True)
+for dir_name in os.listdir("models"):
+    if os.path.isdir(os.path.join("models", dir_name)):
+        if dir_name not in MODELS:
+            MODELS.append(dir_name)
+MODEL_TOKEN_LIMIT = {
+    "gpt-3.5-turbo": 4096,
+    "gpt-3.5-turbo-0301": 4096,
+    "gpt-4": 8192,
+    "gpt-4-0314": 8192,
+    "gpt-4-32k": 32768,
+    "gpt-4-32k-0314": 32768
 }
+TOKEN_OFFSET = 1000 # subtracted from the model's token limit to get the soft limit; once the soft limit is reached, token usage is reduced automatically
+DEFAULT_TOKEN_LIMIT = 3000 # default token limit
+REDUCE_TOKEN_FACTOR = 0.5 # multiplied by the model's token limit to get the target token count; when reducing, usage is brought below that target
 REPLY_LANGUAGES = [
     "简体中文",
     "繁體中文",

modules/shared.py CHANGED Viewed

@@ -41,11 +41,11 @@ class State:
     def switching_api_key(self, func):
         if not hasattr(self, "api_key_queue"):
             return func
         def wrapped(*args, **kwargs):
             api_key = self.api_key_queue.get()
-            args = list(args)[1:]
-            ret = func(api_key, *args, **kwargs)
             self.api_key_queue.put(api_key)
             return ret

     def switching_api_key(self, func):
         if not hasattr(self, "api_key_queue"):
             return func
         def wrapped(*args, **kwargs):
             api_key = self.api_key_queue.get()
+            args[0].api_key = api_key
+            ret = func(*args, **kwargs)
             self.api_key_queue.put(api_key)
             return ret

modules/utils.py CHANGED Viewed

@@ -34,6 +34,85 @@ if TYPE_CHECKING:
         headers: List[str]
         data: List[List[str | int | bool]]
 def count_token(message):
     encoding = tiktoken.get_encoding("cl100k_base")
@@ -121,10 +200,13 @@ def convert_asis(userinput):
 def detect_converted_mark(userinput):
-    if userinput.endswith(ALREADY_CONVERTED_MARK):
         return True
-    else:
-        return False
 def detect_language(code):
@@ -153,107 +235,22 @@ def construct_assistant(text):
     return construct_text("assistant", text)
-def construct_token_message(tokens: List[int]):
-    token_sum = 0
-    for i in range(len(tokens)):
-        token_sum += sum(tokens[: i + 1])
-    return f"Token 计数: {sum(tokens)}，本次对话累计消耗了 {token_sum} tokens"
-def delete_first_conversation(history, previous_token_count):
-    if history:
-        del history[:2]
-        del previous_token_count[0]
-    return (
-        history,
-        previous_token_count,
-        construct_token_message(previous_token_count),
-    )
-def delete_last_conversation(chatbot, history, previous_token_count):
-    if len(chatbot) > 0 and standard_error_msg in chatbot[-1][1]:
-        logging.info("由于包含报错信息，只删除chatbot记录")
-        chatbot.pop()
-        return chatbot, history
-    if len(history) > 0:
-        logging.info("删除了一组对话历史")
-        history.pop()
-        history.pop()
-    if len(chatbot) > 0:
-        logging.info("删除了一组chatbot对话")
-        chatbot.pop()
-    if len(previous_token_count) > 0:
-        logging.info("删除了一组对话的token计数记录")
-        previous_token_count.pop()
-    return (
-        chatbot,
-        history,
-        previous_token_count,
-        construct_token_message(previous_token_count),
-    )
 def save_file(filename, system, history, chatbot, user_name):
-    logging.info(f"{user_name} 保存对话历史中……")
-    os.makedirs(HISTORY_DIR / user_name, exist_ok=True)
     if filename.endswith(".json"):
         json_s = {"system": system, "history": history, "chatbot": chatbot}
         print(json_s)
-        with open(os.path.join(HISTORY_DIR / user_name, filename), "w") as f:
             json.dump(json_s, f)
     elif filename.endswith(".md"):
         md_s = f"system: \n- {system} \n"
         for data in history:
             md_s += f"\n{data['role']}: \n- {data['content']} \n"
-        with open(os.path.join(HISTORY_DIR / user_name, filename), "w", encoding="utf8") as f:
             f.write(md_s)
-    logging.info(f"{user_name} 保存对话历史完毕")
-    return os.path.join(HISTORY_DIR / user_name, filename)
-def save_chat_history(filename, system, history, chatbot, user_name):
-    if filename == "":
-        return
-    if not filename.endswith(".json"):
-        filename += ".json"
-    return save_file(filename, system, history, chatbot, user_name)
-def export_markdown(filename, system, history, chatbot, user_name):
-    if filename == "":
-        return
-    if not filename.endswith(".md"):
-        filename += ".md"
-    return save_file(filename, system, history, chatbot, user_name)
-def load_chat_history(filename, system, history, chatbot, user_name):
-    logging.info(f"{user_name} 加载对话历史中……")
-    if type(filename) != str:
-        filename = filename.name
-    try:
-        with open(os.path.join(HISTORY_DIR / user_name, filename), "r") as f:
-            json_s = json.load(f)
-        try:
-            if type(json_s["history"][0]) == str:
-                logging.info("历史记录格式为旧版，正在转换……")
-                new_history = []
-                for index, item in enumerate(json_s["history"]):
-                    if index % 2 == 0:
-                        new_history.append(construct_user(item))
-                    else:
-                        new_history.append(construct_assistant(item))
-                json_s["history"] = new_history
-                logging.info(new_history)
-        except:
-            # 没有对话历史
-            pass
-        logging.info(f"{user_name} 加载对话历史完毕")
-        return filename, json_s["system"], json_s["history"], json_s["chatbot"]
-    except FileNotFoundError:
-        logging.info(f"{user_name} 没有找到对话历史文件，不执行任何操作")
-        return filename, system, history, chatbot
 def sorted_by_pinyin(list):
@@ -261,7 +258,7 @@ def sorted_by_pinyin(list):
 def get_file_names(dir, plain=False, filetypes=[".json"]):
-    logging.info(f"获取文件名列表，目录为{dir}，文件类型为{filetypes}，是否为纯文本列表{plain}")
     files = []
     try:
         for type in filetypes:
@@ -279,14 +276,13 @@ def get_file_names(dir, plain=False, filetypes=[".json"]):
 def get_history_names(plain=False, user_name=""):
-    logging.info(f"从用户 {user_name} 中获取历史记录文件名列表")
-    return get_file_names(HISTORY_DIR / user_name, plain)
 def load_template(filename, mode=0):
-    logging.info(f"加载模板文件{filename}，模式为{mode}（0为返回字典和下拉菜单，1为返回下拉菜单，2为返回字典）")
     lines = []
-    logging.info("Loading template...")
     if filename.endswith(".json"):
         with open(os.path.join(TEMPLATES_DIR, filename), "r", encoding="utf8") as f:
             lines = json.load(f)
@@ -310,23 +306,18 @@ def load_template(filename, mode=0):
 def get_template_names(plain=False):
-    logging.info("获取模板文件名列表")
     return get_file_names(TEMPLATES_DIR, plain, filetypes=[".csv", "json"])
 def get_template_content(templates, selection, original_system_prompt):
-    logging.info(f"应用模板中，选择为{selection}，原始系统提示为{original_system_prompt}")
     try:
         return templates[selection]
     except:
         return original_system_prompt
-def reset_state():
-    logging.info("重置状态")
-    return [], [], [], construct_token_message([0])
 def reset_textbox():
     logging.debug("重置文本框")
     return gr.update(value="")
@@ -388,7 +379,7 @@ def get_geoip():
         logging.warning(f"无法获取IP地址信息。\n{data}")
         if data["reason"] == "RateLimited":
             return (
-                f"获取IP地理位置失败，因为达到了检测IP的速率限制。聊天功能可能仍然可用。"
             )
         else:
             return f"获取IP地理位置失败。原因：{data['reason']}。你仍然可以使用聊天功能。"
@@ -418,7 +409,7 @@ def find_n(lst, max_num):
 def start_outputing():
     logging.debug("显示取消按钮，隐藏发送按钮")
-    return gr.Button.update(visible=True), gr.Button.update(visible=False)
 def end_outputing():
@@ -440,8 +431,8 @@ def transfer_input(inputs):
     return (
         inputs,
         gr.update(value=""),
-        gr.Button.update(visible=True),
         gr.Button.update(visible=False),
     )
@@ -504,15 +495,15 @@ def add_details(lst):
     return nodes
-def sheet_to_string(sheet):
-    result = ""
     for index, row in sheet.iterrows():
         row_string = ""
         for column in sheet.columns:
             row_string += f"{column}: {row[column]}, "
         row_string = row_string.rstrip(", ")
         row_string += "."
-        result += row_string + "\n"
     return result
 def excel_to_string(file_path):
@@ -520,17 +511,23 @@ def excel_to_string(file_path):
     excel_file = pd.read_excel(file_path, engine='openpyxl', sheet_name=None)
     # 初始化结果字符串
-    result = ""
     # 遍历每一个工作表
     for sheet_name, sheet_data in excel_file.items():
-        # 将工作表名称添加到结果字符串
-        result += f"Sheet: {sheet_name}\n"
         # 处理当前工作表并添加到结果字符串
-        result += sheet_to_string(sheet_data)
-        # 在不同工作表之间添加分隔符
-        result += "\n" + ("-" * 20) + "\n\n"
     return result

         headers: List[str]
         data: List[List[str | int | bool]]
def predict(current_model, *args):
    """Stream the results of ``current_model.predict(*args)``.

    This is a generator: every item produced by the model's ``predict`` call
    is yielded unchanged and in order.

    Args:
        current_model: Object exposing a ``predict`` method that returns an
            iterable.
        *args: Positional arguments forwarded verbatim to that method.
    """
    # ``yield from`` replaces the manual re-yield loop and avoids binding a
    # local named ``iter`` that shadowed the built-in.
    yield from current_model.predict(*args)
def billing_info(current_model):
    """Return whatever ``current_model.billing_info()`` returns."""
    fetch = current_model.billing_info
    return fetch()
def set_key(current_model, *args):
    """Forward ``args`` to ``current_model.set_key`` and return its result."""
    handler = current_model.set_key
    return handler(*args)
def load_chat_history(current_model, *args):
    """Forward ``args`` to ``current_model.load_chat_history`` and return its result."""
    handler = current_model.load_chat_history
    return handler(*args)
def interrupt(current_model, *args):
    """Forward ``args`` to ``current_model.interrupt`` and return its result."""
    handler = current_model.interrupt
    return handler(*args)
def reset(current_model, *args):
    """Forward ``args`` to ``current_model.reset`` and return its result."""
    handler = current_model.reset
    return handler(*args)
def retry(current_model, *args):
    """Stream the results of ``current_model.retry(*args)``.

    This is a generator: every item produced by the model's ``retry`` call is
    yielded unchanged and in order.

    Args:
        current_model: Object exposing a ``retry`` method that returns an
            iterable.
        *args: Positional arguments forwarded verbatim to that method.
    """
    # ``yield from`` replaces the manual re-yield loop and avoids binding a
    # local named ``iter`` that shadowed the built-in.
    yield from current_model.retry(*args)
def delete_first_conversation(current_model, *args):
    """Forward ``args`` to ``current_model.delete_first_conversation`` and return its result."""
    handler = current_model.delete_first_conversation
    return handler(*args)
def delete_last_conversation(current_model, *args):
    """Forward ``args`` to ``current_model.delete_last_conversation`` and return its result."""
    handler = current_model.delete_last_conversation
    return handler(*args)
def set_system_prompt(current_model, *args):
    """Forward ``args`` to ``current_model.set_system_prompt`` and return its result."""
    handler = current_model.set_system_prompt
    return handler(*args)
def save_chat_history(current_model, *args):
    """Forward ``args`` to ``current_model.save_chat_history`` and return its result."""
    handler = current_model.save_chat_history
    return handler(*args)
def export_markdown(current_model, *args):
    """Forward ``args`` to ``current_model.export_markdown`` and return its result."""
    handler = current_model.export_markdown
    return handler(*args)
# NOTE(review): a function with this same name and an equivalent body is
# already defined earlier in this module; this later definition rebinds the
# name. One of the two can probably be dropped -- confirm before removing.
def load_chat_history(current_model, *args):
    """Forward ``args`` to ``current_model.load_chat_history`` and return its result."""
    handler = current_model.load_chat_history
    return handler(*args)
def set_token_upper_limit(current_model, *args):
    """Forward ``args`` to ``current_model.set_token_upper_limit`` and return its result."""
    handler = current_model.set_token_upper_limit
    return handler(*args)
def set_temperature(current_model, *args):
    """Call ``current_model.set_temperature(*args)``; its result is discarded."""
    setter = current_model.set_temperature
    setter(*args)
def set_top_p(current_model, *args):
    """Call ``current_model.set_top_p(*args)``; its result is discarded."""
    setter = current_model.set_top_p
    setter(*args)
def set_n_choices(current_model, *args):
    """Call ``current_model.set_n_choices(*args)``; its result is discarded."""
    setter = current_model.set_n_choices
    setter(*args)
def set_stop_sequence(current_model, *args):
    """Call ``current_model.set_stop_sequence(*args)``; its result is discarded."""
    setter = current_model.set_stop_sequence
    setter(*args)
def set_max_tokens(current_model, *args):
    """Call ``current_model.set_max_tokens(*args)``; its result is discarded."""
    setter = current_model.set_max_tokens
    setter(*args)
def set_presence_penalty(current_model, *args):
    """Call ``current_model.set_presence_penalty(*args)``; its result is discarded."""
    setter = current_model.set_presence_penalty
    setter(*args)
def set_frequency_penalty(current_model, *args):
    """Call ``current_model.set_frequency_penalty(*args)``; its result is discarded."""
    setter = current_model.set_frequency_penalty
    setter(*args)
def set_logit_bias(current_model, *args):
    """Call ``current_model.set_logit_bias(*args)``; its result is discarded."""
    setter = current_model.set_logit_bias
    setter(*args)
def set_user_identifier(current_model, *args):
    """Call ``current_model.set_user_identifier(*args)``; its result is discarded."""
    setter = current_model.set_user_identifier
    setter(*args)
def set_single_turn(current_model, *args):
    """Call ``current_model.set_single_turn(*args)``; its result is discarded."""
    setter = current_model.set_single_turn
    setter(*args)
def handle_file_upload(current_model, *args):
    """Forward ``args`` to ``current_model.handle_file_upload`` and return its result."""
    handler = current_model.handle_file_upload
    return handler(*args)
 def count_token(message):
     encoding = tiktoken.get_encoding("cl100k_base")
 def detect_converted_mark(userinput):
     """Report whether ``userinput`` ends with ``ALREADY_CONVERTED_MARK``.

     Returns:
         ``True`` if the input ends with the mark, ``False`` if it does not.
         If the check itself fails (for example the input has no
         ``endswith`` method), ``True`` is returned.
     """
     try:
         return bool(userinput.endswith(ALREADY_CONVERTED_MARK))
     except Exception:
         # A bare ``except:`` would also swallow KeyboardInterrupt and
         # SystemExit; only ordinary errors fall back to ``True`` here.
         return True
 def detect_language(code):
     return construct_text("assistant", text)
 def save_file(filename, system, history, chatbot, user_name):
     """Write a conversation into the user's folder under ``HISTORY_DIR``.

     The folder ``HISTORY_DIR/<user_name>`` is created when missing.  A
     ``.json`` filename stores ``system``, ``history`` and ``chatbot`` as one
     JSON object (the object is also printed to stdout); a ``.md`` filename
     stores the system prompt followed by one entry per ``history`` item,
     using each item's ``"role"`` and ``"content"`` keys.  For any other
     extension no file is written.

     Returns:
         The joined path ``HISTORY_DIR/<user_name>/<filename>``.
     """
     logging.debug(f"{user_name} 保存对话历史中……")
     user_dir = os.path.join(HISTORY_DIR, user_name)
     os.makedirs(user_dir, exist_ok=True)
     if filename.endswith(".json"):
         payload = {"system": system, "history": history, "chatbot": chatbot}
         print(payload)
         with open(os.path.join(user_dir, filename), "w") as out:
             json.dump(payload, out)
     elif filename.endswith(".md"):
         header = f"system: \n- {system} \n"
         entries = [
             f"\n{data['role']}: \n- {data['content']} \n" for data in history
         ]
         markdown = header + "".join(entries)
         with open(os.path.join(user_dir, filename), "w", encoding="utf8") as out:
             out.write(markdown)
     logging.debug(f"{user_name} 保存对话历史完毕")
     return os.path.join(user_dir, filename)
 def sorted_by_pinyin(list):
 def get_file_names(dir, plain=False, filetypes=[".json"]):
+    logging.debug(f"获取文件名列表，目录为{dir}，文件类型为{filetypes}，是否为纯文本列表{plain}")
     files = []
     try:
         for type in filetypes:
 def get_history_names(plain=False, user_name=""):
     """Return ``get_file_names`` applied to ``HISTORY_DIR/<user_name>``.

     ``plain`` is passed straight through to ``get_file_names``.
     """
     logging.debug(f"从用户 {user_name} 中获取历史记录文件名列表")
     user_history_dir = os.path.join(HISTORY_DIR, user_name)
     return get_file_names(user_history_dir, plain)
 def load_template(filename, mode=0):
+    logging.debug(f"加载模板文件{filename}，模式为{mode}（0为返回字典和下拉菜单，1为返回下拉菜单，2为返回字典）")
     lines = []
     if filename.endswith(".json"):
         with open(os.path.join(TEMPLATES_DIR, filename), "r", encoding="utf8") as f:
             lines = json.load(f)
 def get_template_names(plain=False):
     """Return ``get_file_names`` applied to ``TEMPLATES_DIR`` for template files.

     ``plain`` is passed straight through to ``get_file_names``.
     """
     logging.debug("获取模板文件名列表")
     # NOTE(review): the second entry is "json" without a leading dot, unlike
     # ".csv" -- confirm against get_file_names whether this is intended.
     template_types = [".csv", "json"]
     return get_file_names(TEMPLATES_DIR, plain, filetypes=template_types)
 def get_template_content(templates, selection, original_system_prompt):
     """Look up ``selection`` in ``templates``, falling back to the original prompt.

     Args:
         templates: Container indexed with ``templates[selection]``.
         selection: Key of the chosen template.
         original_system_prompt: Value returned when the lookup fails.

     Returns:
         ``templates[selection]`` when the lookup succeeds, otherwise
         ``original_system_prompt``.
     """
     logging.debug(f"应用模板中，选择为{selection}，原始系统提示为{original_system_prompt}")
     try:
         return templates[selection]
     except Exception:
         # Any ordinary lookup failure keeps the current prompt; a bare
         # ``except:`` would also have swallowed KeyboardInterrupt/SystemExit.
         return original_system_prompt
 def reset_textbox():
     """Return a ``gr.update`` whose value is the empty string."""
     logging.debug("重置文本框")
     cleared = gr.update(value="")
     return cleared
         logging.warning(f"无法获取IP地址信息。\n{data}")
         if data["reason"] == "RateLimited":
             return (
+                f"您的IP区域：未知。"
             )
         else:
             return f"获取IP地理位置失败。原因：{data['reason']}。你仍然可以使用聊天功能。"
 def start_outputing():
     """Return two button updates: the first hides, the second shows.

     The log message describes this as hiding the send button and showing
     the cancel button; which output component receives which update is
     decided by the caller -- presumably (send, cancel), verify there.
     """
     logging.debug("显示取消按钮，隐藏发送按钮")
     hidden = gr.Button.update(visible=False)
     shown = gr.Button.update(visible=True)
     return hidden, shown
 def end_outputing():
     return (
         inputs,
         gr.update(value=""),
         gr.Button.update(visible=False),
+        gr.Button.update(visible=True),
     )
     return nodes
def sheet_to_string(sheet, sheet_name = None):
    """Render each row of ``sheet`` as one ``"col: value, ... ."`` string.

    Args:
        sheet: Object providing ``iterrows()`` and ``columns`` (a pandas
            DataFrame in the visible caller).
        sheet_name: Accepted for the caller's benefit; not used here.

    Returns:
        A list with one string per row, in row order.  Each string lists
        ``"<column>: <value>"`` pairs separated by ``", "`` and ends with
        ``"."``.
    """
    result = []
    for _, row in sheet.iterrows():
        # Joining the pairs avoids the old ``rstrip(", ")`` cleanup, which
        # strips a *set* of characters and therefore also removed trailing
        # commas/spaces that belonged to the last cell's value.
        pairs = ", ".join(f"{column}: {row[column]}" for column in sheet.columns)
        result.append(pairs + ".")
    return result
 def excel_to_string(file_path):
     """Convert every worksheet of an Excel file with ``sheet_to_string``.

     Despite the name, the return value is a list: the ``sheet_to_string``
     results of all worksheets concatenated in iteration order.
     """
     # With sheet_name=None the result is iterated as (sheet name, sheet data)
     # pairs below.
     workbook = pd.read_excel(file_path, engine='openpyxl', sheet_name=None)
     # Accumulated rows from all worksheets.
     rows = []
     for name, frame in workbook.items():
         # Convert the current worksheet and append its rows.
         rows.extend(sheet_to_string(frame, sheet_name=name))
     return rows
def get_last_day_of_month(any_day):
    """Return the last day of the month that contains ``any_day``.

    ``any_day`` must support ``replace(day=...)`` and ``timedelta``
    arithmetic; the result has the same type as those operations produce.
    """
    # Day 28 exists in every month, so the 28th plus four days always lands
    # in the following month.
    in_next_month = any_day.replace(day=28) + datetime.timedelta(days=4)
    # Stepping back by that date's day-of-month lands on the final day of
    # the original month.
    overshoot = datetime.timedelta(days=in_next_month.day)
    return in_next_month - overshoot
def get_model_source(model_name, alternative_source):
    """Return the Hugging Face URL for ``"gpt2-medium"``; otherwise ``None``.

    ``alternative_source`` is accepted but not used in the visible code.
    """
    if model_name != "gpt2-medium":
        return None
    return "https://huggingface.co/gpt2-medium"

requirements.txt CHANGED Viewed

@@ -13,3 +13,4 @@ markdown
 PyPDF2
 pdfplumber
 pandas

 PyPDF2
 pdfplumber
 pandas
+commentjson

requirements_advanced.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+transformers
+torch
+icetk
+protobuf==3.19.0
+git+https://github.com/OptimalScale/LMFlow.git
+cpm-kernels
+sentence_transformers

run_Linux.sh CHANGED Viewed

@@ -1,10 +1,10 @@
 #!/bin/bash
 # 获取脚本所在目录
-script_dir=$(dirname "$0")
 # 将工作目录更改为脚本所在目录
-cd "$script_dir"
 # 检查Git仓库是否有更新
 git remote update
@@ -23,3 +23,9 @@ if ! git status -uno | grep 'up to date' > /dev/null; then
 	# 重新启动服务器
 	nohup python3 ChuanhuChatbot.py &
 fi

 #!/bin/bash
 # 获取脚本所在目录
+script_dir=$(dirname "$(readlink -f "$0")")
 # 将工作目录更改为脚本所在目录
+cd "$script_dir" || exit
 # 检查Git仓库是否有更新
 git remote update
 	# 重新启动服务器
 	nohup python3 ChuanhuChatbot.py &
 fi
+# 检查ChuanhuChatbot.py是否在运行
+if ! pgrep -f ChuanhuChatbot.py > /dev/null; then
+	# 如果没有运行，启动服务器
+	nohup python3 ChuanhuChatbot.py &
+fi

run_macOS.command CHANGED Viewed

@@ -1,10 +1,10 @@
 #!/bin/bash
 # 获取脚本所在目录
-script_dir=$(dirname "$0")
 # 将工作目录更改为脚本所在目录
-cd "$script_dir"
 # 检查Git仓库是否有更新
 git remote update
@@ -23,3 +23,9 @@ if ! git status -uno | grep 'up to date' > /dev/null; then
 	# 重新启动服务器
 	nohup python3 ChuanhuChatbot.py &
 fi

 #!/bin/bash
 # 获取脚本所在目录
+script_dir=$(dirname "$(readlink -f "$0")")
 # 将工作目录更改为脚本所在目录
+cd "$script_dir" || exit
 # 检查Git仓库是否有更新
 git remote update
 	# 重新启动服务器
 	nohup python3 ChuanhuChatbot.py &
 fi
+# 检查ChuanhuChatbot.py是否在运行
+if ! pgrep -f ChuanhuChatbot.py > /dev/null; then
+	# 如果没有运行，启动服务器
+	nohup python3 ChuanhuChatbot.py &
+fi