Sean-Case committed c2ff47a (1 parent: 7339026)

Put sources behind accordion, minor change to model params. Gitignore update
Files changed:
- .gitignore (+3 -1)
- app.py (+5 -3)
- chatfuncs/chatfuncs.py (+2 -3)
.gitignore
@@ -3,6 +3,8 @@
 *.pdf
 *.spec
 *.toc
+*.csv
 bootstrapper.py
 build/*
-dist/*
+dist/*
+Q tests/*
app.py
@@ -95,11 +95,13 @@ def load_model(model_type, gpu_layers, gpu_config=None, cpu_config=None, torch_d
         #model = AutoModelForCausalLM.from_pretrained('Aryanne/Orca-Mini-3B-gguf', model_type='llama', model_file='q5_0-orca-mini-3b.gguf', **vars(gpu_config)) # **asdict(CtransRunConfig_cpu())
         #model = AutoModelForCausalLM.from_pretrained('Aryanne/Wizard-Orca-3B-gguf', model_type='llama', model_file='q4_1-wizard-orca-3b.gguf', **vars(gpu_config)) # **asdict(CtransRunConfig_cpu())
         model = AutoModelForCausalLM.from_pretrained('TheBloke/Mistral-7B-OpenOrca-GGUF', model_type='mistral', model_file='mistral-7b-openorca.Q4_K_M.gguf', **vars(gpu_config)) # **asdict(CtransRunConfig_cpu())
+        #model = AutoModelForCausalLM.from_pretrained('TheBloke/MistralLite-7B-GGUF', model_type='mistral', model_file='mistrallite.Q4_K_M.gguf', **vars(gpu_config)) # **asdict(CtransRunConfig_cpu())
 
     except:
         #model = AutoModelForCausalLM.from_pretrained('Aryanne/Orca-Mini-3B-gguf', model_type='llama', model_file='q5_0-orca-mini-3b.gguf', **vars(cpu_config)) #**asdict(CtransRunConfig_gpu())
         #model = AutoModelForCausalLM.from_pretrained('Aryanne/Wizard-Orca-3B-gguf', model_type='llama', model_file='q4_1-wizard-orca-3b.gguf', **vars(cpu_config)) # **asdict(CtransRunConfig_cpu())
         model = AutoModelForCausalLM.from_pretrained('TheBloke/Mistral-7B-OpenOrca-GGUF', model_type='mistral', model_file='mistral-7b-openorca.Q4_K_M.gguf', **vars(cpu_config)) # **asdict(CtransRunConfig_cpu())
+        #model = AutoModelForCausalLM.from_pretrained('TheBloke/MistralLite-7B-GGUF', model_type='mistral', model_file='mistrallite.Q4_K_M.gguf', **vars(cpu_config)) # **asdict(CtransRunConfig_cpu())
 
     tokenizer = []
 
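The hunk above shows load_model()'s pattern: try the GPU configuration first, and fall back to CPU settings if loading fails. A minimal runnable sketch of that pattern, assuming the ctransformers library; the helper name load_mistral and the two config objects are illustrative, not part of app.py:

```python
# GPU-first, CPU-fallback loading, as in the try/except above.
# gpu_config and cpu_config can be any objects whose attributes are
# valid keyword arguments for from_pretrained().
from ctransformers import AutoModelForCausalLM

def load_mistral(gpu_config, cpu_config):  # illustrative helper
    try:
        # First attempt: settings that offload layers to the GPU.
        return AutoModelForCausalLM.from_pretrained(
            'TheBloke/Mistral-7B-OpenOrca-GGUF',
            model_type='mistral',
            model_file='mistral-7b-openorca.Q4_K_M.gguf',
            **vars(gpu_config))
    except Exception:
        # Any failure (no GPU, missing CUDA libs) falls through to CPU.
        return AutoModelForCausalLM.from_pretrained(
            'TheBloke/Mistral-7B-OpenOrca-GGUF',
            model_type='mistral',
            model_file='mistral-7b-openorca.Q4_K_M.gguf',
            **vars(cpu_config))
```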
@@ -192,12 +194,12 @@ with block:
     with gr.Row():
         chat_height = 500
         chatbot = gr.Chatbot(height=chat_height, avatar_images=('user.jfif', 'bot.jpg'),bubble_full_width = False, scale = 1)
-
-
+        with gr.Accordion("Open this tab to see the source paragraphs used to generate the answer", open = False):
+            sources = gr.HTML(value = "Source paragraphs with the most relevant text will appear here", height=chat_height, scale = 2)
 
     with gr.Row():
         message = gr.Textbox(
-            label="Enter your question here
+            label="Enter your question here",
             lines=1,
         )
     with gr.Row():
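This second hunk is the commit's headline change: the source paragraphs now live inside a collapsed gr.Accordion rather than being always visible. A self-contained sketch of the same layout, assuming Gradio's Blocks API, with labels shortened and avatar images omitted for brevity:

```python
# Collapsed accordion beside the chatbot, as introduced above.
import gradio as gr

with gr.Blocks() as block:
    with gr.Row():
        chatbot = gr.Chatbot(height=500)
        # open=False keeps the sources panel collapsed until the
        # user expands it.
        with gr.Accordion("See the source paragraphs", open=False):
            sources = gr.HTML(value="Source paragraphs will appear here")
    with gr.Row():
        message = gr.Textbox(label="Enter your question here", lines=1)

block.launch()
```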
chatfuncs/chatfuncs.py
@@ -84,15 +84,14 @@ top_k: int = 3
 top_p: float = 1
 repetition_penalty: float = 1.3
 flan_alpaca_repetition_penalty: float = 1.3
-tinyllama_repetition_penalty: float = 1.5
 last_n_tokens: int = 64
-max_new_tokens: int =
+max_new_tokens: int = 256
 seed: int = 42
 reset: bool = False
 stream: bool = True
 threads: int = threads
 batch_size:int = 256
-context_length:int =
+context_length:int = 2048
 sample = True
 
 
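The parameter changes cap generation at 256 new tokens, set a 2048-token context window, and remove tinyllama_repetition_penalty. For orientation, a sketch of how module-level parameters like these can be bundled into the config object that app.py splats into from_pretrained() with vars(); this GenerationConfig dataclass is illustrative, not the actual class in chatfuncs.py:

```python
# Illustrative bundling of the generation parameters above.
# vars(config) produces the **kwargs dict that app.py passes to
# ctransformers' AutoModelForCausalLM.from_pretrained().
from dataclasses import dataclass

@dataclass
class GenerationConfig:
    top_k: int = 3
    top_p: float = 1.0
    repetition_penalty: float = 1.3
    last_n_tokens: int = 64
    max_new_tokens: int = 256      # new value in this commit
    seed: int = 42
    reset: bool = False
    stream: bool = True
    batch_size: int = 256
    context_length: int = 2048     # new value in this commit

config = GenerationConfig()
print(vars(config))  # the dict splatted as **vars(config)
```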