From 59375244b68051d82989667c167417138a899e14 Mon Sep 17 00:00:00 2001 From: imClumsyPanda Date: Sat, 15 Apr 2023 20:01:36 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8D=20webui.py=20=E4=B8=AD=20llm?= =?UTF-8?q?=5Fhistory=5Flen=20=E5=92=8C=20vector=5Fsearch=5Ftop=5Fk=20?= =?UTF-8?q?=E6=98=BE=E7=A4=BA=E5=80=BC=E4=B8=8E=E5=90=AF=E5=8A=A8=E8=AE=BE?= =?UTF-8?q?=E7=BD=AE=E9=BB=98=E8=AE=A4=E5=80=BC=E4=B8=8D=E4=B8=80=E8=87=B4?= =?UTF-8?q?=E7=9A=84=E9=97=AE=E9=A2=98?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- chains/local_doc_qa.py | 5 +---- webui.py | 17 +++++++++++++---- 2 files changed, 14 insertions(+), 8 deletions(-) diff --git a/chains/local_doc_qa.py b/chains/local_doc_qa.py index 12489426..8b9cff99 100644 --- a/chains/local_doc_qa.py +++ b/chains/local_doc_qa.py @@ -11,14 +11,11 @@ import datetime from typing import List # return top-k text chunk from vector store -VECTOR_SEARCH_TOP_K = 10 +VECTOR_SEARCH_TOP_K = 6 # LLM input history length LLM_HISTORY_LEN = 3 -# Show reply with source text from input document -REPLY_WITH_SOURCE = True - class LocalDocQA: llm: object = None diff --git a/webui.py b/webui.py index b2ed760f..65c21d8e 100644 --- a/webui.py +++ b/webui.py @@ -4,6 +4,11 @@ import shutil from chains.local_doc_qa import LocalDocQA from configs.model_config import * +# return top-k text chunk from vector store +VECTOR_SEARCH_TOP_K = 6 + +# LLM input history length +LLM_HISTORY_LEN = 3 def get_file_list(): if not os.path.exists("content"): @@ -124,7 +129,7 @@ with gr.Blocks(css=block_css) as demo: interactive=True) llm_history_len = gr.Slider(0, 10, - value=3, + value=LLM_HISTORY_LEN, step=1, label="LLM history len", interactive=True) @@ -137,7 +142,7 @@ with gr.Blocks(css=block_css) as demo: interactive=True) top_k = gr.Slider(1, 20, - value=6, + value=VECTOR_SEARCH_TOP_K, step=1, label="向量匹配 top k", interactive=True) @@ -173,5 +178,9 @@ with gr.Blocks(css=block_css) as demo: [chatbot, query], ) -demo.queue(concurrency_count=3).launch( - server_name='0.0.0.0', share=False, inbrowser=False) +demo.queue(concurrency_count=3 + ).launch(server_name='0.0.0.0', + server_port=7860, + show_api=False, + share=False, + inbrowser=False)