File size: 2,699 Bytes
815128e
 
 
 
 
 
 
 
 
 
7f9d16c
99d65c0
 
815128e
 
 
 
 
 
 
 
ab49330
815128e
c815d49
99d65c0
a08dbb5
a766494
815128e
 
 
 
 
 
99d65c0
 
815128e
 
 
 
 
 
 
 
 
 
99d65c0
 
 
 
815128e
 
 
99d65c0
815128e
 
 
c2cb992
7f9d16c
815128e
c2cb992
815128e
 
c2cb992
7f9d16c
815128e
59fc6ec
25ef847
 
815128e
 
 
 
 
 
 
99d65c0
815128e
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
# LLM_MODEL_TYPE=openai
# LLM_MODEL_TYPE=gpt4all-j
# LLM_MODEL_TYPE=gpt4all
# LLM_MODEL_TYPE=llamacpp
LLM_MODEL_TYPE=huggingface
# LLM_MODEL_TYPE=mosaicml
# LLM_MODEL_TYPE=stablelm

OPENAI_API_KEY=

# if unset, default to "gpt-3.5-turbo"
OPENAI_MODEL_NAME=

# cpu, mps or cuda:0 - if unset, use whatever detected
HF_EMBEDDINGS_DEVICE_TYPE=
HF_PIPELINE_DEVICE_TYPE=

# uncomment one of the below to load corresponding quantized model
# LOAD_QUANTIZED_MODEL=4bit
# LOAD_QUANTIZED_MODEL=8bit

DISABLE_MODEL_PRELOADING=true
CHAT_HISTORY_ENABLED=true
SHOW_PARAM_SETTINGS=false
SHARE_GRADIO_APP=false
PDF_FILE_BASE_URL=https://ai-engd.netlify.app/pdfs/books/

# if unset, default to "hkunlp/instructor-xl"
HF_EMBEDDINGS_MODEL_NAME="hkunlp/instructor-large"

# number of cpu cores - used to set n_threads for GPT4ALL & LlamaCpp models
NUMBER_OF_CPU_CORES=

HUGGINGFACE_AUTH_TOKEN=

USING_TORCH_BFLOAT16=true
# HUGGINGFACE_MODEL_NAME_OR_PATH="databricks/dolly-v2-3b"
# HUGGINGFACE_MODEL_NAME_OR_PATH="databricks/dolly-v2-7b"
# HUGGINGFACE_MODEL_NAME_OR_PATH="databricks/dolly-v2-12b"

# LLM_MODEL_TYPE must be set to huggingface
# HUGGINGFACE_MODEL_NAME_OR_PATH="TheBloke/wizardLM-7B-HF"
# HUGGINGFACE_MODEL_NAME_OR_PATH="TheBloke/vicuna-7B-1.1-HF"
# HUGGINGFACE_MODEL_NAME_OR_PATH="nomic-ai/gpt4all-j"
# HUGGINGFACE_MODEL_NAME_OR_PATH="nomic-ai/gpt4all-falcon"
# HUGGINGFACE_MODEL_NAME_OR_PATH="lmsys/fastchat-t5-3b-v1.0"
HUGGINGFACE_MODEL_NAME_OR_PATH="meta-llama/Llama-2-7b-chat-hf"
# HUGGINGFACE_MODEL_NAME_OR_PATH="meta-llama/Llama-2-13b-chat-hf"
# HUGGINGFACE_MODEL_NAME_OR_PATH="meta-llama/Llama-2-70b-chat-hf"

STABLELM_MODEL_NAME_OR_PATH="OpenAssistant/stablelm-7b-sft-v7-epoch-3"

MOSAICML_MODEL_NAME_OR_PATH="mosaicml/mpt-7b-instruct"

FALCON_MODEL_NAME_OR_PATH="tiiuae/falcon-7b-instruct"

GPT4ALL_J_MODEL_PATH="../models/llama-2-7b-chat.ggmlv3.q4_K_M.bin"
GPT4ALL_J_DOWNLOAD_LINK=https://huggingface.co/TheBloke/Llama-2-7B-Chat-GGML/resolve/main/llama-2-7b-chat.ggmlv3.q4_0.bin

GPT4ALL_MODEL_PATH="../models/ggml-nous-gpt4-vicuna-13b.bin"
GPT4ALL_DOWNLOAD_LINK=https://gpt4all.io/models/ggml-nous-gpt4-vicuna-13b.bin

LLAMACPP_MODEL_PATH="../models/llama-2-7b-chat.ggmlv3.q4_K_M.bin"
LLAMACPP_DOWNLOAD_LINK=https://huggingface.co/TheBloke/Llama-2-7B-Chat-GGML/resolve/main/llama-2-7b-chat.ggmlv3.q4_K_M.bin

# Index for AI Books PDF files - chunk_size=1024 chunk_overlap=512
# CHROMADB_INDEX_PATH="./data/chromadb_1024_512/"
FAISS_INDEX_PATH="./data/faiss_1024_512/"

QUESTIONS_FILE_PATH="./data/questions.txt"

TOKENIZERS_PARALLELISM=true

# env variables for ingesting source PDF files
SOURCE_PDFS_PATH="./data/pdfs/"
SOURCE_URLS="./data/pci_dss_urls.txt"
CHUNCK_SIZE=1024
CHUNK_OVERLAP=512