-
Notifications
You must be signed in to change notification settings - Fork 1
/
config.ini
68 lines (59 loc) · 1.6 KB
/
config.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
# Language-model settings: which model to load and how to run generation.
[llm]
model_name : Llama-2-13b-chat
# Alternative model names: meta-llama/Llama-2-70b-chat-hf, Mixtral-8x7B-Instruct-v0.1
# Quantization label of the model weights.
quantization : Q5_K_M
# Backend used to run the model -- presumably the llama.cpp bindings; confirm in the loader.
pipeline : llama_cpp
# NOTE(review): device_map and task look like Hugging Face pipeline options;
# confirm whether they are read at all when pipeline is llama_cpp.
device_map : auto
task : text-generation
# Generation settings: output length cap and sampling temperature.
max_new_tokens : 1024
temperature : 0.1
# Batch size and context window size -- presumably both counted in tokens; TODO confirm.
n_batch : 1024
# NOTE(review): Llama 2 models were released with a 4096-token context window;
# confirm that 6000 is intended for the configured model.
n_ctx : 6000
# The number of layers to put on the GPU. Values noted for other models: Mixtral 18, gemma 20.
# -1 presumably means "offload all layers" (llama.cpp convention) -- confirm.
n_gpu_layers : -1
# NOTE(review): presumably toggles console output; exact meaning is not visible from this file.
std_out : True
# Disabled key: model directory located under root_path from the [root] section.
;base_dir : ${root:root_path}/models
# Connection and embedding settings for the Chroma client.
[chroma_client]
# Host and port the client connects to -- presumably a running Chroma server; confirm.
host : localhost
port : 8000
# Name of the collection to use.
collection_name : arxiv
# Alternative embedding setup, currently disabled.
# NOTE: if re-enabled and this file is read with Python configparser, drop the
# quotes around the model name -- configparser keeps them as part of the value.
# embedding_type : sentence-transformers
# embedding_model : "all-mpnet-base-v2"
# Active embedding setup.
embedding_type : instructor-embedding
embedding_model : hkunlp/instructor-xl
# Disabled keys; store_path would resolve under data_path from the [data] section.
;store_path : ${data:data_path}/vectordb
;allow_reset : True
# Storage and embedding settings for the Deep Lake client.
[deeplake_client]
# Name of the collection to use.
collection_name : arxiv
# Alternative embedding setup, currently disabled.
# NOTE: if re-enabled and this file is read with Python configparser, drop the
# quotes around the model name -- configparser keeps them as part of the value.
# embedding_type : sentence-transformers
# embedding_model : "all-mpnet-base-v2"
# Active embedding setup.
embedding_type : instructor-embedding
embedding_model : hkunlp/instructor-xl
# Vector store location, built from data_path in the [data] section.
# The ${section:key} form matches configparser's ExtendedInterpolation syntax.
store_path : ${data:data_path}/vectordb
# Document chunking settings.
[text_splitter]
# Size of each chunk and the overlap between consecutive chunks.
# Units (characters vs. tokens) depend on the splitter in use -- TODO confirm.
chunk_size : 5000
chunk_overlap : 400
# Settings for the multi-vector retriever and its document store.
[multivec_retriever]
# Alternative (disabled) relative location:
# store_path: data/docs
# Document store location, built from data_path in the [data] section.
store_path : ${data:data_path}/doc_store
# The namespace value below is this UUID written without hyphens:
# namespace: UUID(8c9040b0-b5cd-4d7c-bc2e-737da1b24ebf)
namespace : 8c9040b0b5cd4d7cbc2e737da1b24ebf
# Name of the key that holds a document's id -- presumably in chunk metadata; confirm.
id_key : doc_id
# Presumably the number of results returned per query -- confirm in the retriever code.
top_k : 3
# PDF parsing options.
[parse_pdf]
single_text_out : True
# NOTE(review): strategy, infer_table_structure and extract_images look like options of the
# `unstructured` PDF partitioner -- confirm against the parsing code.
strategy : hi_res
infer_table_structure : True
extract_images : True
# NOTE(review): with Python configparser this is the literal string "None", not a null
# value; confirm the reader converts it before using it as a directory.
image_output_dir : None
# Caption and table output toggles.
add_captions_to_text : True
add_captions_to_blocks : True
table_as_html : True
# Data directory; other sections reference it as ${data:data_path}.
[data]
# Built from root_path in the [root] section.
data_path : ${root:root_path}/data
# Location of the .env file.
[env]
# Built from root_path in the [root] section.
env_path : ${root:root_path}/.env
# Project root; other sections reference it as ${root:root_path}.
[root]
# Absolute, machine-specific path -- update it when running on a different host.
root_path : /home/ubuntu/volume_2k/Capstone_5
# Disabled section: llama.cpp location for quantization.
;[quantize]
;llama_cpp_path : ${root:root_path}