-
Notifications
You must be signed in to change notification settings - Fork 83
/
Copy pathconfig.yaml
63 lines (50 loc) · 1.4 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
# config.yaml
# Project metadata.
project:
  name: "Simba"
  # Quoted so the version is always read as a string.
  version: "1.0.0"
  # NOTE(review): looks like a URL path prefix for the API — confirm
  # against the code that consumes it.
  api_version: "/api/v1"
# Filesystem locations.
paths:
  base_dir: null  # Will be set programmatically
  # NOTE(review): the relative paths below are presumably resolved against
  # base_dir — confirm in the loader.
  faiss_index_dir: "vector_stores/faiss_index"
  vector_store_dir: "vector_stores"
# Language-model settings. The keys must stay nested under `llm`: names such
# as `provider`, `model_name` and `additional_params` would otherwise be
# duplicate top-level keys.
llm:
  provider: "openai"
  model_name: "gpt-4o-mini"
  temperature: 0.0
  max_tokens: null  # no value set in this file
  streaming: true
  # Explicit empty mapping; a bare `additional_params:` would parse as null.
  additional_params: {}
# Embedding-model settings.
embedding:
  provider: "huggingface"
  model_name: "BAAI/bge-base-en-v1.5"
  # Alternative model, kept for reference:
  # model_name: "openai/clip-vit-base-patch32"
  # NOTE(review): the previous comment on this line read "Changed from mps to
  # cpu for container compatibility", yet the value is still "mps". The value
  # is left unchanged here; confirm which device is intended.
  device: "mps"
  # Explicit empty mapping; a bare `additional_params:` would parse as null.
  additional_params: {}
# Vector-store backend settings.
vector_store:
  provider: "faiss"
  collection_name: "simba_collection"
  # Explicit empty mapping; a bare `additional_params:` would parse as null.
  additional_params: {}
# Document chunking settings.
# NOTE(review): the unit (characters vs. tokens) is not stated in this file —
# confirm against the splitter that reads these values.
chunking:
  chunk_size: 512
  chunk_overlap: 200
# Retrieval settings.
retrieval:
  # Options: default, semantic, keyword, hybrid, ensemble, reranked
  method: "hybrid"
  # NOTE(review): presumably the number of results to retrieve — confirm.
  k: 5
  # Method-specific parameters
  params:
    # Semantic retrieval parameters
    score_threshold: 0.5

    # Hybrid retrieval parameters
    prioritize_semantic: true

    # Ensemble retrieval parameters
    weights: [0.7, 0.3]  # Weights for semantic and keyword retrievers

    # Reranking parameters
    reranker_model: "colbert"
    reranker_threshold: 0.7
# Database configuration
database:
  provider: "litedb"  # Options: litedb, sqlite
  # Explicit empty mapping; a bare `additional_params:` would parse as null.
  additional_params: {}
# Celery connection URLs.
# NOTE(review): YAML itself does not expand `${VAR:-default}`; these values
# reach the application as literal strings unless the loader (or a
# pre-processing step) substitutes environment variables — confirm.
# They are quoted so they are always read as plain strings.
celery:
  broker_url: "${CELERY_BROKER_URL:-redis://redis:6379/0}"
  result_backend: "${CELERY_RESULT_BACKEND:-redis://redis:6379/1}"