File size: 819 Bytes
2754790
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3379e0a
 
 
 
a092eef
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# TheDataGuy Chat Configuration
# Copy this file to .env and fill in your values
# Format: one KEY=value pair per line; lines starting with '#' are comments.

# OpenAI API Key - Required for LLM and embeddings
# The value below is a placeholder: replace it with a real key, and do not commit the resulting .env.
# NOTE(review): EMBEDDING_MODEL in this file names a Snowflake model, not an OpenAI one -
# confirm whether the key is actually needed for embeddings.
OPENAI_API_KEY=your_openai_api_key_here

# Vector Store Configuration
# VECTOR_STORAGE_PATH is a relative path; presumably resolved against the process's
# working directory - TODO confirm.
# QDRANT_COLLECTION is presumably the name of a Qdrant collection (judging by the key
# name) - verify against the consumer.
VECTOR_STORAGE_PATH=./db/vector_store_tdg
QDRANT_COLLECTION=thedataguy_documents

# Model Configuration
# EMBEDDING_MODEL is written as an "org/name" identifier (presumably a Hugging Face
# model id - confirm).
# NOTE(review): LLM_TEMPERATURE=0 presumably requests the least random output from
# LLM_MODEL - confirm how the consumer parses and applies it.
EMBEDDING_MODEL=Snowflake/snowflake-arctic-embed-l
LLM_MODEL=gpt-4o-mini
LLM_TEMPERATURE=0

# For evaluation and synthetic data generation (optional)
# Presumably SDG_ = synthetic data generation and EVAL_ = evaluation (going by the
# heading above); both are set to the same model in this template.
SDG_LLM_MODEL=gpt-4.1
EVAL_LLM_MODEL=gpt-4.1

# Blog Configuration
# Both values end with a trailing slash; keep it when editing in case the consumer
# builds paths/URLs by plain concatenation (TODO confirm).
DATA_DIR=data/
BLOG_BASE_URL=https://thedataguy.pro/blog/

# Search Configuration
# NOTE(review): presumably the maximum number of results returned per search - confirm.
MAX_SEARCH_RESULTS=5

# Document Chunking Configuration
# NOTE(review): units (characters vs. tokens) are not stated in this file - confirm
# against the consumer. CHUNK_OVERLAP should presumably stay smaller than CHUNK_SIZE.
CHUNK_SIZE=1000
CHUNK_OVERLAP=200

# Vector Database Creation Configuration
# Boolean flags in this template are spelled capitalized (True/False); keep that
# spelling unless the consumer is known to accept other forms.
# NOTE(review): presumably FORCE_RECREATE rebuilds an existing store, USE_CHUNKING
# toggles the chunking settings in this file, and SHOULD_SAVE_STATS writes to
# OUTPUT_DIR - confirm each against the consumer.
FORCE_RECREATE=False
OUTPUT_DIR=./stats
USE_CHUNKING=True
SHOULD_SAVE_STATS=True