# TheDataGuy Chat Configuration
# Copy this file to .env and fill in your values.
# Keep the real .env out of version control; it will contain your API key.
# Format: one KEY=value pair per line, comments on their own lines.

# OpenAI API Key - Required for LLM and embeddings
OPENAI_API_KEY=your_openai_api_key_here

# Vector Store Configuration
VECTOR_STORAGE_PATH=./db/vector_store_tdg
QDRANT_COLLECTION=thedataguy_documents

# Model Configuration
EMBEDDING_MODEL=Snowflake/snowflake-arctic-embed-l
LLM_MODEL=gpt-4o-mini
LLM_TEMPERATURE=0

# For evaluation and synthetic data generation (optional)
SDG_LLM_MODEL=gpt-4.1
EVAL_LLM_MODEL=gpt-4.1

# Blog Configuration
DATA_DIR=data/
BLOG_BASE_URL=https://thedataguy.pro/blog/

# Search Configuration
MAX_SEARCH_RESULTS=5

# Document Chunking Configuration
# NOTE(review): units for CHUNK_SIZE / CHUNK_OVERLAP (characters vs. tokens)
# are defined by the consuming code - confirm before tuning.
CHUNK_SIZE=1000
CHUNK_OVERLAP=200

# Vector Database Creation Configuration
FORCE_RECREATE=False
OUTPUT_DIR=./stats
USE_CHUNKING=True
SHOULD_SAVE_STATS=True