# enhanced-rag-demo/config/default.yaml
# Arthur Passuello
# initial commit
# 5e1a30c
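# Epic 2 Configuration with Graph Enhancement - Calibration Ready
# This config is intended to enable graph enhancement, with all parameters
# registered for calibration.
# NOTE(review): the retriever settings in this file use plain RRF fusion and an
# identity reranker; no graph-specific keys are visible — confirm this header
# still describes the file.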
# Document processor: selects the component that handles input files and
# controls how their text is split into chunks.
document_processor:
  type: "hybrid_pdf"
  config:
    # Size of each chunk and the overlap shared by consecutive chunks.
    # NOTE(review): units (characters vs. tokens) are not stated here — confirm
    # against the processor implementation.
    chunk_size: 1024
    chunk_overlap: 128
# High-performance embedder for Epic 2.
# A "modular" embedder assembled from three sub-components, each with its own
# type/config pair: the embedding model, the batch processor, and the cache.
embedder:
  type: "modular"
  config:
    # Embedding model.
    model:
      type: "sentence_transformer"
      config:
        model_name: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1"
        # NOTE(review): "mps" presumably selects the Apple-silicon GPU backend;
        # confirm how this behaves on hosts without MPS support.
        device: "mps"
        normalize_embeddings: true

    # Batching: starts at initial_batch_size and is capped at max_batch_size.
    batch_processor:
      type: "dynamic"
      config:
        initial_batch_size: 64
        max_batch_size: 256
        optimize_for_memory: false

    # In-memory embedding cache, bounded by entry count and memory budget.
    cache:
      type: "memory"
      config:
        max_entries: 100000
        max_memory_mb: 1024
# Epic 2 with Graph Enhancement - All Parameters Calibration-Ready
# Unified retriever built from four sub-components: a dense vector index, a
# sparse (BM25) retriever, a fusion strategy, and a reranker.
# NOTE(review): despite the "Graph Enhancement" title, the fusion and reranker
# below are the basic RRF / identity variants — confirm this is intended.
retriever:
  type: "modular_unified"
  config:
    min_semantic_alignment: 0.2

    # Dense retrieval: FAISS inner-product index over normalized embeddings.
    vector_index:
      type: "faiss"
      config:
        index_type: "IndexFlatIP"
        normalize_embeddings: true
        metric: "cosine"

    # Sparse retrieval: BM25 with stop-word filtering.
    sparse:
      type: "bm25"
      config:
        k1: 1.2  # Calibration parameter
        b: 0.75  # Calibration parameter (original "problematic" value)
        lowercase: true
        filter_stop_words: true
        stop_word_sets: ["english_common"]
        preserve_technical_terms: true

    # Basic RRF Fusion (default configuration)
    fusion:
      type: "rrf"
      config:
        k: 60  # RRF discriminative power
        # Relative weights of the dense and sparse result lists (sum to 1.0).
        weights:
          dense: 0.7  # Dense weight
          sparse: 0.3  # Sparse weight

    # Basic Identity Reranker (no reranking)
    reranker:
      type: "identity"
      config:
        enabled: false
# Mock answer generation for testing.
# Adaptive modular generator built from an LLM client, a prompt builder, a
# response parser, and a confidence scorer. The LLM client is a mock, so this
# configuration does not name a real model backend.
answer_generator:
  type: "adaptive_modular"
  config:
    llm_client:
      type: "mock"
      config:
        model_name: "mock-llm-for-testing"
        response_pattern: "technical"
        include_citations: true

    # Generation settings.
    # NOTE(review): the source's indentation was lost, so it is ambiguous
    # whether these three keys belong here (generator level) or inside
    # llm_client.config — confirm against the consumer's schema.
    temperature: 0.3
    max_tokens: 1024
    confidence_threshold: 0.85  # Calibration parameter

    prompt_builder:
      type: "simple"
      config:
        max_context_length: 12000
        include_instructions: true
        citation_style: "inline"

    response_parser:
      type: "markdown"
      config:
        preserve_formatting: true
        extract_citations: true

    # Semantic confidence scorer; the three weights sum to 1.0.
    confidence_scorer:
      type: "semantic"
      config:
        relevance_weight: 0.4
        grounding_weight: 0.4
        quality_weight: 0.2
# Global settings: logging level, caching and monitoring switches, and the
# cap on concurrent requests.
global_settings:
  log_level: "INFO"
  cache_enabled: true
  performance_monitoring: true
  max_concurrent_requests: 8