Spaces:
Running
Running
# Epic 2 Configuration with Graph Enhancement - Calibration Ready | |
# This config enables graph enhancement with all parameters registered for calibration | |
# Document processor for handling input files | |
document_processor: | |
type: "hybrid_pdf" | |
config: | |
chunk_size: 1024 | |
chunk_overlap: 128 | |
# High-performance embedder for Epic 2 | |
embedder: | |
type: "modular" | |
config: | |
model: | |
type: "sentence_transformer" | |
config: | |
model_name: "sentence-transformers/multi-qa-MiniLM-L6-cos-v1" | |
device: "mps" | |
normalize_embeddings: true | |
batch_processor: | |
type: "dynamic" | |
config: | |
initial_batch_size: 64 | |
max_batch_size: 256 | |
optimize_for_memory: false | |
cache: | |
type: "memory" | |
config: | |
max_entries: 100000 | |
max_memory_mb: 1024 | |
# Epic 2 with Graph Enhancement - All Parameters Calibration-Ready | |
retriever: | |
type: "modular_unified" | |
config: | |
min_semantic_alignment: 0.2 | |
vector_index: | |
type: "faiss" | |
config: | |
index_type: "IndexFlatIP" | |
normalize_embeddings: true | |
metric: "cosine" | |
sparse: | |
type: "bm25" | |
config: | |
k1: 1.2 # Calibration parameter | |
b: 0.75 # Calibration parameter (original "problematic" value) | |
lowercase: true | |
filter_stop_words: true | |
stop_word_sets: ["english_common"] | |
preserve_technical_terms: true | |
# Basic RRF Fusion (default configuration) | |
fusion: | |
type: "rrf" | |
config: | |
k: 60 # RRF discriminative power | |
weights: | |
dense: 0.7 # Dense weight | |
sparse: 0.3 # Sparse weight | |
# Basic Identity Reranker (no reranking) | |
reranker: | |
type: "identity" | |
config: | |
enabled: false | |
# Mock answer generation for testing | |
answer_generator: | |
type: "adaptive_modular" | |
config: | |
llm_client: | |
type: "mock" | |
config: | |
model_name: "mock-llm-for-testing" | |
response_pattern: "technical" | |
include_citations: true | |
temperature: 0.3 | |
max_tokens: 1024 | |
confidence_threshold: 0.85 # Calibration parameter | |
prompt_builder: | |
type: "simple" | |
config: | |
max_context_length: 12000 | |
include_instructions: true | |
citation_style: "inline" | |
response_parser: | |
type: "markdown" | |
config: | |
preserve_formatting: true | |
extract_citations: true | |
confidence_scorer: | |
type: "semantic" | |
config: | |
relevance_weight: 0.4 | |
grounding_weight: 0.4 | |
quality_weight: 0.2 | |
# Global settings | |
global_settings: | |
log_level: "INFO" | |
cache_enabled: true | |
performance_monitoring: true | |
max_concurrent_requests: 8 |