Spaces:
Running
Running
# AI Knowledge Distillation Platform Configuration | |
# تكوين منصة تقطير المعرفة للذكاء الاصطناعي | |
# System Configuration | |
system: | |
# Memory management settings | |
memory: | |
max_memory_gb: 14.0 # Maximum memory usage (leave 2GB for system) | |
chunk_size_mb: 500.0 # Chunk size for large model loading | |
cleanup_threshold: 0.85 # Memory usage threshold for cleanup | |
emergency_threshold: 0.95 # Emergency cleanup threshold | |
# CPU optimization settings | |
cpu: | |
max_threads: 8 # Maximum number of threads | |
use_intel_extension: true # Use Intel Extension for PyTorch if available | |
enable_mkl: true # Enable Intel MKL | |
enable_openmp: true # Enable OpenMP | |
# Storage settings | |
storage: | |
cache_dir: "./cache" | |
models_dir: "./models" | |
database_dir: "./database" | |
logs_dir: "./logs" | |
temp_dir: "./temp" | |
max_cache_size_gb: 20.0 # Maximum cache size | |
# Model Loading Configuration | |
models: | |
# Default settings for model loading | |
default_settings: | |
torch_dtype: "float32" # Use float32 for CPU | |
low_cpu_mem_usage: true | |
device_map: "cpu" | |
trust_remote_code: false | |
# Chunk loading settings | |
chunk_loading: | |
enabled: true | |
max_chunk_size_mb: 500.0 | |
max_cached_chunks: 3 | |
auto_cleanup: true | |
# Supported model types | |
supported_formats: | |
- ".pt" | |
- ".pth" | |
- ".bin" | |
- ".safetensors" | |
# Model size limits | |
size_limits: | |
small_model_mb: 1000 # Models under 1GB load normally | |
large_model_mb: 2000 # Models over 2GB use chunking | |
# Training Configuration | |
training: | |
# Default training parameters | |
default_params: | |
learning_rate: 0.0001 | |
batch_size: 4 # Small batch size for memory efficiency | |
max_steps: 1000 | |
temperature: 3.0 | |
alpha: 0.7 | |
save_steps: 100 | |
eval_steps: 50 | |
# Memory optimization during training | |
memory_optimization: | |
gradient_accumulation_steps: 4 | |
gradient_checkpointing: true | |
mixed_precision: false # Disable for CPU | |
dataloader_num_workers: 2 | |
# Medical Datasets Configuration | |
medical: | |
# Supported medical datasets | |
datasets: | |
roco_v2: | |
repo_id: "eltorio/ROCOv2-radiology" | |
streaming_supported: true | |
estimated_size_gb: 8.5 | |
ct_rate: | |
repo_id: "ibrahimhamamci/CT-RATE" | |
streaming_supported: true | |
estimated_size_gb: 12.3 | |
umie_datasets: | |
repo_id: "lion-ai/umie_datasets" | |
streaming_supported: true | |
estimated_size_gb: 15.7 | |
# DICOM processing settings | |
dicom: | |
memory_limit_mb: 1000.0 | |
default_window_center: 40 | |
default_window_width: 400 | |
default_output_size: [512, 512] | |
# Medical preprocessing settings | |
preprocessing: | |
target_size: [512, 512] | |
normalize_images: true | |
enhance_contrast: true | |
# Token Management Configuration | |
tokens: | |
# Encryption settings | |
encryption: | |
key_file: ".token_key" | |
algorithm: "Fernet" | |
# Token types and their properties | |
types: | |
read: | |
security_level: "medium" | |
recommended_for: "development" | |
write: | |
security_level: "high" | |
recommended_for: "production" | |
fine_grained: | |
security_level: "very_high" | |
recommended_for: "enterprise" | |
# Database Configuration | |
database: | |
# SQLite settings | |
sqlite: | |
database_dir: "./database" | |
backup_interval_hours: 24 | |
cleanup_days: 30 | |
# Connection settings | |
connection: | |
timeout: 30 | |
check_same_thread: false | |
# Web Server Configuration | |
server: | |
# FastAPI settings | |
host: "0.0.0.0" | |
port: 8000 | |
workers: 1 # Single worker for memory efficiency | |
reload: false | |
# CORS settings | |
cors: | |
allow_origins: ["*"] | |
allow_methods: ["GET", "POST", "PUT", "DELETE"] | |
allow_headers: ["*"] | |
# Upload settings | |
uploads: | |
max_file_size_mb: 5000 # 5GB max file size | |
allowed_extensions: [".pt", ".pth", ".bin", ".safetensors"] | |
temp_dir: "./temp" | |
# Logging Configuration | |
logging: | |
# Log levels | |
level: "INFO" | |
format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s" | |
# File logging | |
file: | |
enabled: true | |
filename: "logs/app.log" | |
max_size_mb: 100 | |
backup_count: 5 | |
# Console logging | |
console: | |
enabled: true | |
level: "INFO" | |
# Specific logger levels | |
loggers: | |
uvicorn: "INFO" | |
transformers: "WARNING" | |
datasets: "WARNING" | |
torch: "WARNING" | |
# Performance Monitoring | |
monitoring: | |
# System metrics collection | |
system_metrics: | |
enabled: true | |
interval_seconds: 30 | |
store_in_database: true | |
# Memory monitoring | |
memory_monitoring: | |
enabled: true | |
alert_threshold: 0.85 | |
emergency_threshold: 0.95 | |
# Performance recommendations | |
recommendations: | |
enabled: true | |
check_interval_minutes: 5 | |
# Security Configuration | |
security: | |
# Token validation | |
token_validation: | |
enabled: true | |
cache_results: true | |
cache_duration_minutes: 60 | |
# File upload security | |
file_uploads: | |
scan_uploads: true | |
max_file_size_mb: 5000 | |
allowed_mime_types: | |
- "application/octet-stream" | |
- "application/x-pytorch" | |
# Feature Flags | |
features: | |
# Advanced features | |
memory_management: true | |
chunk_loading: true | |
cpu_optimization: true | |
medical_datasets: true | |
token_management: true | |
# Experimental features | |
experimental: | |
auto_model_optimization: true | |
progressive_loading: true | |
smart_caching: true | |
# Environment-specific overrides | |
environments: | |
development: | |
logging: | |
level: "DEBUG" | |
server: | |
reload: true | |
production: | |
logging: | |
level: "INFO" | |
server: | |
reload: false | |
security: | |
token_validation: | |
enabled: true | |