File size: 1,594 Bytes
454e47c ea0b2a0 454e47c ea0b2a0 454e47c ea0b2a0 454e47c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 |
"""
Distiller package for code-specialized embedding model distillation and evaluation.

This package provides a complete pipeline for:

1. Distilling code-specialized embedding models using Model2Vec
2. Comprehensive evaluation including CodeSearchNet and performance benchmarks
3. Analysis and reporting of model performance

Main modules:

- distill: Model2Vec distillation with optional advanced training
- evaluate: Comprehensive evaluation (CodeSearchNet + performance benchmarks)
- analyze: Analysis and reporting tools
- config: Centralized configuration management
- beam_utils: Beam cloud utilities for distributed processing

Usage:

    from distiller import distill, evaluate, analyze
"""
from . import analyze, config, distill, evaluate
from .analyze import CodeSearchNetAnalyzer
from .config import (
BEAM_ENV_SETTINGS,
DEFAULT_EVALUATION_MODELS,
IMAGE,
codesearchnet_config,
directories,
distillation_config,
get_volume_config,
languages_config,
)
from .distill import (
run_beam_distillation,
run_local_distillation,
)
from .evaluate import (
CodeSearchNetEvaluator,
ComprehensiveModelEvaluator,
run_evaluation,
)
# Public API of the package: the names bound by `from distiller import *`.
# Every entry is imported at the top of this file.
# NOTE: entries are kept in sorted (ASCII) order, so the group comments below
# describe where each run of names comes from rather than strict categories.
__all__ = [
# Upper-case names imported from .config
"BEAM_ENV_SETTINGS",
"DEFAULT_EVALUATION_MODELS",
"IMAGE",
# CamelCase names imported from .analyze (CodeSearchNetAnalyzer) and
# .evaluate (the two evaluators) -- presumably classes
"CodeSearchNetAnalyzer",
"CodeSearchNetEvaluator",
"ComprehensiveModelEvaluator",
# Submodules (analyze, config, distill, evaluate) interleaved with the
# lower-case names imported from .config (codesearchnet_config, directories,
# distillation_config, get_volume_config, languages_config)
"analyze",
"codesearchnet_config",
"config",
"directories",
"distill",
"distillation_config",
"evaluate",
"get_volume_config",
"languages_config",
# run_* names: run_beam_distillation / run_local_distillation come from
# .distill, run_evaluation comes from .evaluate
"run_beam_distillation",
"run_evaluation",
"run_local_distillation",
]
|