|
{ |
|
"config": { |
|
"batch_size": 16, |
|
"cost_coefficients": {}, |
|
"cost_function_type": "separable", |
|
"device_map": "auto", |
|
"early_stopping_patience": 3, |
|
"enable_strategic_mode": false, |
|
"epochs": 10, |
|
"ewc_lambda": 100.0, |
|
"gradient_checkpointing": false, |
|
"learning_rate": 2e-05, |
|
"max_examples_per_class": 150, |
|
"max_length": 512, |
|
"min_confidence": 0.1, |
|
"min_examples_per_class": 3, |
|
"neural_weight": 0.4, |
|
"num_representative_examples": 5, |
|
"prototype_update_frequency": 10, |
|
"prototype_weight": 0.6, |
|
"quantization": null, |
|
"similarity_threshold": 0.7, |
|
"strategic_blend_regular_weight": 0.6, |
|
"strategic_blend_strategic_weight": 0.4, |
|
"strategic_lambda": 0.1, |
|
"strategic_prediction_head_weight": 0.5, |
|
"strategic_prediction_proto_weight": 0.5, |
|
"strategic_robust_head_weight": 0.2, |
|
"strategic_robust_proto_weight": 0.8, |
|
"strategic_training_frequency": 10, |
|
"warmup_steps": 0 |
|
}, |
|
"embedding_dim": 768, |
|
"id_to_label": { |
|
"0": "poor_quality", |
|
"1": "high_quality" |
|
}, |
|
"label_to_id": { |
|
"high_quality": 1, |
|
"poor_quality": 0 |
|
}, |
|
"model_name": "answerdotai/ModernBERT-base", |
|
"train_steps": 6 |
|
} |