File size: 1,249 Bytes
48b24d3 789527d 48b24d3 789527d 48b24d3 789527d 48b24d3 81cc47c 789527d 48b24d3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 |
{
"config": {
"batch_size": 16,
"cost_coefficients": {},
"cost_function_type": "separable",
"device_map": "auto",
"early_stopping_patience": 3,
"enable_strategic_mode": false,
"epochs": 10,
"ewc_lambda": 100.0,
"gradient_checkpointing": false,
"learning_rate": 0.0005,
"max_examples_per_class": 500,
"max_length": 512,
"min_confidence": 0.1,
"min_examples_per_class": 3,
"neural_weight": 0.2,
"num_representative_examples": 5,
"prototype_update_frequency": 50,
"prototype_weight": 0.8,
"quantization": null,
"similarity_threshold": 0.7,
"strategic_blend_regular_weight": 0.6,
"strategic_blend_strategic_weight": 0.4,
"strategic_lambda": 0.1,
"strategic_prediction_head_weight": 0.5,
"strategic_prediction_proto_weight": 0.5,
"strategic_robust_head_weight": 0.2,
"strategic_robust_proto_weight": 0.8,
"strategic_training_frequency": 10,
"warmup_steps": 0
},
"embedding_dim": 768,
"id_to_label": {
"0": "HIGH",
"1": "LOW"
},
"label_to_id": {
"HIGH": 0,
"LOW": 1
},
"model_name": "distilbert/distilbert-base-cased",
"train_steps": 3688,
"training_history": {
"HIGH": 29504,
"LOW": 29504
}
} |