dialogsum-ru-intent-rubert / multitask_config.json
ozonize's picture
Update artifacts from notebook 11: multitask_config.json
60f2d48 verified
{
"model_name": "DeepPavlov/rubert-base-cased-conversational",
"max_len": 128,
"batch_size": 16,
"epochs": 10,
"lr": 2e-05,
"weight_decay": 0.01,
"use_uncertainty_weighting": false,
"use_coarse_topic_head": true,
"lambda_intent": 1.0,
"lambda_topic": 0.1,
"lambda_coarse_topic": 0.1,
"class_weight_mode": "sqrt",
"class_weight_power": 0.5,
"detach_topic_grad": true,
"detach_coarse_topic_grad": false,
"top_n_clusters": 10,
"min_intent_count": 20,
"max_samples": null,
"freeze_encoder": false,
"use_class_weights": true,
"patience": 2,
"run_ablation": false,
"ablation_lambdas": [
0.1,
1.0
],
"active_learning_candidate_pool": 500,
"active_learning_top_n": 100,
"active_learning_max_per_pred_intent": 15,
"active_learning_max_per_cluster": 15,
"random_state": 42,
"num_intents": 14,
"num_topics": 10,
"num_coarse_topics": 5,
"intent_classes": [
"arrangement",
"complaint",
"confirmation",
"farewell",
"greeting",
"informational_request",
"opinion_or_preference",
"other",
"problem_report",
"purchase_or_booking_request",
"rejection",
"service_request",
"suggestion_or_recommendation",
"thanks"
],
"topic_classes": [
28,
77,
114,
145,
169,
186,
187,
202,
204,
206
],
"coarse_topic_classes": [
"дом_сервис",
"жалобы_проблемы",
"культура_досуг",
"путешествия_сервис",
"работа_образование"
],
"used_fallback_weak_labels": false,
"device": "cuda",
"train_size": 3007,
"val_size": 645,
"test_size": 645
}