veryfansome committed on
Commit
5e7aec5
·
1 Parent(s): 84c7b94

Added training command

Browse files
models/ud_ewt_gum_pud_20250610/README.md CHANGED
@@ -326,6 +326,7 @@ weighted avg 1.00 0.99 1.00 54358
326
 
327
  ## Training logs
328
  ```
 
329
  {'loss': 167.3008, 'grad_norm': 78.67291259765625, 'learning_rate': 1.3605442176870749e-05, 'epoch': 0.68}
330
  {'eval_loss': 6.9092020988464355, 'eval_f1_macro': 0.3894647498221998, 'eval_xpos_accuracy': 0.4056051740067755, 'eval_xpos_precision_macro': 0.07715923171265232, 'eval_xpos_recall_macro': 0.09578323169321702, 'eval_xpos_f1_macro': 0.06760571983122861, 'eval_xpos_precision_micro': 0.4056051740067755, 'eval_xpos_recall_micro': 0.4056051740067755, 'eval_xpos_f1_micro': 0.4056051740067755, 'eval_deprel_accuracy': 0.39214659685863873, 'eval_deprel_precision_macro': 0.06449934886885347, 'eval_deprel_recall_macro': 0.10861127424632379, 'eval_deprel_f1_macro': 0.07442277240270408, 'eval_deprel_precision_micro': 0.39214659685863873, 'eval_deprel_recall_micro': 0.39214659685863873, 'eval_deprel_f1_micro': 0.39214659685863873, 'eval_pos_accuracy': 0.6299045272559286, 'eval_pos_precision_macro': 0.3789462822637483, 'eval_pos_recall_macro': 0.3314686217408947, 'eval_pos_f1_macro': 0.2862715500361932, 'eval_pos_precision_micro': 0.6299045272559286, 'eval_pos_recall_micro': 0.6299045272559286, 'eval_pos_f1_micro': 0.6299045272559286, 'eval_Abbr_accuracy': 0.9993840468124423, 'eval_Abbr_precision_macro': 0.49969202340622115, 'eval_Abbr_recall_macro': 0.5, 'eval_Abbr_f1_macro': 0.4998459642637092, 'eval_Abbr_precision_micro': 0.9993840468124423, 'eval_Abbr_recall_micro': 0.9993840468124423, 'eval_Abbr_f1_micro': 0.9993840468124423, 'eval_Case_accuracy': 0.9816445950107792, 'eval_Case_precision_macro': 0.6237830971493706, 'eval_Case_recall_macro': 0.5995542599176837, 'eval_Case_f1_macro': 0.6108994481245369, 'eval_Case_precision_micro': 0.9816445950107792, 'eval_Case_recall_micro': 0.9816445950107792, 'eval_Case_f1_micro': 0.9816445950107792, 'eval_Definite_accuracy': 0.9671388974437942, 'eval_Definite_precision_macro': 0.570645217925757, 'eval_Definite_recall_macro': 0.5851893604042604, 'eval_Definite_f1_macro': 0.5778223477074399, 'eval_Definite_precision_micro': 0.9671388974437942, 'eval_Definite_recall_micro': 0.9671388974437942, 'eval_Definite_f1_micro': 0.9671388974437942, 
'eval_Degree_accuracy': 0.9235294117647059, 'eval_Degree_precision_macro': 0.48088176414426065, 'eval_Degree_recall_macro': 0.25010931351114996, 'eval_Degree_f1_macro': 0.24027937527607288, 'eval_Degree_precision_micro': 0.9235294117647059, 'eval_Degree_recall_micro': 0.9235294117647059, 'eval_Degree_f1_micro': 0.9235294117647059, 'eval_Foreign_accuracy': 0.9999384046812442, 'eval_Foreign_precision_macro': 0.4999692023406221, 'eval_Foreign_recall_macro': 0.5, 'eval_Foreign_f1_macro': 0.49998460069604855, 'eval_Foreign_precision_micro': 0.9999384046812442, 'eval_Foreign_recall_micro': 0.9999384046812442, 'eval_Foreign_f1_micro': 0.9999384046812442, 'eval_Gender_accuracy': 0.9816137973514013, 'eval_Gender_precision_macro': 0.24545636570865292, 'eval_Gender_recall_macro': 0.24994510664993727, 'eval_Gender_f1_macro': 0.2476804003543509, 'eval_Gender_precision_micro': 0.9816137973514013, 'eval_Gender_recall_micro': 0.9816137973514013, 'eval_Gender_f1_micro': 0.9816137973514013, 'eval_Mood_accuracy': 0.9319063751154912, 'eval_Mood_precision_macro': 0.6387004043049438, 'eval_Mood_recall_macro': 0.3883744843777621, 'eval_Mood_f1_macro': 0.41581031611224173, 'eval_Mood_precision_micro': 0.9319063751154912, 'eval_Mood_recall_micro': 0.9319063751154912, 'eval_Mood_f1_micro': 0.9319063751154912, 'eval_NumType_accuracy': 0.9828765013858947, 'eval_NumType_precision_macro': 0.24571912534647367, 'eval_NumType_recall_macro': 0.25, 'eval_NumType_f1_macro': 0.24784107852882703, 'eval_NumType_precision_micro': 0.9828765013858947, 'eval_NumType_recall_micro': 0.9828765013858947, 'eval_NumType_f1_micro': 0.9828765013858947, 'eval_Number_accuracy': 0.8546966430551278, 'eval_Number_precision_macro': 0.8775308105441524, 'eval_Number_recall_macro': 0.5982683704051597, 'eval_Number_f1_macro': 0.5746129222413208, 'eval_Number_precision_micro': 0.8546966430551278, 'eval_Number_recall_micro': 0.8546966430551278, 'eval_Number_f1_micro': 0.8546966430551278, 'eval_Person_accuracy': 
0.9288882044964583, 'eval_Person_precision_macro': 0.60663366254716, 'eval_Person_recall_macro': 0.34372242024231814, 'eval_Person_f1_macro': 0.35067286612707, 'eval_Person_precision_micro': 0.9288882044964583, 'eval_Person_recall_micro': 0.9288882044964583, 'eval_Person_f1_micro': 0.9288882044964583, 'eval_Polarity_accuracy': 0.9957191253464737, 'eval_Polarity_precision_macro': 0.49785956267323683, 'eval_Polarity_recall_macro': 0.5, 'eval_Polarity_f1_macro': 0.4989274856869493, 'eval_Polarity_precision_micro': 0.9957191253464737, 'eval_Polarity_recall_micro': 0.9957191253464737, 'eval_Polarity_f1_micro': 0.9957191253464737, 'eval_PronType_accuracy': 0.9723129042192793, 'eval_PronType_precision_macro': 0.4836619126413276, 'eval_PronType_recall_macro': 0.49156583018410926, 'eval_PronType_f1_macro': 0.4875445572326604, 'eval_PronType_precision_micro': 0.9723129042192793, 'eval_PronType_recall_micro': 0.9723129042192793, 'eval_PronType_f1_micro': 0.9723129042192793, 'eval_Poss_accuracy': 0.9857098860486603, 'eval_Poss_precision_macro': 0.49285494302433014, 'eval_Poss_recall_macro': 0.5, 'eval_Poss_f1_macro': 0.49640176189589924, 'eval_Poss_precision_micro': 0.9857098860486603, 'eval_Poss_recall_micro': 0.9857098860486603, 'eval_Poss_f1_micro': 0.9857098860486603, 'eval_Reflex_accuracy': 0.9991376655374191, 'eval_Reflex_precision_macro': 0.49956883276870956, 'eval_Reflex_recall_macro': 0.5, 'eval_Reflex_f1_macro': 0.49978432339166873, 'eval_Reflex_precision_micro': 0.9991376655374191, 'eval_Reflex_recall_micro': 0.9991376655374191, 'eval_Reflex_f1_micro': 0.9991376655374191, 'eval_Tense_accuracy': 0.9044040652910379, 'eval_Tense_precision_macro': 0.3014680217636793, 'eval_Tense_recall_macro': 0.3333333333333333, 'eval_Tense_f1_macro': 0.31660090130883844, 'eval_Tense_precision_micro': 0.9044040652910379, 'eval_Tense_recall_micro': 0.9044040652910379, 'eval_Tense_f1_micro': 0.9044040652910379, 'eval_VerbForm_accuracy': 0.8764705882352941, 
'eval_VerbForm_precision_macro': 0.34036124720280947, 'eval_VerbForm_recall_macro': 0.2824085711629648, 'eval_VerbForm_f1_macro': 0.29697279356566025, 'eval_VerbForm_precision_micro': 0.8764705882352941, 'eval_VerbForm_recall_micro': 0.8764705882352941, 'eval_VerbForm_f1_micro': 0.8764705882352941, 'eval_Voice_accuracy': 0.9972590083153681, 'eval_Voice_precision_macro': 0.49862950415768403, 'eval_Voice_recall_macro': 0.5, 'eval_Voice_f1_macro': 0.49931381166057576, 'eval_Voice_precision_micro': 0.9972590083153681, 'eval_Voice_recall_micro': 0.9972590083153681, 'eval_Voice_f1_micro': 0.9972590083153681, 'eval_runtime': 260.5761, 'eval_samples_per_second': 9.183, 'eval_steps_per_second': 4.594, 'epoch': 0.68}
331
  {'loss': 40.7431, 'grad_norm': 33.708248138427734, 'learning_rate': 1.919879062736206e-05, 'epoch': 1.35}
 
326
 
327
  ## Training logs
328
  ```
329
+ $ python -m multi_head_trainer --data-path dataset/ud_ewt_gum_pud_20250610 --save-path models/ud_ewt_gum_pud_20250610 --from-base microsoft/deberta-v3-base --train
330
  {'loss': 167.3008, 'grad_norm': 78.67291259765625, 'learning_rate': 1.3605442176870749e-05, 'epoch': 0.68}
331
  {'eval_loss': 6.9092020988464355, 'eval_f1_macro': 0.3894647498221998, 'eval_xpos_accuracy': 0.4056051740067755, 'eval_xpos_precision_macro': 0.07715923171265232, 'eval_xpos_recall_macro': 0.09578323169321702, 'eval_xpos_f1_macro': 0.06760571983122861, 'eval_xpos_precision_micro': 0.4056051740067755, 'eval_xpos_recall_micro': 0.4056051740067755, 'eval_xpos_f1_micro': 0.4056051740067755, 'eval_deprel_accuracy': 0.39214659685863873, 'eval_deprel_precision_macro': 0.06449934886885347, 'eval_deprel_recall_macro': 0.10861127424632379, 'eval_deprel_f1_macro': 0.07442277240270408, 'eval_deprel_precision_micro': 0.39214659685863873, 'eval_deprel_recall_micro': 0.39214659685863873, 'eval_deprel_f1_micro': 0.39214659685863873, 'eval_pos_accuracy': 0.6299045272559286, 'eval_pos_precision_macro': 0.3789462822637483, 'eval_pos_recall_macro': 0.3314686217408947, 'eval_pos_f1_macro': 0.2862715500361932, 'eval_pos_precision_micro': 0.6299045272559286, 'eval_pos_recall_micro': 0.6299045272559286, 'eval_pos_f1_micro': 0.6299045272559286, 'eval_Abbr_accuracy': 0.9993840468124423, 'eval_Abbr_precision_macro': 0.49969202340622115, 'eval_Abbr_recall_macro': 0.5, 'eval_Abbr_f1_macro': 0.4998459642637092, 'eval_Abbr_precision_micro': 0.9993840468124423, 'eval_Abbr_recall_micro': 0.9993840468124423, 'eval_Abbr_f1_micro': 0.9993840468124423, 'eval_Case_accuracy': 0.9816445950107792, 'eval_Case_precision_macro': 0.6237830971493706, 'eval_Case_recall_macro': 0.5995542599176837, 'eval_Case_f1_macro': 0.6108994481245369, 'eval_Case_precision_micro': 0.9816445950107792, 'eval_Case_recall_micro': 0.9816445950107792, 'eval_Case_f1_micro': 0.9816445950107792, 'eval_Definite_accuracy': 0.9671388974437942, 'eval_Definite_precision_macro': 0.570645217925757, 'eval_Definite_recall_macro': 0.5851893604042604, 'eval_Definite_f1_macro': 0.5778223477074399, 'eval_Definite_precision_micro': 0.9671388974437942, 'eval_Definite_recall_micro': 0.9671388974437942, 'eval_Definite_f1_micro': 0.9671388974437942, 
'eval_Degree_accuracy': 0.9235294117647059, 'eval_Degree_precision_macro': 0.48088176414426065, 'eval_Degree_recall_macro': 0.25010931351114996, 'eval_Degree_f1_macro': 0.24027937527607288, 'eval_Degree_precision_micro': 0.9235294117647059, 'eval_Degree_recall_micro': 0.9235294117647059, 'eval_Degree_f1_micro': 0.9235294117647059, 'eval_Foreign_accuracy': 0.9999384046812442, 'eval_Foreign_precision_macro': 0.4999692023406221, 'eval_Foreign_recall_macro': 0.5, 'eval_Foreign_f1_macro': 0.49998460069604855, 'eval_Foreign_precision_micro': 0.9999384046812442, 'eval_Foreign_recall_micro': 0.9999384046812442, 'eval_Foreign_f1_micro': 0.9999384046812442, 'eval_Gender_accuracy': 0.9816137973514013, 'eval_Gender_precision_macro': 0.24545636570865292, 'eval_Gender_recall_macro': 0.24994510664993727, 'eval_Gender_f1_macro': 0.2476804003543509, 'eval_Gender_precision_micro': 0.9816137973514013, 'eval_Gender_recall_micro': 0.9816137973514013, 'eval_Gender_f1_micro': 0.9816137973514013, 'eval_Mood_accuracy': 0.9319063751154912, 'eval_Mood_precision_macro': 0.6387004043049438, 'eval_Mood_recall_macro': 0.3883744843777621, 'eval_Mood_f1_macro': 0.41581031611224173, 'eval_Mood_precision_micro': 0.9319063751154912, 'eval_Mood_recall_micro': 0.9319063751154912, 'eval_Mood_f1_micro': 0.9319063751154912, 'eval_NumType_accuracy': 0.9828765013858947, 'eval_NumType_precision_macro': 0.24571912534647367, 'eval_NumType_recall_macro': 0.25, 'eval_NumType_f1_macro': 0.24784107852882703, 'eval_NumType_precision_micro': 0.9828765013858947, 'eval_NumType_recall_micro': 0.9828765013858947, 'eval_NumType_f1_micro': 0.9828765013858947, 'eval_Number_accuracy': 0.8546966430551278, 'eval_Number_precision_macro': 0.8775308105441524, 'eval_Number_recall_macro': 0.5982683704051597, 'eval_Number_f1_macro': 0.5746129222413208, 'eval_Number_precision_micro': 0.8546966430551278, 'eval_Number_recall_micro': 0.8546966430551278, 'eval_Number_f1_micro': 0.8546966430551278, 'eval_Person_accuracy': 
0.9288882044964583, 'eval_Person_precision_macro': 0.60663366254716, 'eval_Person_recall_macro': 0.34372242024231814, 'eval_Person_f1_macro': 0.35067286612707, 'eval_Person_precision_micro': 0.9288882044964583, 'eval_Person_recall_micro': 0.9288882044964583, 'eval_Person_f1_micro': 0.9288882044964583, 'eval_Polarity_accuracy': 0.9957191253464737, 'eval_Polarity_precision_macro': 0.49785956267323683, 'eval_Polarity_recall_macro': 0.5, 'eval_Polarity_f1_macro': 0.4989274856869493, 'eval_Polarity_precision_micro': 0.9957191253464737, 'eval_Polarity_recall_micro': 0.9957191253464737, 'eval_Polarity_f1_micro': 0.9957191253464737, 'eval_PronType_accuracy': 0.9723129042192793, 'eval_PronType_precision_macro': 0.4836619126413276, 'eval_PronType_recall_macro': 0.49156583018410926, 'eval_PronType_f1_macro': 0.4875445572326604, 'eval_PronType_precision_micro': 0.9723129042192793, 'eval_PronType_recall_micro': 0.9723129042192793, 'eval_PronType_f1_micro': 0.9723129042192793, 'eval_Poss_accuracy': 0.9857098860486603, 'eval_Poss_precision_macro': 0.49285494302433014, 'eval_Poss_recall_macro': 0.5, 'eval_Poss_f1_macro': 0.49640176189589924, 'eval_Poss_precision_micro': 0.9857098860486603, 'eval_Poss_recall_micro': 0.9857098860486603, 'eval_Poss_f1_micro': 0.9857098860486603, 'eval_Reflex_accuracy': 0.9991376655374191, 'eval_Reflex_precision_macro': 0.49956883276870956, 'eval_Reflex_recall_macro': 0.5, 'eval_Reflex_f1_macro': 0.49978432339166873, 'eval_Reflex_precision_micro': 0.9991376655374191, 'eval_Reflex_recall_micro': 0.9991376655374191, 'eval_Reflex_f1_micro': 0.9991376655374191, 'eval_Tense_accuracy': 0.9044040652910379, 'eval_Tense_precision_macro': 0.3014680217636793, 'eval_Tense_recall_macro': 0.3333333333333333, 'eval_Tense_f1_macro': 0.31660090130883844, 'eval_Tense_precision_micro': 0.9044040652910379, 'eval_Tense_recall_micro': 0.9044040652910379, 'eval_Tense_f1_micro': 0.9044040652910379, 'eval_VerbForm_accuracy': 0.8764705882352941, 
'eval_VerbForm_precision_macro': 0.34036124720280947, 'eval_VerbForm_recall_macro': 0.2824085711629648, 'eval_VerbForm_f1_macro': 0.29697279356566025, 'eval_VerbForm_precision_micro': 0.8764705882352941, 'eval_VerbForm_recall_micro': 0.8764705882352941, 'eval_VerbForm_f1_micro': 0.8764705882352941, 'eval_Voice_accuracy': 0.9972590083153681, 'eval_Voice_precision_macro': 0.49862950415768403, 'eval_Voice_recall_macro': 0.5, 'eval_Voice_f1_macro': 0.49931381166057576, 'eval_Voice_precision_micro': 0.9972590083153681, 'eval_Voice_recall_micro': 0.9972590083153681, 'eval_Voice_f1_micro': 0.9972590083153681, 'eval_runtime': 260.5761, 'eval_samples_per_second': 9.183, 'eval_steps_per_second': 4.594, 'epoch': 0.68}
332
  {'loss': 40.7431, 'grad_norm': 33.708248138427734, 'learning_rate': 1.919879062736206e-05, 'epoch': 1.35}