---
language:
- pt
- en
tags:
- aes
datasets:
- kamel-usp/aes_enem_dataset
base_model: microsoft/Phi-3.5-mini-instruct
metrics:
- accuracy
- qwk
library_name: peft
model-index:
- name: phi35-balanced-C2
  results:
  - task:
      type: text-classification
      name: Automated Essay Score
    dataset:
      name: Automated Essay Score ENEM Dataset
      type: kamel-usp/aes_enem_dataset
      config: JBCS2025
      split: test
    metrics:
    - name: Macro F1
      type: f1
      value: 0.27702836615880094
    - name: QWK
      type: qwk
      value: 0.34891857506361335
    - name: Weighted F1
      type: f1
      value: 0.34879657904232575
---
# Model ID: phi35-balanced-C2

## Results

|                  |   test_data |
|:-----------------|------------:|
| eval_accuracy    |   0.384058  |
| eval_RMSE        |  64.2459    |
| eval_QWK         |   0.348919  |
| eval_Macro_F1    |   0.277028  |
| eval_Weighted_F1 |   0.348797  |
| eval_Micro_F1    |   0.384058  |
| eval_HDIV        |   0.0724638 |