|
|
|
|
|
--- |
|
|
language: |
|
|
- pt |
|
|
- en |
|
|
tags: |
|
|
- aes |
|
|
datasets: |
|
|
- kamel-usp/aes_enem_dataset |
|
|
base_model: microsoft/phi-4 |
|
|
metrics: |
|
|
- accuracy |
|
|
- qwk |
|
|
library_name: peft |
|
|
model-index: |
|
|
- name: phi4-balanced-C5 |
|
|
results: |
|
|
- task: |
|
|
type: text-classification |
|
|
name: Automated Essay Score |
|
|
dataset: |
|
|
name: Automated Essay Score ENEM Dataset |
|
|
type: kamel-usp/aes_enem_dataset |
|
|
config: JBCS2025 |
|
|
split: test |
|
|
metrics: |
|
|
- name: Macro F1 |
|
|
type: f1 |
|
|
value: 0.18887726030583174 |
|
|
- name: QWK |
|
|
type: qwk |
|
|
value: 0.4510713065547368 |
|
|
- name: Weighted F1 |
|
|
type: f1 |
|
|
value: 0.24284273352596336 |
|
|
--- |
|
|
# Model ID: phi4-balanced-C5 |
|
|
## Results |
|
|
|                  |   test_data |
|:-----------------|------------:|
| eval_accuracy    |    0.311594 |
| eval_RMSE        |   61.4793   |
| eval_QWK         |    0.451071 |
| eval_Macro_F1    |    0.188877 |
| eval_Weighted_F1 |    0.242843 |
| eval_Micro_F1    |    0.311594 |
| eval_HDIV        |    0.137681 |
|
|
|