---
language:
- pt
- en
tags:
- aes
datasets:
- kamel-usp/aes_enem_dataset
base_model: microsoft/phi-4
metrics:
- accuracy
- qwk
library_name: peft
model-index:
- name: phi-4-phi4_classification_lora-C3-full_context-r8
  results:
  - task:
      type: text-classification
      name: Automated Essay Score
    dataset:
      name: Automated Essay Score ENEM Dataset
      type: kamel-usp/aes_enem_dataset
      config: JBCS2025
      split: test
    metrics:
    - name: Macro F1
      type: f1
      value: 0.3422333666920509
    - name: QWK
      type: qwk
      value: 0.582344914453658
    - name: Weighted Macro F1
      type: f1
      value: 0.3729164740568574
---
# Model ID: phi-4-phi4_classification_lora-C3-full_context-r8
## Results
|                  |   test_data |
|:-----------------|------------:|
| eval_accuracy    |    0.413043 |
| eval_RMSE        |     44.7861 |
| eval_QWK         |    0.582345 |
| eval_Macro_F1    |    0.342233 |
| eval_Weighted_F1 |    0.372916 |
| eval_Micro_F1    |    0.413043 |
| eval_HDIV        |   0.0289855 |