lgsilvaesilva committed on Jun 10

Commit

e6caab3

verified ·

1 Parent(s): 4c67f07

Upload folder using huggingface_hub

Browse files

Files changed (50)

.gitattributes +1 -0
README.md +65 -65
REPORT.md +65 -65
baselines/embedding-lightgbm/embedding-lightgbm.joblib +2 -2
baselines/embedding-lightgbm/test_predictions.csv +0 -0
baselines/embedding-lightgbm/validation_predictions.csv +0 -0
baselines/embedding-logistic/embedding-logistic.joblib +2 -2
baselines/embedding-logistic/test_predictions.csv +0 -0
baselines/embedding-logistic/validation_predictions.csv +0 -0
baselines/embedding-svm/embedding-svm.joblib +1 -1
baselines/embedding-svm/test_predictions.csv +0 -0
baselines/embedding-svm/validation_predictions.csv +0 -0
baselines/logistic/logistic_tfidf.joblib +2 -2
baselines/logistic/test_predictions.csv +0 -0
baselines/logistic/validation_predictions.csv +0 -0
baselines/xgboost/test_predictions.csv +0 -0
baselines/xgboost/validation_predictions.csv +0 -0
baselines/xgboost/xgboost_tfidf.joblib +2 -2
report.json +701 -701
transformer/checkpoint-1220/config.json +1 -1
transformer/checkpoint-1220/model.safetensors +1 -1
transformer/checkpoint-1220/optimizer.pt +1 -1
transformer/checkpoint-1220/rng_state.pth +1 -1
transformer/checkpoint-1220/scaler.pt +1 -1
transformer/checkpoint-1220/scheduler.pt +1 -1
transformer/checkpoint-1220/trainer_state.json +218 -244
transformer/checkpoint-1220/training_args.bin +2 -2
transformer/checkpoint-1830/config.json +39 -0
transformer/checkpoint-1830/model.safetensors +3 -0
transformer/checkpoint-1830/optimizer.pt +3 -0
transformer/checkpoint-1830/rng_state.pth +3 -0
transformer/checkpoint-1830/scaler.pt +3 -0
transformer/checkpoint-1830/scheduler.pt +3 -0
transformer/checkpoint-1830/tokenizer.json +3 -0
transformer/checkpoint-1830/tokenizer_config.json +15 -0
transformer/checkpoint-1830/trainer_state.json +593 -0
transformer/checkpoint-1830/training_args.bin +3 -0
transformer/checkpoint-610/config.json +1 -1
transformer/checkpoint-610/model.safetensors +1 -1
transformer/checkpoint-610/optimizer.pt +1 -1
transformer/checkpoint-610/rng_state.pth +1 -1
transformer/checkpoint-610/scaler.pt +1 -1
transformer/checkpoint-610/scheduler.pt +1 -1
transformer/checkpoint-610/trainer_state.json +113 -126
transformer/checkpoint-610/training_args.bin +2 -2
transformer/config.json +6 -6
transformer/model.safetensors +1 -1
transformer/test_predictions.csv +0 -0
transformer/training_args.bin +2 -2
transformer/validation_predictions.csv +0 -0

.gitattributes CHANGED Viewed

@@ -39,3 +39,4 @@ transformer/checkpoint-305/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 transformer/checkpoint-610/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 transformer/checkpoint-915/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 transformer/tokenizer.json filter=lfs diff=lfs merge=lfs -text

 transformer/checkpoint-610/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 transformer/checkpoint-915/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 transformer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+transformer/checkpoint-1830/tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -17,19 +17,19 @@ It includes the Transformer model, any configured TF-IDF or sentence-embedding b
 - Dataset: `faodl/amis-agri-utilization`
 - Dataset subset: ``
-- Dataset revision: `ada4a04088a98f8f64bc7485c57d4c7f422c2151`
 - Text column: `chunk_text`
 - Label column: `label`
 - Transformer: `FacebookAI/xlm-roberta-base`
-- Generated at: `2026-05-27T10:50:45.867038+00:00`
 ## Dataset Summary
 | Split | Rows | Label 0 | Label 1 | Unique groups | Mean text length |
 | --- | ---: | ---: | ---: | ---: | ---: |
-| train | 4877 | 4347 | 530 | 2513 | 696.6 |
-| validation | 978 | 899 | 79 | 538 | 690.6 |
-| test | 1016 | 904 | 112 | 539 | 690.7 |
 ## Threshold Comparison on Validation Split
@@ -37,35 +37,35 @@ Validation metrics document threshold selection and tuning behavior; test metric
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| logistic_tfidf | 0.500 | 0.912 | 0.465 | 0.582 | 0.517 | 0.872 | 0.594 |
-| logistic_tfidf | 0.608 | 0.942 | 0.696 | 0.494 | 0.578 | 0.872 | 0.594 |
-| xgboost_tfidf | 0.500 | 0.945 | 0.931 | 0.342 | 0.500 | 0.823 | 0.588 |
-| xgboost_tfidf | 0.177 | 0.934 | 0.592 | 0.570 | 0.581 | 0.823 | 0.588 |
-| embedding-logistic_sentence_embeddings | 0.500 | 0.912 | 0.476 | 0.861 | 0.613 | 0.953 | 0.762 |
-| embedding-logistic_sentence_embeddings | 0.722 | 0.957 | 0.703 | 0.810 | 0.753 | 0.953 | 0.762 |
-| embedding-svm_sentence_embeddings | 0.500 | 0.955 | 0.807 | 0.582 | 0.676 | 0.952 | 0.754 |
-| embedding-svm_sentence_embeddings | 0.310 | 0.957 | 0.713 | 0.785 | 0.747 | 0.952 | 0.754 |
-| embedding-lightgbm_sentence_embeddings | 0.500 | 0.954 | 0.750 | 0.646 | 0.694 | 0.948 | 0.782 |
-| embedding-lightgbm_sentence_embeddings | 0.042 | 0.952 | 0.670 | 0.797 | 0.728 | 0.948 | 0.782 |
-| transformer | 0.500 | 0.970 | 0.798 | 0.848 | 0.822 | 0.966 | 0.854 |
-| transformer | 0.471 | 0.971 | 0.800 | 0.861 | 0.829 | 0.966 | 0.854 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| logistic_tfidf | 0.500 | 0.926 | 0.691 | 0.598 | 0.641 | 0.899 | 0.726 |
-| logistic_tfidf | 0.608 | 0.930 | 0.902 | 0.411 | 0.564 | 0.899 | 0.726 |
-| xgboost_tfidf | 0.500 | 0.924 | 1.000 | 0.312 | 0.476 | 0.892 | 0.692 |
-| xgboost_tfidf | 0.177 | 0.918 | 0.663 | 0.527 | 0.587 | 0.892 | 0.692 |
-| embedding-logistic_sentence_embeddings | 0.500 | 0.891 | 0.503 | 0.884 | 0.641 | 0.955 | 0.710 |
-| embedding-logistic_sentence_embeddings | 0.722 | 0.935 | 0.689 | 0.750 | 0.718 | 0.955 | 0.710 |
-| embedding-svm_sentence_embeddings | 0.500 | 0.930 | 0.741 | 0.562 | 0.640 | 0.956 | 0.704 |
-| embedding-svm_sentence_embeddings | 0.310 | 0.934 | 0.686 | 0.741 | 0.712 | 0.956 | 0.704 |
-| embedding-lightgbm_sentence_embeddings | 0.500 | 0.937 | 0.740 | 0.661 | 0.698 | 0.960 | 0.791 |
-| embedding-lightgbm_sentence_embeddings | 0.042 | 0.929 | 0.639 | 0.821 | 0.719 | 0.960 | 0.791 |
-| transformer | 0.500 | 0.951 | 0.777 | 0.777 | 0.777 | 0.968 | 0.817 |
-| transformer | 0.471 | 0.950 | 0.770 | 0.777 | 0.773 | 0.968 | 0.817 |
 ## Confusion Matrices on Test Split
@@ -75,95 +75,95 @@ Rows are true labels and columns are predicted labels.
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 874 | 30 |
-| RELEVANT | 45 | 67 |
-### logistic_tfidf at threshold 0.608
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 899 | 5 |
-| RELEVANT | 66 | 46 |
 ### xgboost_tfidf at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 904 | 0 |
-| RELEVANT | 77 | 35 |
-### xgboost_tfidf at threshold 0.177
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 874 | 30 |
-| RELEVANT | 53 | 59 |
 ### embedding-logistic_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 806 | 98 |
-| RELEVANT | 13 | 99 |
-### embedding-logistic_sentence_embeddings at threshold 0.722
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 866 | 38 |
-| RELEVANT | 28 | 84 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 882 | 22 |
-| RELEVANT | 49 | 63 |
-### embedding-svm_sentence_embeddings at threshold 0.310
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 866 | 38 |
-| RELEVANT | 29 | 83 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 878 | 26 |
-| RELEVANT | 38 | 74 |
-### embedding-lightgbm_sentence_embeddings at threshold 0.042
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 852 | 52 |
-| RELEVANT | 20 | 92 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 879 | 25 |
-| RELEVANT | 25 | 87 |
-### transformer at threshold 0.471
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 878 | 26 |
-| RELEVANT | 25 | 87 |
 ## Validation-Tuned Thresholds
-- `logistic_tfidf`: threshold `0.608` (validation F1 `0.578`); test F1 change vs 0.5: `-0.077`.
-- `xgboost_tfidf`: threshold `0.177` (validation F1 `0.581`); test F1 change vs 0.5: `+0.111`.
-- `embedding-logistic_sentence_embeddings`: threshold `0.722` (validation F1 `0.753`); test F1 change vs 0.5: `+0.077`.
-- `embedding-svm_sentence_embeddings`: threshold `0.310` (validation F1 `0.747`); test F1 change vs 0.5: `+0.073`.
-- `embedding-lightgbm_sentence_embeddings`: threshold `0.042` (validation F1 `0.728`); test F1 change vs 0.5: `+0.021`.
-- `transformer`: threshold `0.471` (validation F1 `0.829`); test F1 change vs 0.5: `-0.003`.
 ## Artifacts

 - Dataset: `faodl/amis-agri-utilization`
 - Dataset subset: ``
+- Dataset revision: `main`
 - Text column: `chunk_text`
 - Label column: `label`
 - Transformer: `FacebookAI/xlm-roberta-base`
+- Generated at: `2026-06-09T23:58:45.600559+00:00`
 ## Dataset Summary
 | Split | Rows | Label 0 | Label 1 | Unique groups | Mean text length |
 | --- | ---: | ---: | ---: | ---: | ---: |
+| train | 9753 | 8950 | 803 | 4987 | 696.4 |
+| validation | 2084 | 1885 | 199 | 1069 | 700.8 |
+| test | 2086 | 1957 | 129 | 1069 | 701.6 |
 ## Threshold Comparison on Validation Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
+| logistic_tfidf | 0.500 | 0.901 | 0.482 | 0.462 | 0.472 | 0.867 | 0.496 |
+| logistic_tfidf | 0.360 | 0.863 | 0.380 | 0.688 | 0.489 | 0.867 | 0.496 |
+| xgboost_tfidf | 0.500 | 0.919 | 0.721 | 0.246 | 0.367 | 0.834 | 0.493 |
+| xgboost_tfidf | 0.104 | 0.903 | 0.492 | 0.588 | 0.535 | 0.834 | 0.493 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.895 | 0.474 | 0.869 | 0.613 | 0.952 | 0.652 |
+| embedding-logistic_sentence_embeddings | 0.726 | 0.930 | 0.602 | 0.804 | 0.688 | 0.952 | 0.652 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.931 | 0.712 | 0.472 | 0.568 | 0.954 | 0.670 |
+| embedding-svm_sentence_embeddings | 0.245 | 0.938 | 0.647 | 0.764 | 0.700 | 0.954 | 0.670 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.937 | 0.681 | 0.633 | 0.656 | 0.954 | 0.669 |
+| embedding-lightgbm_sentence_embeddings | 0.089 | 0.933 | 0.610 | 0.824 | 0.701 | 0.954 | 0.669 |
+| transformer | 0.500 | 0.938 | 0.653 | 0.739 | 0.693 | 0.954 | 0.726 |
+| transformer | 0.544 | 0.939 | 0.662 | 0.739 | 0.698 | 0.954 | 0.726 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
+| logistic_tfidf | 0.500 | 0.918 | 0.358 | 0.419 | 0.386 | 0.856 | 0.398 |
+| logistic_tfidf | 0.360 | 0.869 | 0.267 | 0.643 | 0.377 | 0.856 | 0.398 |
+| xgboost_tfidf | 0.500 | 0.950 | 0.766 | 0.279 | 0.409 | 0.821 | 0.471 |
+| xgboost_tfidf | 0.104 | 0.907 | 0.343 | 0.558 | 0.425 | 0.821 | 0.471 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.891 | 0.350 | 0.884 | 0.501 | 0.951 | 0.543 |
+| embedding-logistic_sentence_embeddings | 0.726 | 0.929 | 0.449 | 0.690 | 0.544 | 0.951 | 0.543 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.948 | 0.606 | 0.465 | 0.526 | 0.955 | 0.566 |
+| embedding-svm_sentence_embeddings | 0.245 | 0.937 | 0.494 | 0.674 | 0.570 | 0.955 | 0.566 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.948 | 0.579 | 0.597 | 0.588 | 0.948 | 0.585 |
+| embedding-lightgbm_sentence_embeddings | 0.089 | 0.932 | 0.472 | 0.775 | 0.587 | 0.948 | 0.585 |
+| transformer | 0.500 | 0.943 | 0.532 | 0.643 | 0.582 | 0.931 | 0.500 |
+| transformer | 0.544 | 0.942 | 0.529 | 0.636 | 0.577 | 0.931 | 0.500 |
 ## Confusion Matrices on Test Split
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1860 | 97 |
+| RELEVANT | 75 | 54 |
+### logistic_tfidf at threshold 0.360
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1729 | 228 |
+| RELEVANT | 46 | 83 |
 ### xgboost_tfidf at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1946 | 11 |
+| RELEVANT | 93 | 36 |
+### xgboost_tfidf at threshold 0.104
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1819 | 138 |
+| RELEVANT | 57 | 72 |
 ### embedding-logistic_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1745 | 212 |
+| RELEVANT | 15 | 114 |
+### embedding-logistic_sentence_embeddings at threshold 0.726
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1848 | 109 |
+| RELEVANT | 40 | 89 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1918 | 39 |
+| RELEVANT | 69 | 60 |
+### embedding-svm_sentence_embeddings at threshold 0.245
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1868 | 89 |
+| RELEVANT | 42 | 87 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1901 | 56 |
+| RELEVANT | 52 | 77 |
+### embedding-lightgbm_sentence_embeddings at threshold 0.089
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1845 | 112 |
+| RELEVANT | 29 | 100 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1884 | 73 |
+| RELEVANT | 46 | 83 |
+### transformer at threshold 0.544
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1884 | 73 |
+| RELEVANT | 47 | 82 |
 ## Validation-Tuned Thresholds
+- `logistic_tfidf`: threshold `0.360` (validation F1 `0.489`); test F1 change vs 0.5: `-0.008`.
+- `xgboost_tfidf`: threshold `0.104` (validation F1 `0.535`); test F1 change vs 0.5: `+0.016`.
+- `embedding-logistic_sentence_embeddings`: threshold `0.726` (validation F1 `0.688`); test F1 change vs 0.5: `+0.043`.
+- `embedding-svm_sentence_embeddings`: threshold `0.245` (validation F1 `0.700`); test F1 change vs 0.5: `+0.044`.
+- `embedding-lightgbm_sentence_embeddings`: threshold `0.089` (validation F1 `0.701`); test F1 change vs 0.5: `-0.001`.
+- `transformer`: threshold `0.544` (validation F1 `0.698`); test F1 change vs 0.5: `-0.005`.
 ## Artifacts

REPORT.md CHANGED Viewed

@@ -2,19 +2,19 @@
 - Dataset: `faodl/amis-agri-utilization`
 - Dataset subset: ``
-- Dataset revision: `ada4a04088a98f8f64bc7485c57d4c7f422c2151`
 - Text column: `chunk_text`
 - Label column: `label`
 - Transformer: `FacebookAI/xlm-roberta-base`
-- Generated at: `2026-05-27T10:50:45.867038+00:00`
 ## Dataset Summary
 | Split | Rows | Label 0 | Label 1 | Unique groups | Mean text length |
 | --- | ---: | ---: | ---: | ---: | ---: |
-| train | 4877 | 4347 | 530 | 2513 | 696.6 |
-| validation | 978 | 899 | 79 | 538 | 690.6 |
-| test | 1016 | 904 | 112 | 539 | 690.7 |
 ## Threshold Comparison on Validation Split
@@ -22,35 +22,35 @@ Validation metrics document threshold selection and tuning behavior; test metric
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| logistic_tfidf | 0.500 | 0.912 | 0.465 | 0.582 | 0.517 | 0.872 | 0.594 |
-| logistic_tfidf | 0.608 | 0.942 | 0.696 | 0.494 | 0.578 | 0.872 | 0.594 |
-| xgboost_tfidf | 0.500 | 0.945 | 0.931 | 0.342 | 0.500 | 0.823 | 0.588 |
-| xgboost_tfidf | 0.177 | 0.934 | 0.592 | 0.570 | 0.581 | 0.823 | 0.588 |
-| embedding-logistic_sentence_embeddings | 0.500 | 0.912 | 0.476 | 0.861 | 0.613 | 0.953 | 0.762 |
-| embedding-logistic_sentence_embeddings | 0.722 | 0.957 | 0.703 | 0.810 | 0.753 | 0.953 | 0.762 |
-| embedding-svm_sentence_embeddings | 0.500 | 0.955 | 0.807 | 0.582 | 0.676 | 0.952 | 0.754 |
-| embedding-svm_sentence_embeddings | 0.310 | 0.957 | 0.713 | 0.785 | 0.747 | 0.952 | 0.754 |
-| embedding-lightgbm_sentence_embeddings | 0.500 | 0.954 | 0.750 | 0.646 | 0.694 | 0.948 | 0.782 |
-| embedding-lightgbm_sentence_embeddings | 0.042 | 0.952 | 0.670 | 0.797 | 0.728 | 0.948 | 0.782 |
-| transformer | 0.500 | 0.970 | 0.798 | 0.848 | 0.822 | 0.966 | 0.854 |
-| transformer | 0.471 | 0.971 | 0.800 | 0.861 | 0.829 | 0.966 | 0.854 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
-| logistic_tfidf | 0.500 | 0.926 | 0.691 | 0.598 | 0.641 | 0.899 | 0.726 |
-| logistic_tfidf | 0.608 | 0.930 | 0.902 | 0.411 | 0.564 | 0.899 | 0.726 |
-| xgboost_tfidf | 0.500 | 0.924 | 1.000 | 0.312 | 0.476 | 0.892 | 0.692 |
-| xgboost_tfidf | 0.177 | 0.918 | 0.663 | 0.527 | 0.587 | 0.892 | 0.692 |
-| embedding-logistic_sentence_embeddings | 0.500 | 0.891 | 0.503 | 0.884 | 0.641 | 0.955 | 0.710 |
-| embedding-logistic_sentence_embeddings | 0.722 | 0.935 | 0.689 | 0.750 | 0.718 | 0.955 | 0.710 |
-| embedding-svm_sentence_embeddings | 0.500 | 0.930 | 0.741 | 0.562 | 0.640 | 0.956 | 0.704 |
-| embedding-svm_sentence_embeddings | 0.310 | 0.934 | 0.686 | 0.741 | 0.712 | 0.956 | 0.704 |
-| embedding-lightgbm_sentence_embeddings | 0.500 | 0.937 | 0.740 | 0.661 | 0.698 | 0.960 | 0.791 |
-| embedding-lightgbm_sentence_embeddings | 0.042 | 0.929 | 0.639 | 0.821 | 0.719 | 0.960 | 0.791 |
-| transformer | 0.500 | 0.951 | 0.777 | 0.777 | 0.777 | 0.968 | 0.817 |
-| transformer | 0.471 | 0.950 | 0.770 | 0.777 | 0.773 | 0.968 | 0.817 |
 ## Confusion Matrices on Test Split
@@ -60,95 +60,95 @@ Rows are true labels and columns are predicted labels.
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 874 | 30 |
-| RELEVANT | 45 | 67 |
-### logistic_tfidf at threshold 0.608
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 899 | 5 |
-| RELEVANT | 66 | 46 |
 ### xgboost_tfidf at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 904 | 0 |
-| RELEVANT | 77 | 35 |
-### xgboost_tfidf at threshold 0.177
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 874 | 30 |
-| RELEVANT | 53 | 59 |
 ### embedding-logistic_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 806 | 98 |
-| RELEVANT | 13 | 99 |
-### embedding-logistic_sentence_embeddings at threshold 0.722
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 866 | 38 |
-| RELEVANT | 28 | 84 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 882 | 22 |
-| RELEVANT | 49 | 63 |
-### embedding-svm_sentence_embeddings at threshold 0.310
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 866 | 38 |
-| RELEVANT | 29 | 83 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 878 | 26 |
-| RELEVANT | 38 | 74 |
-### embedding-lightgbm_sentence_embeddings at threshold 0.042
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 852 | 52 |
-| RELEVANT | 20 | 92 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 879 | 25 |
-| RELEVANT | 25 | 87 |
-### transformer at threshold 0.471
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 878 | 26 |
-| RELEVANT | 25 | 87 |
 ## Validation-Tuned Thresholds
-- `logistic_tfidf`: threshold `0.608` (validation F1 `0.578`); test F1 change vs 0.5: `-0.077`.
-- `xgboost_tfidf`: threshold `0.177` (validation F1 `0.581`); test F1 change vs 0.5: `+0.111`.
-- `embedding-logistic_sentence_embeddings`: threshold `0.722` (validation F1 `0.753`); test F1 change vs 0.5: `+0.077`.
-- `embedding-svm_sentence_embeddings`: threshold `0.310` (validation F1 `0.747`); test F1 change vs 0.5: `+0.073`.
-- `embedding-lightgbm_sentence_embeddings`: threshold `0.042` (validation F1 `0.728`); test F1 change vs 0.5: `+0.021`.
-- `transformer`: threshold `0.471` (validation F1 `0.829`); test F1 change vs 0.5: `-0.003`.
 ## Artifacts

 - Dataset: `faodl/amis-agri-utilization`
 - Dataset subset: ``
+- Dataset revision: `main`
 - Text column: `chunk_text`
 - Label column: `label`
 - Transformer: `FacebookAI/xlm-roberta-base`
+- Generated at: `2026-06-09T23:58:45.600559+00:00`
 ## Dataset Summary
 | Split | Rows | Label 0 | Label 1 | Unique groups | Mean text length |
 | --- | ---: | ---: | ---: | ---: | ---: |
+| train | 9753 | 8950 | 803 | 4987 | 696.4 |
+| validation | 2084 | 1885 | 199 | 1069 | 700.8 |
+| test | 2086 | 1957 | 129 | 1069 | 701.6 |
 ## Threshold Comparison on Validation Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
+| logistic_tfidf | 0.500 | 0.901 | 0.482 | 0.462 | 0.472 | 0.867 | 0.496 |
+| logistic_tfidf | 0.360 | 0.863 | 0.380 | 0.688 | 0.489 | 0.867 | 0.496 |
+| xgboost_tfidf | 0.500 | 0.919 | 0.721 | 0.246 | 0.367 | 0.834 | 0.493 |
+| xgboost_tfidf | 0.104 | 0.903 | 0.492 | 0.588 | 0.535 | 0.834 | 0.493 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.895 | 0.474 | 0.869 | 0.613 | 0.952 | 0.652 |
+| embedding-logistic_sentence_embeddings | 0.726 | 0.930 | 0.602 | 0.804 | 0.688 | 0.952 | 0.652 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.931 | 0.712 | 0.472 | 0.568 | 0.954 | 0.670 |
+| embedding-svm_sentence_embeddings | 0.245 | 0.938 | 0.647 | 0.764 | 0.700 | 0.954 | 0.670 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.937 | 0.681 | 0.633 | 0.656 | 0.954 | 0.669 |
+| embedding-lightgbm_sentence_embeddings | 0.089 | 0.933 | 0.610 | 0.824 | 0.701 | 0.954 | 0.669 |
+| transformer | 0.500 | 0.938 | 0.653 | 0.739 | 0.693 | 0.954 | 0.726 |
+| transformer | 0.544 | 0.939 | 0.662 | 0.739 | 0.698 | 0.954 | 0.726 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
+| logistic_tfidf | 0.500 | 0.918 | 0.358 | 0.419 | 0.386 | 0.856 | 0.398 |
+| logistic_tfidf | 0.360 | 0.869 | 0.267 | 0.643 | 0.377 | 0.856 | 0.398 |
+| xgboost_tfidf | 0.500 | 0.950 | 0.766 | 0.279 | 0.409 | 0.821 | 0.471 |
+| xgboost_tfidf | 0.104 | 0.907 | 0.343 | 0.558 | 0.425 | 0.821 | 0.471 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.891 | 0.350 | 0.884 | 0.501 | 0.951 | 0.543 |
+| embedding-logistic_sentence_embeddings | 0.726 | 0.929 | 0.449 | 0.690 | 0.544 | 0.951 | 0.543 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.948 | 0.606 | 0.465 | 0.526 | 0.955 | 0.566 |
+| embedding-svm_sentence_embeddings | 0.245 | 0.937 | 0.494 | 0.674 | 0.570 | 0.955 | 0.566 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.948 | 0.579 | 0.597 | 0.588 | 0.948 | 0.585 |
+| embedding-lightgbm_sentence_embeddings | 0.089 | 0.932 | 0.472 | 0.775 | 0.587 | 0.948 | 0.585 |
+| transformer | 0.500 | 0.943 | 0.532 | 0.643 | 0.582 | 0.931 | 0.500 |
+| transformer | 0.544 | 0.942 | 0.529 | 0.636 | 0.577 | 0.931 | 0.500 |
 ## Confusion Matrices on Test Split
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1860 | 97 |
+| RELEVANT | 75 | 54 |
+### logistic_tfidf at threshold 0.360
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1729 | 228 |
+| RELEVANT | 46 | 83 |
 ### xgboost_tfidf at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1946 | 11 |
+| RELEVANT | 93 | 36 |
+### xgboost_tfidf at threshold 0.104
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1819 | 138 |
+| RELEVANT | 57 | 72 |
 ### embedding-logistic_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1745 | 212 |
+| RELEVANT | 15 | 114 |
+### embedding-logistic_sentence_embeddings at threshold 0.726
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1848 | 109 |
+| RELEVANT | 40 | 89 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1918 | 39 |
+| RELEVANT | 69 | 60 |
+### embedding-svm_sentence_embeddings at threshold 0.245
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1868 | 89 |
+| RELEVANT | 42 | 87 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1901 | 56 |
+| RELEVANT | 52 | 77 |
+### embedding-lightgbm_sentence_embeddings at threshold 0.089
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1845 | 112 |
+| RELEVANT | 29 | 100 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1884 | 73 |
+| RELEVANT | 46 | 83 |
+### transformer at threshold 0.544
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 1884 | 73 |
+| RELEVANT | 47 | 82 |
 ## Validation-Tuned Thresholds
+- `logistic_tfidf`: threshold `0.360` (validation F1 `0.489`); test F1 change vs 0.5: `-0.008`.
+- `xgboost_tfidf`: threshold `0.104` (validation F1 `0.535`); test F1 change vs 0.5: `+0.016`.
+- `embedding-logistic_sentence_embeddings`: threshold `0.726` (validation F1 `0.688`); test F1 change vs 0.5: `+0.043`.
+- `embedding-svm_sentence_embeddings`: threshold `0.245` (validation F1 `0.700`); test F1 change vs 0.5: `+0.044`.
+- `embedding-lightgbm_sentence_embeddings`: threshold `0.089` (validation F1 `0.701`); test F1 change vs 0.5: `-0.001`.
+- `transformer`: threshold `0.544` (validation F1 `0.698`); test F1 change vs 0.5: `-0.005`.
 ## Artifacts

baselines/embedding-lightgbm/embedding-lightgbm.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:02039c6ee8487042ae61343afc227ab7375bbfdb042e073232a995d2e4d57dd6
-size 1467646

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef46feb03d6d86629446a2b84e3976aad0bbf58a95a4a53a9fd370bd0fd97a5b
+size 1454606

baselines/embedding-lightgbm/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-lightgbm/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-logistic/embedding-logistic.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:433846875da231d3a97fc0f6bfa5adc3a1c4edb548d9655dc98a07523b436207
-size 4361

 version https://git-lfs.github.com/spec/v1
+oid sha256:2368ac2c3c1cc353bb281993f87b11f6ea0b4a86abd8d935a9506f607933b1ae
+size 2821

baselines/embedding-logistic/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-logistic/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-svm/embedding-svm.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df3e6eaec015a205089efe2457d89d2ecacdf1661b8607ad60905ef318adc5f4
 size 11770

 version https://git-lfs.github.com/spec/v1
+oid sha256:6d0d609b2c746c6481cb61c52f997a53e8962c60aceda441970bbaeffd07223e
 size 11770

baselines/embedding-svm/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-svm/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/logistic/logistic_tfidf.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:988b232ccc0c55fa1116c0885058e6200246e9dbe050debf6f5edfa81e0438e7
-size 2452308

 version https://git-lfs.github.com/spec/v1
+oid sha256:0ff51ca92cbba2cd25b3bd551d90fa24bbe8217cf6d701c493727b09df330af7
+size 2430788

baselines/logistic/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/logistic/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/xgboost/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/xgboost/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/xgboost/xgboost_tfidf.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75dae90ae561b6e87b2fd736393208127db3493eb3df7a2232490a3a60238d1b
-size 2494551

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4b2edd904d295c0f6e835bcff08adff1506e9ce985ac708d392ce1c8dd97b2a
+size 2483313

report.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-  "created_at": "2026-05-27T10:50:45.867038+00:00",
   "config": {
     "hf_dataset": "faodl/amis-agri-utilization",
     "hf_subset": null,
-    "hf_revision": "ada4a04088a98f8f64bc7485c57d4c7f422c2151",
     "train_split": "train",
     "validation_split": "validation",
     "test_split": "test",
@@ -44,33 +44,33 @@
   },
   "dataset_summary": {
     "train": {
-      "rows": 4877,
       "labels": {
-        "0": 4347,
-        "1": 530
       },
-      "unique_groups": 2513,
-      "text_length_mean": 696.6221037523068,
       "text_length_median": 794.0
     },
     "validation": {
-      "rows": 978,
       "labels": {
-        "0": 899,
-        "1": 79
       },
-      "unique_groups": 538,
-      "text_length_mean": 690.6196319018405,
       "text_length_median": 794.0
     },
     "test": {
-      "rows": 1016,
       "labels": {
-        "0": 904,
-        "1": 112
       },
-      "unique_groups": 539,
-      "text_length_mean": 690.6929133858267,
       "text_length_median": 794.0
     }
   },
@@ -81,194 +81,194 @@
       "artifact_dir": "/content/agri-utilization-classifier/baselines/logistic",
       "artifact_file": "/content/agri-utilization-classifier/baselines/logistic/logistic_tfidf.joblib",
       "validation_best_threshold": {
-        "threshold": 0.6076606929552563,
-        "f1": 0.5777777777777778,
-        "precision": 0.6964285714285714,
-        "recall": 0.4936708860759494
       },
       "validation_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9120654396728016,
-        "precision": 0.46464646464646464,
-        "recall": 0.5822784810126582,
-        "f1": 0.5168539325842697,
         "confusion_matrix": [
           [
-            846,
-            53
           ],
           [
-            33,
-            46
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.962457337883959,
-            "recall": 0.9410456062291435,
-            "f1-score": 0.9516310461192351,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.46464646464646464,
-            "recall": 0.5822784810126582,
-            "f1-score": 0.5168539325842697,
-            "support": 79.0
           },
-          "accuracy": 0.9120654396728016,
           "macro avg": {
-            "precision": 0.7135519012652118,
-            "recall": 0.7616620436209008,
-            "f1-score": 0.7342424893517524,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9222456211296011,
-            "recall": 0.9120654396728016,
-            "f1-score": 0.9165110134308279,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.871530955632841,
-        "average_precision": 0.5935308473185881
       },
       "validation_optimal_threshold": {
-        "threshold": 0.6076606929552563,
-        "accuracy": 0.941717791411043,
-        "precision": 0.6964285714285714,
-        "recall": 0.4936708860759494,
-        "f1": 0.5777777777777777,
         "confusion_matrix": [
           [
-            882,
-            17
           ],
           [
-            40,
-            39
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9566160520607375,
-            "recall": 0.9810901001112347,
-            "f1-score": 0.9686985172981878,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.6964285714285714,
-            "recall": 0.4936708860759494,
-            "f1-score": 0.5777777777777777,
-            "support": 79.0
           },
-          "accuracy": 0.941717791411043,
           "macro avg": {
-            "precision": 0.8265223117446545,
-            "recall": 0.737380493093592,
-            "f1-score": 0.7732381475379828,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9355988629299183,
-            "recall": 0.941717791411043,
-            "f1-score": 0.9371210751487886,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.871530955632841,
-        "average_precision": 0.5935308473185881
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9261811023622047,
-        "precision": 0.6907216494845361,
-        "recall": 0.5982142857142857,
-        "f1": 0.6411483253588517,
         "confusion_matrix": [
           [
-            874,
-            30
           ],
           [
-            45,
-            67
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9510337323177367,
-            "recall": 0.9668141592920354,
-            "f1-score": 0.9588590235874932,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.6907216494845361,
-            "recall": 0.5982142857142857,
-            "f1-score": 0.6411483253588517,
-            "support": 112.0
           },
-          "accuracy": 0.9261811023622047,
           "macro avg": {
-            "precision": 0.8208776909011364,
-            "recall": 0.7825142225031605,
-            "f1-score": 0.8000036744731724,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9223379121628957,
-            "recall": 0.9261811023622047,
-            "f1-score": 0.9238357970111075,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.8990004740834386,
-        "average_precision": 0.7262348311700503
       },
       "test_optimal_threshold": {
-        "threshold": 0.6076606929552563,
-        "accuracy": 0.9301181102362205,
-        "precision": 0.9019607843137255,
-        "recall": 0.4107142857142857,
-        "f1": 0.5644171779141104,
         "confusion_matrix": [
           [
-            899,
-            5
           ],
           [
-            66,
-            46
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9316062176165804,
-            "recall": 0.9944690265486725,
-            "f1-score": 0.962011771000535,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.9019607843137255,
-            "recall": 0.4107142857142857,
-            "f1-score": 0.5644171779141104,
-            "support": 112.0
           },
-          "accuracy": 0.9301181102362205,
           "macro avg": {
-            "precision": 0.9167835009651529,
-            "recall": 0.7025916561314791,
-            "f1-score": 0.7632144744573227,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9283382170950057,
-            "recall": 0.9301181102362205,
-            "f1-score": 0.9181824457784095,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.8990004740834386,
-        "average_precision": 0.7262348311700503
       }
     },
     {
@@ -277,194 +277,194 @@
       "artifact_dir": "/content/agri-utilization-classifier/baselines/xgboost",
       "artifact_file": "/content/agri-utilization-classifier/baselines/xgboost/xgboost_tfidf.joblib",
       "validation_best_threshold": {
-        "threshold": 0.17728303372859955,
-        "f1": 0.5806451612903226,
-        "precision": 0.5921052631578947,
-        "recall": 0.569620253164557
       },
       "validation_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9447852760736196,
-        "precision": 0.9310344827586207,
-        "recall": 0.34177215189873417,
-        "f1": 0.5,
         "confusion_matrix": [
           [
-            897,
-            2
           ],
           [
-            52,
-            27
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9452054794520548,
-            "recall": 0.9977753058954394,
-            "f1-score": 0.9707792207792207,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.9310344827586207,
-            "recall": 0.34177215189873417,
-            "f1-score": 0.5,
-            "support": 79.0
           },
-          "accuracy": 0.9447852760736196,
           "macro avg": {
-            "precision": 0.9381199811053378,
-            "recall": 0.6697737288970868,
-            "f1-score": 0.7353896103896104,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9440607874901108,
-            "recall": 0.9447852760736196,
-            "f1-score": 0.9327510424136191,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.822629926359809,
-        "average_precision": 0.5882293042162409
       },
       "validation_optimal_threshold": {
-        "threshold": 0.17728303372859955,
-        "accuracy": 0.9335378323108384,
-        "precision": 0.5921052631578947,
-        "recall": 0.569620253164557,
-        "f1": 0.5806451612903226,
         "confusion_matrix": [
           [
-            868,
-            31
           ],
           [
-            34,
-            45
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9623059866962306,
-            "recall": 0.9655172413793104,
-            "f1-score": 0.9639089394780678,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.5921052631578947,
-            "recall": 0.569620253164557,
-            "f1-score": 0.5806451612903226,
-            "support": 79.0
           },
-          "accuracy": 0.9335378323108384,
           "macro avg": {
-            "precision": 0.7772056249270627,
-            "recall": 0.7675687472719337,
-            "f1-score": 0.7722770503841951,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9324022472693098,
-            "recall": 0.9335378323108384,
-            "f1-score": 0.9329500044301825,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.822629926359809,
-        "average_precision": 0.5882293042162409
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9242125984251969,
-        "precision": 1.0,
-        "recall": 0.3125,
-        "f1": 0.47619047619047616,
         "confusion_matrix": [
           [
-            904,
-            0
           ],
           [
-            77,
-            35
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9215086646279307,
-            "recall": 1.0,
-            "f1-score": 0.9591511936339523,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 1.0,
-            "recall": 0.3125,
-            "f1-score": 0.47619047619047616,
-            "support": 112.0
           },
-          "accuracy": 0.9242125984251969,
           "macro avg": {
-            "precision": 0.9607543323139653,
-            "recall": 0.65625,
-            "f1-score": 0.7176708349122143,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9301612527791825,
-            "recall": 0.9242125984251969,
-            "f1-score": 0.905911429506325,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.8921114491150443,
-        "average_precision": 0.6916666494483661
       },
       "test_optimal_threshold": {
-        "threshold": 0.17728303372859955,
-        "accuracy": 0.9183070866141733,
-        "precision": 0.6629213483146067,
-        "recall": 0.5267857142857143,
-        "f1": 0.5870646766169154,
         "confusion_matrix": [
           [
-            874,
-            30
           ],
           [
-            53,
-            59
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9428263214670982,
-            "recall": 0.9668141592920354,
-            "f1-score": 0.9546695794647734,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.6629213483146067,
-            "recall": 0.5267857142857143,
-            "f1-score": 0.5870646766169154,
-            "support": 112.0
           },
-          "accuracy": 0.9183070866141733,
           "macro avg": {
-            "precision": 0.8028738348908524,
-            "recall": 0.7467999367888749,
-            "f1-score": 0.7708671280408443,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9119706551353274,
-            "recall": 0.9183070866141733,
-            "f1-score": 0.9141462043476867,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.8921114491150443,
-        "average_precision": 0.6916666494483661
       }
     },
     {
@@ -474,194 +474,194 @@
       "artifact_dir": "/content/agri-utilization-classifier/baselines/embedding-logistic",
       "artifact_file": "/content/agri-utilization-classifier/baselines/embedding-logistic/embedding-logistic.joblib",
       "validation_best_threshold": {
-        "threshold": 0.7220406191151401,
-        "f1": 0.7529411764705883,
-        "precision": 0.7032967032967034,
-        "recall": 0.810126582278481
       },
       "validation_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9120654396728016,
-        "precision": 0.4755244755244755,
-        "recall": 0.8607594936708861,
-        "f1": 0.6126126126126126,
         "confusion_matrix": [
           [
-            824,
-            75
           ],
           [
-            11,
-            68
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9868263473053892,
-            "recall": 0.9165739710789766,
-            "f1-score": 0.9504036908881199,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.4755244755244755,
-            "recall": 0.8607594936708861,
-            "f1-score": 0.6126126126126126,
-            "support": 79.0
           },
-          "accuracy": 0.9120654396728016,
           "macro avg": {
-            "precision": 0.7311754114149324,
-            "recall": 0.8886667323749313,
-            "f1-score": 0.7815081517503663,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9455248668650087,
-            "recall": 0.9120654396728016,
-            "f1-score": 0.9231179084916321,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9525633263400967,
-        "average_precision": 0.7622834015915168
       },
       "validation_optimal_threshold": {
-        "threshold": 0.7220406191151401,
-        "accuracy": 0.9570552147239264,
-        "precision": 0.7032967032967034,
-        "recall": 0.810126582278481,
-        "f1": 0.7529411764705882,
         "confusion_matrix": [
           [
-            872,
-            27
           ],
           [
-            15,
-            64
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9830890642615558,
-            "recall": 0.9699666295884316,
-            "f1-score": 0.9764837625979843,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.7032967032967034,
-            "recall": 0.810126582278481,
-            "f1-score": 0.7529411764705882,
-            "support": 79.0
           },
-          "accuracy": 0.9570552147239264,
           "macro avg": {
-            "precision": 0.8431928837791296,
-            "recall": 0.8900466059334563,
-            "f1-score": 0.8647124695342863,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9604882498277897,
-            "recall": 0.9570552147239264,
-            "f1-score": 0.9584266416326834,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9525633263400967,
-        "average_precision": 0.7622834015915168
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.890748031496063,
-        "precision": 0.5025380710659898,
-        "recall": 0.8839285714285714,
-        "f1": 0.6407766990291263,
         "confusion_matrix": [
           [
-            806,
-            98
           ],
           [
-            13,
-            99
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9841269841269841,
-            "recall": 0.8915929203539823,
-            "f1-score": 0.9355774811375508,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.5025380710659898,
-            "recall": 0.8839285714285714,
-            "f1-score": 0.6407766990291263,
-            "support": 112.0
           },
-          "accuracy": 0.890748031496063,
           "macro avg": {
-            "precision": 0.7433325275964869,
-            "recall": 0.8877607458912768,
-            "f1-score": 0.7881770900833385,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9310384425297091,
-            "recall": 0.890748031496063,
-            "f1-score": 0.9030797571255984,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.955317635903919,
-        "average_precision": 0.7096184898069098
       },
       "test_optimal_threshold": {
-        "threshold": 0.7220406191151401,
-        "accuracy": 0.9350393700787402,
-        "precision": 0.6885245901639344,
-        "recall": 0.75,
-        "f1": 0.717948717948718,
         "confusion_matrix": [
           [
-            866,
-            38
           ],
           [
-            28,
-            84
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9686800894854586,
-            "recall": 0.9579646017699115,
-            "f1-score": 0.9632925472747497,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.6885245901639344,
-            "recall": 0.75,
-            "f1-score": 0.717948717948718,
-            "support": 112.0
           },
-          "accuracy": 0.9350393700787402,
           "macro avg": {
-            "precision": 0.8286023398246964,
-            "recall": 0.8539823008849557,
-            "f1-score": 0.8406206326117338,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9377968060956843,
-            "recall": 0.9350393700787402,
-            "f1-score": 0.9362467708136123,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.955317635903919,
-        "average_precision": 0.7096184898069098
       }
     },
     {
@@ -671,194 +671,194 @@
       "artifact_dir": "/content/agri-utilization-classifier/baselines/embedding-svm",
       "artifact_file": "/content/agri-utilization-classifier/baselines/embedding-svm/embedding-svm.joblib",
       "validation_best_threshold": {
-        "threshold": 0.30975184413575924,
-        "f1": 0.746987951807229,
-        "precision": 0.7126436781609196,
-        "recall": 0.7848101265822784
       },
       "validation_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9550102249488752,
-        "precision": 0.8070175438596491,
-        "recall": 0.5822784810126582,
-        "f1": 0.6764705882352942,
         "confusion_matrix": [
           [
-            888,
-            11
           ],
           [
-            33,
-            46
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9641693811074918,
-            "recall": 0.9877641824249166,
-            "f1-score": 0.9758241758241758,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.8070175438596491,
-            "recall": 0.5822784810126582,
-            "f1-score": 0.6764705882352942,
-            "support": 79.0
           },
-          "accuracy": 0.9550102249488752,
           "macro avg": {
-            "precision": 0.8855934624835704,
-            "recall": 0.7850213317187874,
-            "f1-score": 0.8261473820297349,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9514751120455496,
-            "recall": 0.9550102249488752,
-            "f1-score": 0.9516432623072826,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9524506836006251,
-        "average_precision": 0.7542419360138435
       },
       "validation_optimal_threshold": {
-        "threshold": 0.30975184413575924,
-        "accuracy": 0.9570552147239264,
-        "precision": 0.7126436781609196,
-        "recall": 0.7848101265822784,
-        "f1": 0.7469879518072289,
         "confusion_matrix": [
           [
-            874,
-            25
           ],
           [
-            17,
-            62
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9809203142536476,
-            "recall": 0.9721913236929922,
-            "f1-score": 0.976536312849162,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.7126436781609196,
-            "recall": 0.7848101265822784,
-            "f1-score": 0.7469879518072289,
-            "support": 79.0
           },
-          "accuracy": 0.9570552147239264,
           "macro avg": {
-            "precision": 0.8467819962072836,
-            "recall": 0.8785007251376353,
-            "f1-score": 0.8617621323281954,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9592497066347054,
-            "recall": 0.9570552147239264,
-            "f1-score": 0.9579940628263474,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9524506836006251,
-        "average_precision": 0.7542419360138435
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9301181102362205,
-        "precision": 0.7411764705882353,
-        "recall": 0.5625,
-        "f1": 0.6395939086294417,
         "confusion_matrix": [
           [
-            882,
-            22
           ],
           [
-            49,
-            63
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9473684210526315,
-            "recall": 0.9756637168141593,
-            "f1-score": 0.9613079019073569,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.7411764705882353,
-            "recall": 0.5625,
-            "f1-score": 0.6395939086294417,
-            "support": 112.0
           },
-          "accuracy": 0.9301181102362205,
           "macro avg": {
-            "precision": 0.8442724458204334,
-            "recall": 0.7690818584070797,
-            "f1-score": 0.8004509052683992,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9246385997415957,
-            "recall": 0.9301181102362205,
-            "f1-score": 0.9258433672153032,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.9563744469026548,
-        "average_precision": 0.7035914186137721
       },
       "test_optimal_threshold": {
-        "threshold": 0.30975184413575924,
-        "accuracy": 0.9340551181102362,
-        "precision": 0.6859504132231405,
-        "recall": 0.7410714285714286,
-        "f1": 0.7124463519313304,
         "confusion_matrix": [
           [
-            866,
-            38
           ],
           [
-            29,
-            83
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9675977653631285,
-            "recall": 0.9579646017699115,
-            "f1-score": 0.962757087270706,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.6859504132231405,
-            "recall": 0.7410714285714286,
-            "f1-score": 0.7124463519313304,
-            "support": 112.0
           },
-          "accuracy": 0.9340551181102362,
           "macro avg": {
-            "precision": 0.8267740892931346,
-            "recall": 0.84951801517067,
-            "f1-score": 0.8376017196010181,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9365500257571455,
-            "recall": 0.9340551181102362,
-            "f1-score": 0.9351637778632157,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.9563744469026548,
-        "average_precision": 0.7035914186137721
       }
     },
     {
@@ -868,194 +868,194 @@
       "artifact_dir": "/content/agri-utilization-classifier/baselines/embedding-lightgbm",
       "artifact_file": "/content/agri-utilization-classifier/baselines/embedding-lightgbm/embedding-lightgbm.joblib",
       "validation_best_threshold": {
-        "threshold": 0.042041465431985434,
-        "f1": 0.7283236994219654,
-        "precision": 0.6702127659574468,
-        "recall": 0.7974683544303798
       },
       "validation_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9539877300613497,
-        "precision": 0.75,
-        "recall": 0.6455696202531646,
-        "f1": 0.6938775510204082,
         "confusion_matrix": [
           [
-            882,
-            17
           ],
           [
-            28,
-            51
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9692307692307692,
-            "recall": 0.9810901001112347,
-            "f1-score": 0.9751243781094527,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.75,
-            "recall": 0.6455696202531646,
-            "f1-score": 0.6938775510204082,
-            "support": 79.0
           },
-          "accuracy": 0.9539877300613497,
           "macro avg": {
-            "precision": 0.8596153846153847,
-            "recall": 0.8133298601821997,
-            "f1-score": 0.8345009645649304,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9515219443133554,
-            "recall": 0.9539877300613497,
-            "f1-score": 0.9524060761257774,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9480716971036736,
-        "average_precision": 0.7818499996214695
       },
       "validation_optimal_threshold": {
-        "threshold": 0.042041465431985434,
-        "accuracy": 0.9519427402862985,
-        "precision": 0.6702127659574468,
-        "recall": 0.7974683544303798,
-        "f1": 0.7283236994219653,
         "confusion_matrix": [
           [
-            868,
-            31
           ],
           [
-            16,
-            63
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9819004524886877,
-            "recall": 0.9655172413793104,
-            "f1-score": 0.9736399326977005,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.6702127659574468,
-            "recall": 0.7974683544303798,
-            "f1-score": 0.7283236994219653,
-            "support": 79.0
           },
-          "accuracy": 0.9519427402862985,
           "macro avg": {
-            "precision": 0.8260566092230672,
-            "recall": 0.881492797904845,
-            "f1-score": 0.8509818160598329,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9567232262760416,
-            "recall": 0.9519427402862985,
-            "f1-score": 0.9538239997439346,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9480716971036736,
-        "average_precision": 0.7818499996214695
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.937007874015748,
-        "precision": 0.74,
-        "recall": 0.6607142857142857,
-        "f1": 0.6981132075471698,
         "confusion_matrix": [
           [
-            878,
-            26
           ],
           [
-            38,
-            74
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9585152838427947,
-            "recall": 0.9712389380530974,
-            "f1-score": 0.9648351648351648,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.74,
-            "recall": 0.6607142857142857,
-            "f1-score": 0.6981132075471698,
-            "support": 112.0
           },
-          "accuracy": 0.937007874015748,
           "macro avg": {
-            "precision": 0.8492576419213973,
-            "recall": 0.8159766118836915,
-            "f1-score": 0.8314741861911673,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9344269848365024,
-            "recall": 0.937007874015748,
-            "f1-score": 0.9354327443467244,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.9597819216182049,
-        "average_precision": 0.7911233572387708
       },
       "test_optimal_threshold": {
-        "threshold": 0.042041465431985434,
-        "accuracy": 0.9291338582677166,
-        "precision": 0.6388888888888888,
-        "recall": 0.8214285714285714,
-        "f1": 0.71875,
         "confusion_matrix": [
           [
-            852,
-            52
           ],
           [
-            20,
-            92
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9770642201834863,
-            "recall": 0.9424778761061947,
-            "f1-score": 0.9594594594594594,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.6388888888888888,
-            "recall": 0.8214285714285714,
-            "f1-score": 0.71875,
-            "support": 112.0
           },
-          "accuracy": 0.9291338582677166,
           "macro avg": {
-            "precision": 0.8079765545361876,
-            "recall": 0.881953223767383,
-            "f1-score": 0.8391047297297297,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9397850498045542,
-            "recall": 0.9291338582677166,
-            "f1-score": 0.9329245584166844,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.9597819216182049,
-        "average_precision": 0.7911233572387708
       }
     },
     {
@@ -1063,194 +1063,194 @@
       "model_name": "FacebookAI/xlm-roberta-base",
       "artifact_dir": "/content/agri-utilization-classifier/transformer",
       "validation_best_threshold": {
-        "threshold": 0.4710787534713745,
-        "f1": 0.829268292682927,
-        "precision": 0.8,
-        "recall": 0.8607594936708861
       },
       "validation_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9703476482617587,
-        "precision": 0.7976190476190477,
-        "recall": 0.8481012658227848,
-        "f1": 0.8220858895705522,
         "confusion_matrix": [
           [
-            882,
-            17
           ],
           [
-            12,
-            67
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9865771812080537,
-            "recall": 0.9810901001112347,
-            "f1-score": 0.9838259899609593,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.7976190476190477,
-            "recall": 0.8481012658227848,
-            "f1-score": 0.8220858895705522,
-            "support": 79.0
           },
-          "accuracy": 0.9703476482617587,
           "macro avg": {
-            "precision": 0.8920981144135507,
-            "recall": 0.9145956829670097,
-            "f1-score": 0.9029559397657557,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.9713136918895144,
-            "recall": 0.9703476482617587,
-            "f1-score": 0.9707610943261513,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9661086157615353,
-        "average_precision": 0.8539255147550682
       },
       "validation_optimal_threshold": {
-        "threshold": 0.4710787534713745,
-        "accuracy": 0.9713701431492843,
-        "precision": 0.8,
-        "recall": 0.8607594936708861,
-        "f1": 0.8292682926829268,
         "confusion_matrix": [
           [
-            882,
-            17
           ],
           [
-            11,
-            68
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9876819708846585,
-            "recall": 0.9810901001112347,
-            "f1-score": 0.984375,
-            "support": 899.0
           },
           "RELEVANT": {
-            "precision": 0.8,
-            "recall": 0.8607594936708861,
-            "f1-score": 0.8292682926829268,
-            "support": 79.0
           },
-          "accuracy": 0.9713701431492843,
           "macro avg": {
-            "precision": 0.8938409854423293,
-            "recall": 0.9209247968910603,
-            "f1-score": 0.9068216463414633,
-            "support": 978.0
           },
           "weighted avg": {
-            "precision": 0.972521566283546,
-            "recall": 0.9713701431492843,
-            "f1-score": 0.9718459305950421,
-            "support": 978.0
           }
         },
-        "roc_auc": 0.9661086157615353,
-        "average_precision": 0.8539255147550682
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.9507874015748031,
-        "precision": 0.7767857142857143,
-        "recall": 0.7767857142857143,
-        "f1": 0.7767857142857143,
         "confusion_matrix": [
           [
-            879,
-            25
           ],
           [
-            25,
-            87
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9723451327433629,
-            "recall": 0.9723451327433629,
-            "f1-score": 0.9723451327433629,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.7767857142857143,
-            "recall": 0.7767857142857143,
-            "f1-score": 0.7767857142857143,
-            "support": 112.0
           },
-          "accuracy": 0.9507874015748031,
           "macro avg": {
-            "precision": 0.8745654235145386,
-            "recall": 0.8745654235145386,
-            "f1-score": 0.8745654235145386,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9507874015748031,
-            "recall": 0.9507874015748031,
-            "f1-score": 0.9507874015748031,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.9682512247155499,
-        "average_precision": 0.8171206633671375
       },
       "test_optimal_threshold": {
-        "threshold": 0.4710787534713745,
-        "accuracy": 0.9498031496062992,
-        "precision": 0.7699115044247787,
-        "recall": 0.7767857142857143,
-        "f1": 0.7733333333333333,
         "confusion_matrix": [
           [
-            878,
-            26
           ],
           [
-            25,
-            87
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9723145071982281,
-            "recall": 0.9712389380530974,
-            "f1-score": 0.9717764250138351,
-            "support": 904.0
           },
           "RELEVANT": {
-            "precision": 0.7699115044247787,
-            "recall": 0.7767857142857143,
-            "f1-score": 0.7733333333333333,
-            "support": 112.0
           },
-          "accuracy": 0.9498031496062992,
           "macro avg": {
-            "precision": 0.8711130058115034,
-            "recall": 0.8740123261694058,
-            "f1-score": 0.8725548791735842,
-            "support": 1016.0
           },
           "weighted avg": {
-            "precision": 0.9500023651602102,
-            "recall": 0.9498031496062992,
-            "f1-score": 0.9499008086081104,
-            "support": 1016.0
           }
         },
-        "roc_auc": 0.9682512247155499,
-        "average_precision": 0.8171206633671375
       }
     }
   ]

 {
+  "created_at": "2026-06-09T23:58:45.600559+00:00",
   "config": {
     "hf_dataset": "faodl/amis-agri-utilization",
     "hf_subset": null,
+    "hf_revision": "main",
     "train_split": "train",
     "validation_split": "validation",
     "test_split": "test",
   },
   "dataset_summary": {
     "train": {
+      "rows": 9753,
       "labels": {
+        "0": 8950,
+        "1": 803
       },
+      "unique_groups": 4987,
+      "text_length_mean": 696.3964933866503,
       "text_length_median": 794.0
     },
     "validation": {
+      "rows": 2084,
       "labels": {
+        "0": 1885,
+        "1": 199
       },
+      "unique_groups": 1069,
+      "text_length_mean": 700.8267754318618,
       "text_length_median": 794.0
     },
     "test": {
+      "rows": 2086,
       "labels": {
+        "0": 1957,
+        "1": 129
       },
+      "unique_groups": 1069,
+      "text_length_mean": 701.6332694151486,
       "text_length_median": 794.0
     }
   },
       "artifact_dir": "/content/agri-utilization-classifier/baselines/logistic",
       "artifact_file": "/content/agri-utilization-classifier/baselines/logistic/logistic_tfidf.joblib",
       "validation_best_threshold": {
+        "threshold": 0.36023362771573536,
+        "f1": 0.48928571428571427,
+        "precision": 0.37950138504155123,
+        "recall": 0.6884422110552764
       },
       "validation_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9011516314779271,
+        "precision": 0.4816753926701571,
+        "recall": 0.4623115577889447,
+        "f1": 0.4717948717948718,
         "confusion_matrix": [
           [
+            1786,
+            99
           ],
           [
+            107,
+            92
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9434759640781828,
+            "recall": 0.9474801061007958,
+            "f1-score": 0.9454737956590789,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.4816753926701571,
+            "recall": 0.4623115577889447,
+            "f1-score": 0.4717948717948718,
+            "support": 199.0
           },
+          "accuracy": 0.9011516314779271,
           "macro avg": {
+            "precision": 0.7125756783741699,
+            "recall": 0.7048958319448703,
+            "f1-score": 0.7086343337269754,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.8993788845627332,
+            "recall": 0.9011516314779271,
+            "f1-score": 0.9002424588793393,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.8674606454020767,
+        "average_precision": 0.4960554729220717
       },
       "validation_optimal_threshold": {
+        "threshold": 0.36023362771573536,
+        "accuracy": 0.8627639155470249,
+        "precision": 0.37950138504155123,
+        "recall": 0.6884422110552764,
+        "f1": 0.48928571428571427,
         "confusion_matrix": [
           [
+            1661,
+            224
           ],
           [
+            62,
+            137
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9640162507254788,
+            "recall": 0.8811671087533156,
+            "f1-score": 0.9207317073170732,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.37950138504155123,
+            "recall": 0.6884422110552764,
+            "f1-score": 0.48928571428571427,
+            "support": 199.0
           },
+          "accuracy": 0.8627639155470249,
           "macro avg": {
+            "precision": 0.671758817883515,
+            "recall": 0.7848046599042959,
+            "f1-score": 0.7050087108013937,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9082012515550846,
+            "recall": 0.8627639155470249,
+            "f1-score": 0.879533169594789,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.8674606454020767,
+        "average_precision": 0.4960554729220717
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9175455417066155,
+        "precision": 0.3576158940397351,
+        "recall": 0.4186046511627907,
+        "f1": 0.38571428571428573,
         "confusion_matrix": [
           [
+            1860,
+            97
           ],
           [
+            75,
+            54
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9612403100775194,
+            "recall": 0.9504343382728666,
+            "f1-score": 0.9558067831449126,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.3576158940397351,
+            "recall": 0.4186046511627907,
+            "f1-score": 0.38571428571428573,
+            "support": 129.0
           },
+          "accuracy": 0.9175455417066155,
           "macro avg": {
+            "precision": 0.6594281020586272,
+            "recall": 0.6845194947178287,
+            "f1-score": 0.6707605344295992,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9239116668997274,
+            "recall": 0.9175455417066155,
+            "f1-score": 0.9205517821053388,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.8562663149180244,
+        "average_precision": 0.3981049318082447
       },
       "test_optimal_threshold": {
+        "threshold": 0.36023362771573536,
+        "accuracy": 0.8686481303930969,
+        "precision": 0.26688102893890675,
+        "recall": 0.6434108527131783,
+        "f1": 0.37727272727272726,
         "confusion_matrix": [
           [
+            1729,
+            228
           ],
           [
+            46,
+            83
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9740845070422535,
+            "recall": 0.883495145631068,
+            "f1-score": 0.9265809217577706,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.26688102893890675,
+            "recall": 0.6434108527131783,
+            "f1-score": 0.37727272727272726,
+            "support": 129.0
           },
+          "accuracy": 0.8686481303930969,
           "macro avg": {
+            "precision": 0.6204827679905801,
+            "recall": 0.7634529991721232,
+            "f1-score": 0.651926824515249,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9303504472745969,
+            "recall": 0.8686481303930969,
+            "f1-score": 0.8926112395484846,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.8562663149180244,
+        "average_precision": 0.3981049318082447
       }
     },
     {
       "artifact_dir": "/content/agri-utilization-classifier/baselines/xgboost",
       "artifact_file": "/content/agri-utilization-classifier/baselines/xgboost/xgboost_tfidf.joblib",
       "validation_best_threshold": {
+        "threshold": 0.10415865480899811,
+        "f1": 0.5354691075514874,
+        "precision": 0.49159663865546216,
+        "recall": 0.5879396984924623
       },
       "validation_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9189059500959693,
+        "precision": 0.7205882352941176,
+        "recall": 0.24623115577889448,
+        "f1": 0.36704119850187267,
         "confusion_matrix": [
           [
+            1866,
+            19
           ],
           [
+            150,
+            49
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9255952380952381,
+            "recall": 0.9899204244031831,
+            "f1-score": 0.9566777749295052,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.7205882352941176,
+            "recall": 0.24623115577889448,
+            "f1-score": 0.36704119850187267,
+            "support": 199.0
           },
+          "accuracy": 0.9189059500959693,
           "macro avg": {
+            "precision": 0.823091736694678,
+            "recall": 0.6180757900910387,
+            "f1-score": 0.661859486715689,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9060192335091427,
+            "recall": 0.9189059500959693,
+            "f1-score": 0.9003737064510509,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.8338682803940125,
+        "average_precision": 0.49303491730954946
       },
       "validation_optimal_threshold": {
+        "threshold": 0.10415865480899811,
+        "accuracy": 0.9025911708253359,
+        "precision": 0.49159663865546216,
+        "recall": 0.5879396984924623,
+        "f1": 0.5354691075514875,
         "confusion_matrix": [
           [
+            1764,
+            121
           ],
           [
+            82,
+            117
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9555796316359697,
+            "recall": 0.9358090185676392,
+            "f1-score": 0.9455909943714822,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.49159663865546216,
+            "recall": 0.5879396984924623,
+            "f1-score": 0.5354691075514875,
+            "support": 199.0
           },
+          "accuracy": 0.9025911708253359,
           "macro avg": {
+            "precision": 0.723588135145716,
+            "recall": 0.7618743585300507,
+            "f1-score": 0.7405300509614848,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9112741538993474,
+            "recall": 0.9025911708253359,
+            "f1-score": 0.906428683681857,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.8338682803940125,
+        "average_precision": 0.49303491730954946
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.950143815915628,
+        "precision": 0.7659574468085106,
+        "recall": 0.27906976744186046,
+        "f1": 0.4090909090909091,
         "confusion_matrix": [
           [
+            1946,
+            11
           ],
           [
+            93,
+            36
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9543894065718489,
+            "recall": 0.9943791517629024,
+            "f1-score": 0.973973973973974,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.7659574468085106,
+            "recall": 0.27906976744186046,
+            "f1-score": 0.4090909090909091,
+            "support": 129.0
           },
+          "accuracy": 0.950143815915628,
           "macro avg": {
+            "precision": 0.8601734266901797,
+            "recall": 0.6367244596023814,
+            "f1-score": 0.6915324415324415,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9427366151962637,
+            "recall": 0.950143815915628,
+            "f1-score": 0.9390411286384441,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.8210657033190336,
+        "average_precision": 0.47107353711983707
       },
       "test_optimal_threshold": {
+        "threshold": 0.10415865480899811,
+        "accuracy": 0.9065196548418025,
+        "precision": 0.34285714285714286,
+        "recall": 0.5581395348837209,
+        "f1": 0.4247787610619469,
         "confusion_matrix": [
           [
+            1819,
+            138
           ],
           [
+            57,
+            72
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9696162046908315,
+            "recall": 0.9294839039345938,
+            "f1-score": 0.9491260109574745,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.34285714285714286,
+            "recall": 0.5581395348837209,
+            "f1-score": 0.4247787610619469,
+            "support": 129.0
           },
+          "accuracy": 0.9065196548418025,
           "macro avg": {
+            "precision": 0.6562366737739872,
+            "recall": 0.7438117194091574,
+            "f1-score": 0.6869523860097106,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9308568954978566,
+            "recall": 0.9065196548418025,
+            "f1-score": 0.9166999346216532,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.8210657033190336,
+        "average_precision": 0.47107353711983707
       }
     },
     {
       "artifact_dir": "/content/agri-utilization-classifier/baselines/embedding-logistic",
       "artifact_file": "/content/agri-utilization-classifier/baselines/embedding-logistic/embedding-logistic.joblib",
       "validation_best_threshold": {
+        "threshold": 0.7262281775474548,
+        "f1": 0.6881720430107527,
+        "precision": 0.6015037593984962,
+        "recall": 0.8040201005025126
       },
       "validation_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.8953934740882917,
+        "precision": 0.473972602739726,
+        "recall": 0.8693467336683417,
+        "f1": 0.6134751773049646,
         "confusion_matrix": [
           [
+            1693,
+            192
           ],
           [
+            26,
+            173
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9848749272833043,
+            "recall": 0.8981432360742706,
+            "f1-score": 0.939511653718091,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.473972602739726,
+            "recall": 0.8693467336683417,
+            "f1-score": 0.6134751773049646,
+            "support": 199.0
           },
+          "accuracy": 0.8953934740882917,
           "macro avg": {
+            "precision": 0.7294237650115152,
+            "recall": 0.8837449848713061,
+            "f1-score": 0.7764934155115277,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9360891486920508,
+            "recall": 0.8953934740882917,
+            "f1-score": 0.9083786120644383,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.951833437745758,
+        "average_precision": 0.6518934466014814
       },
       "validation_optimal_threshold": {
+        "threshold": 0.7262281775474548,
+        "accuracy": 0.9304222648752399,
+        "precision": 0.6015037593984962,
+        "recall": 0.8040201005025126,
+        "f1": 0.6881720430107527,
         "confusion_matrix": [
           [
+            1779,
+            106
           ],
           [
+            39,
+            160
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9785478547854786,
+            "recall": 0.9437665782493369,
+            "f1-score": 0.9608425600864164,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.6015037593984962,
+            "recall": 0.8040201005025126,
+            "f1-score": 0.6881720430107527,
+            "support": 199.0
           },
+          "accuracy": 0.9304222648752399,
           "macro avg": {
+            "precision": 0.7900258070919874,
+            "recall": 0.8738933393759247,
+            "f1-score": 0.8245073015485846,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9425441239879693,
+            "recall": 0.9304222648752399,
+            "f1-score": 0.9348054041852374,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.951833437745758,
+        "average_precision": 0.6518934466014814
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.8911792905081496,
+        "precision": 0.3496932515337423,
+        "recall": 0.8837209302325582,
+        "f1": 0.5010989010989011,
         "confusion_matrix": [
           [
+            1745,
+            212
           ],
           [
+            15,
+            114
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9914772727272727,
+            "recall": 0.8916709248850281,
+            "f1-score": 0.9389292440139898,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.3496932515337423,
+            "recall": 0.8837209302325582,
+            "f1-score": 0.5010989010989011,
+            "support": 129.0
           },
+          "accuracy": 0.8911792905081496,
           "macro avg": {
+            "precision": 0.6705852621305075,
+            "recall": 0.8876959275587931,
+            "f1-score": 0.7200140725564455,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9517888073706259,
+            "recall": 0.8911792905081496,
+            "f1-score": 0.911853446201887,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9507987625419385,
+        "average_precision": 0.5430515103343022
       },
       "test_optimal_threshold": {
+        "threshold": 0.7262281775474548,
+        "accuracy": 0.9285714285714286,
+        "precision": 0.4494949494949495,
+        "recall": 0.689922480620155,
+        "f1": 0.5443425076452599,
         "confusion_matrix": [
           [
+            1848,
+            109
           ],
           [
+            40,
+            89
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9788135593220338,
+            "recall": 0.9443025038323966,
+            "f1-score": 0.9612483745123537,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.4494949494949495,
+            "recall": 0.689922480620155,
+            "f1-score": 0.5443425076452599,
+            "support": 129.0
           },
+          "accuracy": 0.9285714285714286,
           "macro avg": {
+            "precision": 0.7141542544084917,
+            "recall": 0.8171124922262758,
+            "f1-score": 0.7527954410788068,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9460800498936092,
+            "recall": 0.9285714285714286,
+            "f1-score": 0.9354665639534586,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9507987625419385,
+        "average_precision": 0.5430515103343022
       }
     },
     {
       "artifact_dir": "/content/agri-utilization-classifier/baselines/embedding-svm",
       "artifact_file": "/content/agri-utilization-classifier/baselines/embedding-svm/embedding-svm.joblib",
       "validation_best_threshold": {
+        "threshold": 0.24490298824052611,
+        "f1": 0.7004608294930875,
+        "precision": 0.6468085106382979,
+        "recall": 0.7638190954773869
       },
       "validation_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9313819577735125,
+        "precision": 0.7121212121212122,
+        "recall": 0.4723618090452261,
+        "f1": 0.56797583081571,
         "confusion_matrix": [
           [
+            1847,
+            38
           ],
           [
+            105,
+            94
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9462090163934426,
+            "recall": 0.979840848806366,
+            "f1-score": 0.9627313004951785,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.7121212121212122,
+            "recall": 0.4723618090452261,
+            "f1-score": 0.56797583081571,
+            "support": 199.0
           },
+          "accuracy": 0.9313819577735125,
           "macro avg": {
+            "precision": 0.8291651142573273,
+            "recall": 0.726101328925796,
+            "f1-score": 0.7653535656554442,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9238561022618813,
+            "recall": 0.9313819577735125,
+            "f1-score": 0.9250363204250182,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.9535662396864961,
+        "average_precision": 0.6698106173212027
       },
       "validation_optimal_threshold": {
+        "threshold": 0.24490298824052611,
+        "accuracy": 0.9376199616122841,
+        "precision": 0.6468085106382979,
+        "recall": 0.7638190954773869,
+        "f1": 0.7004608294930875,
         "confusion_matrix": [
           [
+            1802,
+            83
           ],
           [
+            47,
+            152
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9745808545159546,
+            "recall": 0.9559681697612732,
+            "f1-score": 0.9651847884306374,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.6468085106382979,
+            "recall": 0.7638190954773869,
+            "f1-score": 0.7004608294930875,
+            "support": 199.0
           },
+          "accuracy": 0.9376199616122841,
           "macro avg": {
+            "precision": 0.8106946825771262,
+            "recall": 0.85989363261933,
+            "f1-score": 0.8328228089618624,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9432820558443357,
+            "recall": 0.9376199616122841,
+            "f1-score": 0.9399064449428386,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.9535662396864961,
+        "average_precision": 0.6698106173212027
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9482262703739214,
+        "precision": 0.6060606060606061,
+        "recall": 0.46511627906976744,
+        "f1": 0.5263157894736842,
         "confusion_matrix": [
           [
+            1918,
+            39
           ],
           [
+            69,
+            60
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.96527428283845,
+            "recall": 0.9800715380684721,
+            "f1-score": 0.9726166328600405,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.6060606060606061,
+            "recall": 0.46511627906976744,
+            "f1-score": 0.5263157894736842,
+            "support": 129.0
           },
+          "accuracy": 0.9482262703739214,
           "macro avg": {
+            "precision": 0.785667444449528,
+            "recall": 0.7225939085691198,
+            "f1-score": 0.7494662111668624,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9430602059907309,
+            "recall": 0.9482262703739214,
+            "f1-score": 0.9450170121520635,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9554768610394807,
+        "average_precision": 0.5656727259491919
       },
       "test_optimal_threshold": {
+        "threshold": 0.24490298824052611,
+        "accuracy": 0.9372003835091084,
+        "precision": 0.4943181818181818,
+        "recall": 0.6744186046511628,
+        "f1": 0.5704918032786885,
         "confusion_matrix": [
           [
+            1868,
+            89
           ],
           [
+            42,
+            87
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9780104712041885,
+            "recall": 0.9545222278998468,
+            "f1-score": 0.9661236100336178,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.4943181818181818,
+            "recall": 0.6744186046511628,
+            "f1-score": 0.5704918032786885,
+            "support": 129.0
           },
+          "accuracy": 0.9372003835091084,
           "macro avg": {
+            "precision": 0.7361643265111851,
+            "recall": 0.8144704162755048,
+            "f1-score": 0.7683077066561532,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9480985319276809,
+            "recall": 0.9372003835091084,
+            "f1-score": 0.9416574053014098,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9554768610394807,
+        "average_precision": 0.5656727259491919
       }
     },
     {
       "artifact_dir": "/content/agri-utilization-classifier/baselines/embedding-lightgbm",
       "artifact_file": "/content/agri-utilization-classifier/baselines/embedding-lightgbm/embedding-lightgbm.joblib",
       "validation_best_threshold": {
+        "threshold": 0.08937255699326424,
+        "f1": 0.7008547008547008,
+        "precision": 0.6096654275092936,
+        "recall": 0.8241206030150754
       },
       "validation_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9366602687140115,
+        "precision": 0.6810810810810811,
+        "recall": 0.6331658291457286,
+        "f1": 0.65625,
         "confusion_matrix": [
           [
+            1826,
+            59
           ],
           [
+            73,
+            126
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9615587151132174,
+            "recall": 0.9687002652519894,
+            "f1-score": 0.9651162790697675,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.6810810810810811,
+            "recall": 0.6331658291457286,
+            "f1-score": 0.65625,
+            "support": 199.0
           },
+          "accuracy": 0.9366602687140115,
           "macro avg": {
+            "precision": 0.8213198980971492,
+            "recall": 0.8009330471988589,
+            "f1-score": 0.8106831395348837,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9347760619594769,
+            "recall": 0.9366602687140115,
+            "f1-score": 0.9356228100031246,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.9537208589365928,
+        "average_precision": 0.6689450933330522
       },
       "validation_optimal_threshold": {
+        "threshold": 0.08937255699326424,
+        "accuracy": 0.9328214971209213,
+        "precision": 0.6096654275092936,
+        "recall": 0.8241206030150754,
+        "f1": 0.7008547008547008,
         "confusion_matrix": [
           [
+            1780,
+            105
           ],
           [
+            35,
+            164
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9807162534435262,
+            "recall": 0.9442970822281167,
+            "f1-score": 0.9621621621621622,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.6096654275092936,
+            "recall": 0.8241206030150754,
+            "f1-score": 0.7008547008547008,
+            "support": 199.0
           },
+          "accuracy": 0.9328214971209213,
           "macro avg": {
+            "precision": 0.7951908404764099,
+            "recall": 0.884208842621596,
+            "f1-score": 0.8315084315084316,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.945284816610075,
+            "recall": 0.9328214971209213,
+            "f1-score": 0.9372100581313634,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.9537208589365928,
+        "average_precision": 0.6689450933330522
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9482262703739214,
+        "precision": 0.5789473684210527,
+        "recall": 0.5968992248062015,
+        "f1": 0.5877862595419847,
         "confusion_matrix": [
           [
+            1901,
+            56
           ],
           [
+            52,
+            77
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9733742959549411,
+            "recall": 0.9713847726111395,
+            "f1-score": 0.972378516624041,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.5789473684210527,
+            "recall": 0.5968992248062015,
+            "f1-score": 0.5877862595419847,
+            "support": 129.0
           },
+          "accuracy": 0.9482262703739214,
           "macro avg": {
+            "precision": 0.7761608321879969,
+            "recall": 0.7841419987086705,
+            "f1-score": 0.7800823880830128,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.948982601970343,
+            "recall": 0.9482262703739214,
+            "f1-score": 0.9485950069578927,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9484498104597687,
+        "average_precision": 0.5852438412769653
       },
       "test_optimal_threshold": {
+        "threshold": 0.08937255699326424,
+        "accuracy": 0.9324065196548418,
+        "precision": 0.4716981132075472,
+        "recall": 0.7751937984496124,
+        "f1": 0.5865102639296188,
         "confusion_matrix": [
           [
+            1845,
+            112
           ],
           [
+            29,
+            100
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9845250800426895,
+            "recall": 0.942769545222279,
+            "f1-score": 0.9631949882537196,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.4716981132075472,
+            "recall": 0.7751937984496124,
+            "f1-score": 0.5865102639296188,
+            "support": 129.0
           },
+          "accuracy": 0.9324065196548418,
           "macro avg": {
+            "precision": 0.7281115966251184,
+            "recall": 0.8589816718359458,
+            "f1-score": 0.7748526260916693,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9528114277312162,
+            "recall": 0.9324065196548418,
+            "f1-score": 0.9399004870850672,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9484498104597687,
+        "average_precision": 0.5852438412769653
       }
     },
     {
       "model_name": "FacebookAI/xlm-roberta-base",
       "artifact_dir": "/content/agri-utilization-classifier/transformer",
       "validation_best_threshold": {
+        "threshold": 0.5436205267906189,
+        "f1": 0.6983372921615203,
+        "precision": 0.6621621621621622,
+        "recall": 0.7386934673366834
       },
       "validation_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9376199616122841,
+        "precision": 0.6533333333333333,
+        "recall": 0.7386934673366834,
+        "f1": 0.6933962264150944,
         "confusion_matrix": [
           [
+            1807,
+            78
           ],
           [
+            52,
+            147
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.972027972027972,
+            "recall": 0.9586206896551724,
+            "f1-score": 0.9652777777777778,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.6533333333333333,
+            "recall": 0.7386934673366834,
+            "f1-score": 0.6933962264150944,
+            "support": 199.0
           },
+          "accuracy": 0.9376199616122841,
           "macro avg": {
+            "precision": 0.8126806526806527,
+            "recall": 0.848657078495928,
+            "f1-score": 0.8293370020964361,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9415959983714303,
+            "recall": 0.9376199616122841,
+            "f1-score": 0.9393159597733756,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.9544433040534235,
+        "average_precision": 0.7261778718910262
       },
       "validation_optimal_threshold": {
+        "threshold": 0.5436205267906189,
+        "accuracy": 0.9390595009596929,
+        "precision": 0.6621621621621622,
+        "recall": 0.7386934673366834,
+        "f1": 0.6983372921615202,
         "confusion_matrix": [
           [
+            1810,
+            75
           ],
           [
+            52,
+            147
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9720730397422127,
+            "recall": 0.9602122015915119,
+            "f1-score": 0.9661062183079797,
+            "support": 1885.0
           },
           "RELEVANT": {
+            "precision": 0.6621621621621622,
+            "recall": 0.7386934673366834,
+            "f1-score": 0.6983372921615202,
+            "support": 199.0
           },
+          "accuracy": 0.9390595009596929,
           "macro avg": {
+            "precision": 0.8171176009521874,
+            "recall": 0.8494528344640977,
+            "f1-score": 0.83222175523475,
+            "support": 2084.0
           },
           "weighted avg": {
+            "precision": 0.9424798225452693,
+            "recall": 0.9390595009596929,
+            "f1-score": 0.9405371125962977,
+            "support": 2084.0
           }
         },
+        "roc_auc": 0.9544433040534235,
+        "average_precision": 0.7261778718910262
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.9429530201342282,
+        "precision": 0.532051282051282,
+        "recall": 0.6434108527131783,
+        "f1": 0.5824561403508772,
         "confusion_matrix": [
           [
+            1884,
+            73
           ],
           [
+            46,
+            83
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9761658031088083,
+            "recall": 0.9626980071538068,
+            "f1-score": 0.969385129920247,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.532051282051282,
+            "recall": 0.6434108527131783,
+            "f1-score": 0.5824561403508772,
+            "support": 129.0
           },
+          "accuracy": 0.9429530201342282,
           "macro avg": {
+            "precision": 0.7541085425800451,
+            "recall": 0.8030544299334925,
+            "f1-score": 0.7759206351355621,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.9487013864182902,
+            "recall": 0.9429530201342282,
+            "f1-score": 0.9454571147455353,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9314030730472604,
+        "average_precision": 0.4996827419378796
       },
       "test_optimal_threshold": {
+        "threshold": 0.5436205267906189,
+        "accuracy": 0.9424736337488016,
+        "precision": 0.5290322580645161,
+        "recall": 0.6356589147286822,
+        "f1": 0.5774647887323944,
         "confusion_matrix": [
           [
+            1884,
+            73
           ],
           [
+            47,
+            82
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9756602796478508,
+            "recall": 0.9626980071538068,
+            "f1-score": 0.9691358024691358,
+            "support": 1957.0
           },
           "RELEVANT": {
+            "precision": 0.5290322580645161,
+            "recall": 0.6356589147286822,
+            "f1-score": 0.5774647887323944,
+            "support": 129.0
           },
+          "accuracy": 0.9424736337488016,
           "macro avg": {
+            "precision": 0.7523462688561835,
+            "recall": 0.7991784609412445,
+            "f1-score": 0.7733002956007651,
+            "support": 2086.0
           },
           "weighted avg": {
+            "precision": 0.948040425964126,
+            "recall": 0.9424736337488016,
+            "f1-score": 0.944914536518973,
+            "support": 2086.0
           }
         },
+        "roc_auc": 0.9314030730472604,
+        "average_precision": 0.4996827419378796
       }
     }
   ]

transformer/checkpoint-1220/config.json CHANGED Viewed

@@ -32,7 +32,7 @@
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
-  "transformers_version": "5.9.0",
   "type_vocab_size": 1,
   "use_cache": false,
   "vocab_size": 250002

   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
+  "transformers_version": "5.10.2",
   "type_vocab_size": 1,
   "use_cache": false,
   "vocab_size": 250002

transformer/checkpoint-1220/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b248f60ff3e153b28949243967a2debde809912442c1ef5fe19d89dad891f1f9
 size 1112205008

 version https://git-lfs.github.com/spec/v1
+oid sha256:68cfdbf41602bef3dad433cc9d7341026e15b6212a2de26b87cb1b08c92fe53a
 size 1112205008

transformer/checkpoint-1220/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f731780f8bff3652e23ff4cf1692c96c1068919f515c85113ffd987765be34ce
 size 2224532875

 version https://git-lfs.github.com/spec/v1
+oid sha256:b157f469e91a6d944690dc04579dbfd1df4cb7df1828e6737dc78b7100c6c9bd
 size 2224532875

transformer/checkpoint-1220/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e47023fdf7fee85f2c66207ee2960719b8bf1b11c2d946d75e0d2fe33113c7ce
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:d539b8d76c8001da486adb60fe77a06b1ad89abe54968b00e74e6fe0a65f76a4
 size 14645

transformer/checkpoint-1220/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f2e11cad5f2deee13f6148971cf1c6ded27d5cbdc725a37902243981a6125a17
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:f0d6ec924d72ca240bed6d2851cb98eda1484e26fe7cbfd21e9c5ca01087e280
 size 1383

transformer/checkpoint-1220/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f6adfd2a8e363fb5adf050a01658d698ef3da72d5e9b197063c5e3b6a0fe9333
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9b7df4afd103514fe9d65c0bed1c50f1ab1e4c492ac4aaea616afc5f70bab7e
 size 1465

transformer/checkpoint-1220/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-  "best_global_step": 915,
-  "best_metric": 0.8220858895705522,
-  "best_model_checkpoint": "/content/agri-utilization-classifier/transformer/checkpoint-915",
-  "epoch": 4.0,
   "eval_steps": 500,
   "global_step": 1220,
   "is_hyper_param_search": false,
@@ -10,396 +10,370 @@
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.08196721311475409,
-      "grad_norm": 6.055062770843506,
-      "learning_rate": 3.157894736842105e-06,
-      "loss": 0.62972900390625,
       "step": 25
     },
     {
-      "epoch": 0.16393442622950818,
-      "grad_norm": 10.6914701461792,
-      "learning_rate": 6.447368421052632e-06,
-      "loss": 0.44850738525390627,
       "step": 50
     },
     {
-      "epoch": 0.2459016393442623,
-      "grad_norm": 6.670228481292725,
-      "learning_rate": 9.736842105263159e-06,
-      "loss": 0.3566379165649414,
       "step": 75
     },
     {
-      "epoch": 0.32786885245901637,
-      "grad_norm": 2.589911937713623,
-      "learning_rate": 1.3026315789473684e-05,
-      "loss": 0.2718839645385742,
       "step": 100
     },
     {
-      "epoch": 0.4098360655737705,
-      "grad_norm": 22.02676773071289,
-      "learning_rate": 1.6315789473684213e-05,
-      "loss": 0.1922766876220703,
       "step": 125
     },
     {
-      "epoch": 0.4918032786885246,
-      "grad_norm": 2.6362855434417725,
-      "learning_rate": 1.960526315789474e-05,
-      "loss": 0.1837622833251953,
       "step": 150
     },
     {
-      "epoch": 0.5737704918032787,
-      "grad_norm": 3.478484630584717,
-      "learning_rate": 1.9679533867443555e-05,
-      "loss": 0.18766048431396484,
       "step": 175
     },
     {
-      "epoch": 0.6557377049180327,
-      "grad_norm": 8.077605247497559,
-      "learning_rate": 1.9315367807720323e-05,
-      "loss": 0.23830581665039063,
       "step": 200
     },
     {
-      "epoch": 0.7377049180327869,
-      "grad_norm": 0.7427046298980713,
-      "learning_rate": 1.8951201747997088e-05,
-      "loss": 0.30742517471313474,
       "step": 225
     },
     {
-      "epoch": 0.819672131147541,
-      "grad_norm": 36.34975051879883,
-      "learning_rate": 1.8587035688273852e-05,
-      "loss": 0.22336017608642578,
       "step": 250
     },
     {
-      "epoch": 0.9016393442622951,
-      "grad_norm": 5.215510845184326,
-      "learning_rate": 1.822286962855062e-05,
-      "loss": 0.13779294967651368,
       "step": 275
     },
     {
-      "epoch": 0.9836065573770492,
-      "grad_norm": 3.551121950149536,
-      "learning_rate": 1.7858703568827385e-05,
-      "loss": 0.19200111389160157,
       "step": 300
     },
     {
-      "epoch": 1.0,
-      "eval_accuracy": 0.9631901840490797,
-      "eval_f1": 0.7721518987341772,
-      "eval_loss": 0.1292734444141388,
-      "eval_precision": 0.7721518987341772,
-      "eval_recall": 0.7721518987341772,
-      "eval_roc_auc": 0.9563720589684741,
-      "eval_runtime": 3.3396,
-      "eval_samples_per_second": 292.853,
-      "eval_steps_per_second": 9.283,
-      "step": 305
-    },
-    {
-      "epoch": 1.0655737704918034,
-      "grad_norm": 0.5402449369430542,
-      "learning_rate": 1.7494537509104153e-05,
-      "loss": 0.1241053295135498,
       "step": 325
     },
     {
-      "epoch": 1.1475409836065573,
-      "grad_norm": 4.476892948150635,
-      "learning_rate": 1.7130371449380918e-05,
-      "loss": 0.20724605560302733,
       "step": 350
     },
     {
-      "epoch": 1.2295081967213115,
-      "grad_norm": 0.46729782223701477,
-      "learning_rate": 1.6766205389657686e-05,
-      "loss": 0.13567353248596192,
       "step": 375
     },
     {
-      "epoch": 1.3114754098360657,
-      "grad_norm": 0.1852118819952011,
-      "learning_rate": 1.640203932993445e-05,
-      "loss": 0.13295170783996582,
       "step": 400
     },
     {
-      "epoch": 1.3934426229508197,
-      "grad_norm": 1.2681413888931274,
-      "learning_rate": 1.603787327021122e-05,
-      "loss": 0.2027936363220215,
       "step": 425
     },
     {
-      "epoch": 1.4754098360655736,
-      "grad_norm": 7.484091281890869,
-      "learning_rate": 1.5673707210487983e-05,
-      "loss": 0.12364128112792969,
       "step": 450
     },
     {
-      "epoch": 1.5573770491803278,
-      "grad_norm": 0.46489500999450684,
-      "learning_rate": 1.530954115076475e-05,
-      "loss": 0.14407362937927246,
       "step": 475
     },
     {
-      "epoch": 1.639344262295082,
-      "grad_norm": 0.20967872440814972,
-      "learning_rate": 1.4945375091041516e-05,
-      "loss": 0.12458925247192383,
       "step": 500
     },
     {
-      "epoch": 1.721311475409836,
-      "grad_norm": 0.1643747240304947,
-      "learning_rate": 1.4581209031318282e-05,
-      "loss": 0.21631996154785157,
       "step": 525
     },
     {
-      "epoch": 1.8032786885245902,
-      "grad_norm": 7.073329448699951,
-      "learning_rate": 1.4217042971595047e-05,
-      "loss": 0.16043865203857421,
       "step": 550
     },
     {
-      "epoch": 1.8852459016393444,
-      "grad_norm": 1.744958758354187,
-      "learning_rate": 1.3852876911871815e-05,
-      "loss": 0.0966644287109375,
       "step": 575
     },
     {
-      "epoch": 1.9672131147540983,
-      "grad_norm": 12.79035472869873,
-      "learning_rate": 1.3488710852148582e-05,
-      "loss": 0.15884541511535644,
       "step": 600
     },
     {
-      "epoch": 2.0,
-      "eval_accuracy": 0.9611451942740287,
-      "eval_f1": 0.7432432432432432,
-      "eval_loss": 0.13287827372550964,
-      "eval_precision": 0.7971014492753623,
-      "eval_recall": 0.6962025316455697,
-      "eval_roc_auc": 0.9594697343039381,
-      "eval_runtime": 3.2739,
-      "eval_samples_per_second": 298.727,
-      "eval_steps_per_second": 9.469,
       "step": 610
     },
     {
-      "epoch": 2.0491803278688523,
-      "grad_norm": 17.520444869995117,
-      "learning_rate": 1.3124544792425346e-05,
-      "loss": 0.08896012306213379,
       "step": 625
     },
     {
-      "epoch": 2.1311475409836067,
-      "grad_norm": 0.16623224318027496,
-      "learning_rate": 1.2760378732702113e-05,
-      "loss": 0.11752216339111328,
       "step": 650
     },
     {
-      "epoch": 2.2131147540983607,
-      "grad_norm": 0.20762814581394196,
-      "learning_rate": 1.239621267297888e-05,
-      "loss": 0.1193038272857666,
       "step": 675
     },
     {
-      "epoch": 2.2950819672131146,
-      "grad_norm": 0.1500111073255539,
-      "learning_rate": 1.2032046613255645e-05,
-      "loss": 0.0630855655670166,
       "step": 700
     },
     {
-      "epoch": 2.3770491803278686,
-      "grad_norm": 0.17727839946746826,
-      "learning_rate": 1.1667880553532412e-05,
-      "loss": 0.08730959892272949,
       "step": 725
     },
     {
-      "epoch": 2.459016393442623,
-      "grad_norm": 4.3997321128845215,
-      "learning_rate": 1.1303714493809176e-05,
-      "loss": 0.12114215850830078,
       "step": 750
     },
     {
-      "epoch": 2.540983606557377,
-      "grad_norm": 34.47224044799805,
-      "learning_rate": 1.0939548434085944e-05,
-      "loss": 0.11070786476135254,
       "step": 775
     },
     {
-      "epoch": 2.6229508196721314,
-      "grad_norm": 25.977081298828125,
-      "learning_rate": 1.057538237436271e-05,
-      "loss": 0.10845686912536621,
       "step": 800
     },
     {
-      "epoch": 2.7049180327868854,
-      "grad_norm": 0.1657736450433731,
-      "learning_rate": 1.0211216314639475e-05,
-      "loss": 0.1025285530090332,
       "step": 825
     },
     {
-      "epoch": 2.7868852459016393,
-      "grad_norm": 34.05498504638672,
-      "learning_rate": 9.847050254916243e-06,
-      "loss": 0.07825160026550293,
       "step": 850
     },
     {
-      "epoch": 2.8688524590163933,
-      "grad_norm": 0.2868161201477051,
-      "learning_rate": 9.482884195193008e-06,
-      "loss": 0.12041816711425782,
       "step": 875
     },
     {
-      "epoch": 2.9508196721311473,
-      "grad_norm": 0.19192977249622345,
-      "learning_rate": 9.118718135469774e-06,
-      "loss": 0.08709416389465333,
       "step": 900
     },
     {
-      "epoch": 3.0,
-      "eval_accuracy": 0.9703476482617587,
-      "eval_f1": 0.8220858895705522,
-      "eval_loss": 0.11163181066513062,
-      "eval_precision": 0.7976190476190477,
-      "eval_recall": 0.8481012658227848,
-      "eval_roc_auc": 0.9661086157615353,
-      "eval_runtime": 3.1733,
-      "eval_samples_per_second": 308.193,
-      "eval_steps_per_second": 9.769,
-      "step": 915
-    },
-    {
-      "epoch": 3.0327868852459017,
-      "grad_norm": 1.0706992149353027,
-      "learning_rate": 8.754552075746541e-06,
-      "loss": 0.10751664161682128,
       "step": 925
     },
     {
-      "epoch": 3.1147540983606556,
-      "grad_norm": 0.12844231724739075,
-      "learning_rate": 8.390386016023307e-06,
-      "loss": 0.06818144798278808,
       "step": 950
     },
     {
-      "epoch": 3.19672131147541,
-      "grad_norm": 0.07692205160856247,
-      "learning_rate": 8.026219956300074e-06,
-      "loss": 0.12229555130004882,
       "step": 975
     },
     {
-      "epoch": 3.278688524590164,
-      "grad_norm": 1.773990511894226,
-      "learning_rate": 7.66205389657684e-06,
-      "loss": 0.06936595916748046,
       "step": 1000
     },
     {
-      "epoch": 3.360655737704918,
-      "grad_norm": 0.07844381034374237,
-      "learning_rate": 7.2978878368536055e-06,
-      "loss": 0.05219663143157959,
       "step": 1025
     },
     {
-      "epoch": 3.442622950819672,
-      "grad_norm": 12.502548217773438,
-      "learning_rate": 6.933721777130372e-06,
-      "loss": 0.06849228858947753,
       "step": 1050
     },
     {
-      "epoch": 3.5245901639344264,
-      "grad_norm": 1.6993861198425293,
-      "learning_rate": 6.569555717407138e-06,
-      "loss": 0.08783550262451172,
       "step": 1075
     },
     {
-      "epoch": 3.6065573770491803,
-      "grad_norm": 0.06551510095596313,
-      "learning_rate": 6.2053896576839045e-06,
-      "loss": 0.049420347213745115,
       "step": 1100
     },
     {
-      "epoch": 3.6885245901639343,
-      "grad_norm": 0.034276798367500305,
-      "learning_rate": 5.84122359796067e-06,
-      "loss": 0.05244039058685303,
       "step": 1125
     },
     {
-      "epoch": 3.7704918032786887,
-      "grad_norm": 10.901683807373047,
-      "learning_rate": 5.477057538237437e-06,
-      "loss": 0.06656317710876465,
       "step": 1150
     },
     {
-      "epoch": 3.8524590163934427,
-      "grad_norm": 2.3856894969940186,
-      "learning_rate": 5.112891478514203e-06,
-      "loss": 0.06277508735656738,
       "step": 1175
     },
     {
-      "epoch": 3.9344262295081966,
-      "grad_norm": 0.018699949607253075,
-      "learning_rate": 4.748725418790969e-06,
-      "loss": 0.046858911514282224,
       "step": 1200
     },
     {
-      "epoch": 4.0,
-      "eval_accuracy": 0.9662576687116564,
-      "eval_f1": 0.8047337278106509,
-      "eval_loss": 0.14547723531723022,
-      "eval_precision": 0.7555555555555555,
-      "eval_recall": 0.8607594936708861,
-      "eval_roc_auc": 0.9600822291998141,
-      "eval_runtime": 3.1883,
-      "eval_samples_per_second": 306.745,
-      "eval_steps_per_second": 9.723,
       "step": 1220
     }
   ],
   "logging_steps": 25,
-  "max_steps": 1525,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 5,
   "save_steps": 500,
@@ -424,7 +398,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2566385233981440.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
+  "best_global_step": 610,
+  "best_metric": 0.6933962264150944,
+  "best_model_checkpoint": "/content/agri-utilization-classifier/transformer/checkpoint-610",
+  "epoch": 2.0,
   "eval_steps": 500,
   "global_step": 1220,
   "is_hyper_param_search": false,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.040983606557377046,
+      "grad_norm": 3.1041932106018066,
+      "learning_rate": 1.573770491803279e-06,
+      "loss": 0.526744384765625,
       "step": 25
     },
     {
+      "epoch": 0.08196721311475409,
+      "grad_norm": 4.816498279571533,
+      "learning_rate": 3.213114754098361e-06,
+      "loss": 0.46380462646484377,
       "step": 50
     },
     {
+      "epoch": 0.12295081967213115,
+      "grad_norm": 5.105863571166992,
+      "learning_rate": 4.8524590163934435e-06,
+      "loss": 0.3628129577636719,
       "step": 75
     },
     {
+      "epoch": 0.16393442622950818,
+      "grad_norm": 3.479628324508667,
+      "learning_rate": 6.491803278688526e-06,
+      "loss": 0.3321057891845703,
       "step": 100
     },
     {
+      "epoch": 0.20491803278688525,
+      "grad_norm": 5.271286487579346,
+      "learning_rate": 8.131147540983607e-06,
+      "loss": 0.29200584411621094,
       "step": 125
     },
     {
+      "epoch": 0.2459016393442623,
+      "grad_norm": 2.9103591442108154,
+      "learning_rate": 9.770491803278689e-06,
+      "loss": 0.20765865325927735,
       "step": 150
     },
     {
+      "epoch": 0.28688524590163933,
+      "grad_norm": 5.441774845123291,
+      "learning_rate": 1.1409836065573771e-05,
+      "loss": 0.22107566833496095,
       "step": 175
     },
     {
+      "epoch": 0.32786885245901637,
+      "grad_norm": 17.181110382080078,
+      "learning_rate": 1.3049180327868853e-05,
+      "loss": 0.22224016189575196,
       "step": 200
     },
     {
+      "epoch": 0.36885245901639346,
+      "grad_norm": 5.543371677398682,
+      "learning_rate": 1.4688524590163935e-05,
+      "loss": 0.20201002120971678,
       "step": 225
     },
     {
+      "epoch": 0.4098360655737705,
+      "grad_norm": 5.812751770019531,
+      "learning_rate": 1.6327868852459016e-05,
+      "loss": 0.2299608612060547,
       "step": 250
     },
     {
+      "epoch": 0.45081967213114754,
+      "grad_norm": 2.845670461654663,
+      "learning_rate": 1.79672131147541e-05,
+      "loss": 0.21673511505126952,
       "step": 275
     },
     {
+      "epoch": 0.4918032786885246,
+      "grad_norm": 18.98938751220703,
+      "learning_rate": 1.9606557377049183e-05,
+      "loss": 0.21523273468017579,
       "step": 300
     },
     {
+      "epoch": 0.5327868852459017,
+      "grad_norm": 5.82402229309082,
+      "learning_rate": 1.9861566484517306e-05,
+      "loss": 0.15432929039001464,
       "step": 325
     },
     {
+      "epoch": 0.5737704918032787,
+      "grad_norm": 0.48278993368148804,
+      "learning_rate": 1.9679417122040073e-05,
+      "loss": 0.16572830200195313,
       "step": 350
     },
     {
+      "epoch": 0.6147540983606558,
+      "grad_norm": 5.946134567260742,
+      "learning_rate": 1.9497267759562843e-05,
+      "loss": 0.17543071746826172,
       "step": 375
     },
     {
+      "epoch": 0.6557377049180327,
+      "grad_norm": 13.494661331176758,
+      "learning_rate": 1.9315118397085614e-05,
+      "loss": 0.15327459335327148,
       "step": 400
     },
     {
+      "epoch": 0.6967213114754098,
+      "grad_norm": 9.058329582214355,
+      "learning_rate": 1.913296903460838e-05,
+      "loss": 0.19322505950927735,
       "step": 425
     },
     {
+      "epoch": 0.7377049180327869,
+      "grad_norm": 9.420262336730957,
+      "learning_rate": 1.895081967213115e-05,
+      "loss": 0.18702877044677735,
       "step": 450
     },
     {
+      "epoch": 0.7786885245901639,
+      "grad_norm": 0.29203546047210693,
+      "learning_rate": 1.8768670309653917e-05,
+      "loss": 0.13424430847167967,
       "step": 475
     },
     {
+      "epoch": 0.819672131147541,
+      "grad_norm": 5.464226245880127,
+      "learning_rate": 1.8586520947176687e-05,
+      "loss": 0.1403522300720215,
       "step": 500
     },
     {
+      "epoch": 0.860655737704918,
+      "grad_norm": 0.3305734395980835,
+      "learning_rate": 1.8404371584699454e-05,
+      "loss": 0.1768626403808594,
       "step": 525
     },
     {
+      "epoch": 0.9016393442622951,
+      "grad_norm": 6.791965007781982,
+      "learning_rate": 1.8222222222222224e-05,
+      "loss": 0.22005313873291016,
       "step": 550
     },
     {
+      "epoch": 0.9426229508196722,
+      "grad_norm": 3.971740484237671,
+      "learning_rate": 1.804007285974499e-05,
+      "loss": 0.17844413757324218,
       "step": 575
     },
     {
+      "epoch": 0.9836065573770492,
+      "grad_norm": 1.6787421703338623,
+      "learning_rate": 1.785792349726776e-05,
+      "loss": 0.16104537963867188,
       "step": 600
     },
     {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9376199616122841,
+      "eval_f1": 0.6933962264150944,
+      "eval_loss": 0.17767289280891418,
+      "eval_precision": 0.6533333333333333,
+      "eval_recall": 0.7386934673366834,
+      "eval_roc_auc": 0.9544433040534235,
+      "eval_runtime": 8.7237,
+      "eval_samples_per_second": 238.89,
+      "eval_steps_per_second": 7.566,
       "step": 610
     },
     {
+      "epoch": 1.0245901639344261,
+      "grad_norm": 5.573081016540527,
+      "learning_rate": 1.7675774134790528e-05,
+      "loss": 0.10441858291625977,
       "step": 625
     },
     {
+      "epoch": 1.0655737704918034,
+      "grad_norm": 0.11036327481269836,
+      "learning_rate": 1.7493624772313298e-05,
+      "loss": 0.16641632080078125,
       "step": 650
     },
     {
+      "epoch": 1.1065573770491803,
+      "grad_norm": 6.172032833099365,
+      "learning_rate": 1.731147540983607e-05,
+      "loss": 0.14472474098205568,
       "step": 675
     },
     {
+      "epoch": 1.1475409836065573,
+      "grad_norm": 5.863953113555908,
+      "learning_rate": 1.7129326047358835e-05,
+      "loss": 0.1113892936706543,
       "step": 700
     },
     {
+      "epoch": 1.1885245901639343,
+      "grad_norm": 0.25357893109321594,
+      "learning_rate": 1.6947176684881602e-05,
+      "loss": 0.12171897888183594,
       "step": 725
     },
     {
+      "epoch": 1.2295081967213115,
+      "grad_norm": 4.559972763061523,
+      "learning_rate": 1.6765027322404372e-05,
+      "loss": 0.08190732002258301,
       "step": 750
     },
     {
+      "epoch": 1.2704918032786885,
+      "grad_norm": 5.443191051483154,
+      "learning_rate": 1.6582877959927142e-05,
+      "loss": 0.06097976684570312,
       "step": 775
     },
     {
+      "epoch": 1.3114754098360657,
+      "grad_norm": 7.672996997833252,
+      "learning_rate": 1.6400728597449912e-05,
+      "loss": 0.09989359855651855,
       "step": 800
     },
     {
+      "epoch": 1.3524590163934427,
+      "grad_norm": 0.30564695596694946,
+      "learning_rate": 1.621857923497268e-05,
+      "loss": 0.08488804817199708,
       "step": 825
     },
     {
+      "epoch": 1.3934426229508197,
+      "grad_norm": 0.5056689977645874,
+      "learning_rate": 1.6036429872495446e-05,
+      "loss": 0.15551289558410644,
       "step": 850
     },
     {
+      "epoch": 1.4344262295081966,
+      "grad_norm": 0.06402106583118439,
+      "learning_rate": 1.5854280510018216e-05,
+      "loss": 0.1194021987915039,
       "step": 875
     },
     {
+      "epoch": 1.4754098360655736,
+      "grad_norm": 0.8240995407104492,
+      "learning_rate": 1.5672131147540986e-05,
+      "loss": 0.11723342895507813,
       "step": 900
     },
     {
+      "epoch": 1.5163934426229508,
+      "grad_norm": 0.07588805258274078,
+      "learning_rate": 1.5489981785063753e-05,
+      "loss": 0.12805092811584473,
       "step": 925
     },
     {
+      "epoch": 1.5573770491803278,
+      "grad_norm": 29.323896408081055,
+      "learning_rate": 1.5307832422586523e-05,
+      "loss": 0.15534672737121583,
       "step": 950
     },
     {
+      "epoch": 1.598360655737705,
+      "grad_norm": 11.02952766418457,
+      "learning_rate": 1.512568306010929e-05,
+      "loss": 0.1811429214477539,
       "step": 975
     },
     {
+      "epoch": 1.639344262295082,
+      "grad_norm": 0.9738644957542419,
+      "learning_rate": 1.494353369763206e-05,
+      "loss": 0.1270007610321045,
       "step": 1000
     },
     {
+      "epoch": 1.680327868852459,
+      "grad_norm": 2.311349630355835,
+      "learning_rate": 1.4761384335154829e-05,
+      "loss": 0.1843573570251465,
       "step": 1025
     },
     {
+      "epoch": 1.721311475409836,
+      "grad_norm": 7.105762004852295,
+      "learning_rate": 1.4579234972677595e-05,
+      "loss": 0.15470240592956544,
       "step": 1050
     },
     {
+      "epoch": 1.762295081967213,
+      "grad_norm": 9.120081901550293,
+      "learning_rate": 1.4397085610200366e-05,
+      "loss": 0.1170622444152832,
       "step": 1075
     },
     {
+      "epoch": 1.8032786885245902,
+      "grad_norm": 0.09794076532125473,
+      "learning_rate": 1.4214936247723134e-05,
+      "loss": 0.14307721138000487,
       "step": 1100
     },
     {
+      "epoch": 1.8442622950819674,
+      "grad_norm": 10.330300331115723,
+      "learning_rate": 1.4032786885245904e-05,
+      "loss": 0.15037315368652343,
       "step": 1125
     },
     {
+      "epoch": 1.8852459016393444,
+      "grad_norm": 0.7867186069488525,
+      "learning_rate": 1.3850637522768671e-05,
+      "loss": 0.10941274642944336,
       "step": 1150
     },
     {
+      "epoch": 1.9262295081967213,
+      "grad_norm": 7.952847003936768,
+      "learning_rate": 1.366848816029144e-05,
+      "loss": 0.1380799674987793,
       "step": 1175
     },
     {
+      "epoch": 1.9672131147540983,
+      "grad_norm": 11.602045059204102,
+      "learning_rate": 1.348633879781421e-05,
+      "loss": 0.07221244812011719,
       "step": 1200
     },
     {
+      "epoch": 2.0,
+      "eval_accuracy": 0.935700575815739,
+      "eval_f1": 0.6854460093896714,
+      "eval_loss": 0.24323046207427979,
+      "eval_precision": 0.6431718061674009,
+      "eval_recall": 0.7336683417085427,
+      "eval_roc_auc": 0.9480599282886581,
+      "eval_runtime": 8.6243,
+      "eval_samples_per_second": 241.642,
+      "eval_steps_per_second": 7.653,
       "step": 1220
     }
   ],
   "logging_steps": 25,
+  "max_steps": 3050,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 5,
   "save_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 2566122122926080.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

transformer/checkpoint-1220/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c60366894b25ead0379e8d97e61f1123e1ad4786f5e41a8bc70f2d7bc8901f5
-size 5329

 version https://git-lfs.github.com/spec/v1
+oid sha256:26170ff2d75562c83f88182ac9301ad3566752c384b38d15219d8c3352efbebb
+size 5201

transformer/checkpoint-1830/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "add_cross_attention": false,
+  "architectures": [
+    "XLMRobertaForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "dtype": "float32",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "NOT_RELEVANT",
+    "1": "RELEVANT"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
+  "label2id": {
+    "NOT_RELEVANT": 0,
+    "RELEVANT": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "tie_word_embeddings": true,
+  "transformers_version": "5.10.2",
+  "type_vocab_size": 1,
+  "use_cache": false,
+  "vocab_size": 250002
+}

transformer/checkpoint-1830/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f2d36571bab40691e34928937e3b6273dc9f93cd7ff5063c0b0f56f6c81c617e
+size 1112205008

transformer/checkpoint-1830/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd40f5b113902e4d4d3cafce7879adf4a0cd4adc135b994b1df34ea3f00be36d
+size 2224532875

transformer/checkpoint-1830/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:396753321c3a3c714b0c16546663b596b2b7dc320914daeff4f4502205877de5
+size 14645

transformer/checkpoint-1830/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e491b7c283e1accd9af8c8149230ddc3a5c9734dc7607b730682b67947f9d5a
+size 1383

transformer/checkpoint-1830/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:54b2dfae694f5d9051517fe489620541ef50f0d13ff4da58515c39d36e6dbf34
+size 1465

transformer/checkpoint-1830/tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc02d42fb2a10276563109e2287cc0dbe6b595d5b3b3401c7cfeffc0b7e20270
+size 17098351

transformer/checkpoint-1830/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "add_prefix_space": true,
+  "backend": "tokenizers",
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "is_local": false,
+  "local_files_only": false,
+  "mask_token": "<mask>",
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}

transformer/checkpoint-1830/trainer_state.json ADDED Viewed

	@@ -0,0 +1,593 @@

+{
+  "best_global_step": 610,
+  "best_metric": 0.6933962264150944,
+  "best_model_checkpoint": "/content/agri-utilization-classifier/transformer/checkpoint-610",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 1830,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.040983606557377046,
+      "grad_norm": 3.1041932106018066,
+      "learning_rate": 1.573770491803279e-06,
+      "loss": 0.526744384765625,
+      "step": 25
+    },
+    {
+      "epoch": 0.08196721311475409,
+      "grad_norm": 4.816498279571533,
+      "learning_rate": 3.213114754098361e-06,
+      "loss": 0.46380462646484377,
+      "step": 50
+    },
+    {
+      "epoch": 0.12295081967213115,
+      "grad_norm": 5.105863571166992,
+      "learning_rate": 4.8524590163934435e-06,
+      "loss": 0.3628129577636719,
+      "step": 75
+    },
+    {
+      "epoch": 0.16393442622950818,
+      "grad_norm": 3.479628324508667,
+      "learning_rate": 6.491803278688526e-06,
+      "loss": 0.3321057891845703,
+      "step": 100
+    },
+    {
+      "epoch": 0.20491803278688525,
+      "grad_norm": 5.271286487579346,
+      "learning_rate": 8.131147540983607e-06,
+      "loss": 0.29200584411621094,
+      "step": 125
+    },
+    {
+      "epoch": 0.2459016393442623,
+      "grad_norm": 2.9103591442108154,
+      "learning_rate": 9.770491803278689e-06,
+      "loss": 0.20765865325927735,
+      "step": 150
+    },
+    {
+      "epoch": 0.28688524590163933,
+      "grad_norm": 5.441774845123291,
+      "learning_rate": 1.1409836065573771e-05,
+      "loss": 0.22107566833496095,
+      "step": 175
+    },
+    {
+      "epoch": 0.32786885245901637,
+      "grad_norm": 17.181110382080078,
+      "learning_rate": 1.3049180327868853e-05,
+      "loss": 0.22224016189575196,
+      "step": 200
+    },
+    {
+      "epoch": 0.36885245901639346,
+      "grad_norm": 5.543371677398682,
+      "learning_rate": 1.4688524590163935e-05,
+      "loss": 0.20201002120971678,
+      "step": 225
+    },
+    {
+      "epoch": 0.4098360655737705,
+      "grad_norm": 5.812751770019531,
+      "learning_rate": 1.6327868852459016e-05,
+      "loss": 0.2299608612060547,
+      "step": 250
+    },
+    {
+      "epoch": 0.45081967213114754,
+      "grad_norm": 2.845670461654663,
+      "learning_rate": 1.79672131147541e-05,
+      "loss": 0.21673511505126952,
+      "step": 275
+    },
+    {
+      "epoch": 0.4918032786885246,
+      "grad_norm": 18.98938751220703,
+      "learning_rate": 1.9606557377049183e-05,
+      "loss": 0.21523273468017579,
+      "step": 300
+    },
+    {
+      "epoch": 0.5327868852459017,
+      "grad_norm": 5.82402229309082,
+      "learning_rate": 1.9861566484517306e-05,
+      "loss": 0.15432929039001464,
+      "step": 325
+    },
+    {
+      "epoch": 0.5737704918032787,
+      "grad_norm": 0.48278993368148804,
+      "learning_rate": 1.9679417122040073e-05,
+      "loss": 0.16572830200195313,
+      "step": 350
+    },
+    {
+      "epoch": 0.6147540983606558,
+      "grad_norm": 5.946134567260742,
+      "learning_rate": 1.9497267759562843e-05,
+      "loss": 0.17543071746826172,
+      "step": 375
+    },
+    {
+      "epoch": 0.6557377049180327,
+      "grad_norm": 13.494661331176758,
+      "learning_rate": 1.9315118397085614e-05,
+      "loss": 0.15327459335327148,
+      "step": 400
+    },
+    {
+      "epoch": 0.6967213114754098,
+      "grad_norm": 9.058329582214355,
+      "learning_rate": 1.913296903460838e-05,
+      "loss": 0.19322505950927735,
+      "step": 425
+    },
+    {
+      "epoch": 0.7377049180327869,
+      "grad_norm": 9.420262336730957,
+      "learning_rate": 1.895081967213115e-05,
+      "loss": 0.18702877044677735,
+      "step": 450
+    },
+    {
+      "epoch": 0.7786885245901639,
+      "grad_norm": 0.29203546047210693,
+      "learning_rate": 1.8768670309653917e-05,
+      "loss": 0.13424430847167967,
+      "step": 475
+    },
+    {
+      "epoch": 0.819672131147541,
+      "grad_norm": 5.464226245880127,
+      "learning_rate": 1.8586520947176687e-05,
+      "loss": 0.1403522300720215,
+      "step": 500
+    },
+    {
+      "epoch": 0.860655737704918,
+      "grad_norm": 0.3305734395980835,
+      "learning_rate": 1.8404371584699454e-05,
+      "loss": 0.1768626403808594,
+      "step": 525
+    },
+    {
+      "epoch": 0.9016393442622951,
+      "grad_norm": 6.791965007781982,
+      "learning_rate": 1.8222222222222224e-05,
+      "loss": 0.22005313873291016,
+      "step": 550
+    },
+    {
+      "epoch": 0.9426229508196722,
+      "grad_norm": 3.971740484237671,
+      "learning_rate": 1.804007285974499e-05,
+      "loss": 0.17844413757324218,
+      "step": 575
+    },
+    {
+      "epoch": 0.9836065573770492,
+      "grad_norm": 1.6787421703338623,
+      "learning_rate": 1.785792349726776e-05,
+      "loss": 0.16104537963867188,
+      "step": 600
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9376199616122841,
+      "eval_f1": 0.6933962264150944,
+      "eval_loss": 0.17767289280891418,
+      "eval_precision": 0.6533333333333333,
+      "eval_recall": 0.7386934673366834,
+      "eval_roc_auc": 0.9544433040534235,
+      "eval_runtime": 8.7237,
+      "eval_samples_per_second": 238.89,
+      "eval_steps_per_second": 7.566,
+      "step": 610
+    },
+    {
+      "epoch": 1.0245901639344261,
+      "grad_norm": 5.573081016540527,
+      "learning_rate": 1.7675774134790528e-05,
+      "loss": 0.10441858291625977,
+      "step": 625
+    },
+    {
+      "epoch": 1.0655737704918034,
+      "grad_norm": 0.11036327481269836,
+      "learning_rate": 1.7493624772313298e-05,
+      "loss": 0.16641632080078125,
+      "step": 650
+    },
+    {
+      "epoch": 1.1065573770491803,
+      "grad_norm": 6.172032833099365,
+      "learning_rate": 1.731147540983607e-05,
+      "loss": 0.14472474098205568,
+      "step": 675
+    },
+    {
+      "epoch": 1.1475409836065573,
+      "grad_norm": 5.863953113555908,
+      "learning_rate": 1.7129326047358835e-05,
+      "loss": 0.1113892936706543,
+      "step": 700
+    },
+    {
+      "epoch": 1.1885245901639343,
+      "grad_norm": 0.25357893109321594,
+      "learning_rate": 1.6947176684881602e-05,
+      "loss": 0.12171897888183594,
+      "step": 725
+    },
+    {
+      "epoch": 1.2295081967213115,
+      "grad_norm": 4.559972763061523,
+      "learning_rate": 1.6765027322404372e-05,
+      "loss": 0.08190732002258301,
+      "step": 750
+    },
+    {
+      "epoch": 1.2704918032786885,
+      "grad_norm": 5.443191051483154,
+      "learning_rate": 1.6582877959927142e-05,
+      "loss": 0.06097976684570312,
+      "step": 775
+    },
+    {
+      "epoch": 1.3114754098360657,
+      "grad_norm": 7.672996997833252,
+      "learning_rate": 1.6400728597449912e-05,
+      "loss": 0.09989359855651855,
+      "step": 800
+    },
+    {
+      "epoch": 1.3524590163934427,
+      "grad_norm": 0.30564695596694946,
+      "learning_rate": 1.621857923497268e-05,
+      "loss": 0.08488804817199708,
+      "step": 825
+    },
+    {
+      "epoch": 1.3934426229508197,
+      "grad_norm": 0.5056689977645874,
+      "learning_rate": 1.6036429872495446e-05,
+      "loss": 0.15551289558410644,
+      "step": 850
+    },
+    {
+      "epoch": 1.4344262295081966,
+      "grad_norm": 0.06402106583118439,
+      "learning_rate": 1.5854280510018216e-05,
+      "loss": 0.1194021987915039,
+      "step": 875
+    },
+    {
+      "epoch": 1.4754098360655736,
+      "grad_norm": 0.8240995407104492,
+      "learning_rate": 1.5672131147540986e-05,
+      "loss": 0.11723342895507813,
+      "step": 900
+    },
+    {
+      "epoch": 1.5163934426229508,
+      "grad_norm": 0.07588805258274078,
+      "learning_rate": 1.5489981785063753e-05,
+      "loss": 0.12805092811584473,
+      "step": 925
+    },
+    {
+      "epoch": 1.5573770491803278,
+      "grad_norm": 29.323896408081055,
+      "learning_rate": 1.5307832422586523e-05,
+      "loss": 0.15534672737121583,
+      "step": 950
+    },
+    {
+      "epoch": 1.598360655737705,
+      "grad_norm": 11.02952766418457,
+      "learning_rate": 1.512568306010929e-05,
+      "loss": 0.1811429214477539,
+      "step": 975
+    },
+    {
+      "epoch": 1.639344262295082,
+      "grad_norm": 0.9738644957542419,
+      "learning_rate": 1.494353369763206e-05,
+      "loss": 0.1270007610321045,
+      "step": 1000
+    },
+    {
+      "epoch": 1.680327868852459,
+      "grad_norm": 2.311349630355835,
+      "learning_rate": 1.4761384335154829e-05,
+      "loss": 0.1843573570251465,
+      "step": 1025
+    },
+    {
+      "epoch": 1.721311475409836,
+      "grad_norm": 7.105762004852295,
+      "learning_rate": 1.4579234972677595e-05,
+      "loss": 0.15470240592956544,
+      "step": 1050
+    },
+    {
+      "epoch": 1.762295081967213,
+      "grad_norm": 9.120081901550293,
+      "learning_rate": 1.4397085610200366e-05,
+      "loss": 0.1170622444152832,
+      "step": 1075
+    },
+    {
+      "epoch": 1.8032786885245902,
+      "grad_norm": 0.09794076532125473,
+      "learning_rate": 1.4214936247723134e-05,
+      "loss": 0.14307721138000487,
+      "step": 1100
+    },
+    {
+      "epoch": 1.8442622950819674,
+      "grad_norm": 10.330300331115723,
+      "learning_rate": 1.4032786885245904e-05,
+      "loss": 0.15037315368652343,
+      "step": 1125
+    },
+    {
+      "epoch": 1.8852459016393444,
+      "grad_norm": 0.7867186069488525,
+      "learning_rate": 1.3850637522768671e-05,
+      "loss": 0.10941274642944336,
+      "step": 1150
+    },
+    {
+      "epoch": 1.9262295081967213,
+      "grad_norm": 7.952847003936768,
+      "learning_rate": 1.366848816029144e-05,
+      "loss": 0.1380799674987793,
+      "step": 1175
+    },
+    {
+      "epoch": 1.9672131147540983,
+      "grad_norm": 11.602045059204102,
+      "learning_rate": 1.348633879781421e-05,
+      "loss": 0.07221244812011719,
+      "step": 1200
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.935700575815739,
+      "eval_f1": 0.6854460093896714,
+      "eval_loss": 0.24323046207427979,
+      "eval_precision": 0.6431718061674009,
+      "eval_recall": 0.7336683417085427,
+      "eval_roc_auc": 0.9480599282886581,
+      "eval_runtime": 8.6243,
+      "eval_samples_per_second": 241.642,
+      "eval_steps_per_second": 7.653,
+      "step": 1220
+    },
+    {
+      "epoch": 2.0081967213114753,
+      "grad_norm": 4.202751636505127,
+      "learning_rate": 1.3304189435336978e-05,
+      "loss": 0.16997112274169923,
+      "step": 1225
+    },
+    {
+      "epoch": 2.0491803278688523,
+      "grad_norm": 0.40695664286613464,
+      "learning_rate": 1.3122040072859745e-05,
+      "loss": 0.0950162410736084,
+      "step": 1250
+    },
+    {
+      "epoch": 2.0901639344262297,
+      "grad_norm": 2.8617703914642334,
+      "learning_rate": 1.2939890710382515e-05,
+      "loss": 0.10194917678833008,
+      "step": 1275
+    },
+    {
+      "epoch": 2.1311475409836067,
+      "grad_norm": 0.08977202326059341,
+      "learning_rate": 1.2757741347905283e-05,
+      "loss": 0.0662102746963501,
+      "step": 1300
+    },
+    {
+      "epoch": 2.1721311475409837,
+      "grad_norm": 0.10930905491113663,
+      "learning_rate": 1.2575591985428054e-05,
+      "loss": 0.07460547924041748,
+      "step": 1325
+    },
+    {
+      "epoch": 2.2131147540983607,
+      "grad_norm": 11.703680038452148,
+      "learning_rate": 1.239344262295082e-05,
+      "loss": 0.11810153961181641,
+      "step": 1350
+    },
+    {
+      "epoch": 2.2540983606557377,
+      "grad_norm": 3.0462427139282227,
+      "learning_rate": 1.2211293260473589e-05,
+      "loss": 0.11896968841552734,
+      "step": 1375
+    },
+    {
+      "epoch": 2.2950819672131146,
+      "grad_norm": 11.854302406311035,
+      "learning_rate": 1.2029143897996359e-05,
+      "loss": 0.10016871452331542,
+      "step": 1400
+    },
+    {
+      "epoch": 2.3360655737704916,
+      "grad_norm": 5.737449645996094,
+      "learning_rate": 1.1846994535519127e-05,
+      "loss": 0.12308047294616699,
+      "step": 1425
+    },
+    {
+      "epoch": 2.3770491803278686,
+      "grad_norm": 3.3703978061676025,
+      "learning_rate": 1.1664845173041894e-05,
+      "loss": 0.10508214950561523,
+      "step": 1450
+    },
+    {
+      "epoch": 2.418032786885246,
+      "grad_norm": 15.429414749145508,
+      "learning_rate": 1.1482695810564664e-05,
+      "loss": 0.05040365219116211,
+      "step": 1475
+    },
+    {
+      "epoch": 2.459016393442623,
+      "grad_norm": 14.725594520568848,
+      "learning_rate": 1.1300546448087433e-05,
+      "loss": 0.13564690589904785,
+      "step": 1500
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 0.18430812656879425,
+      "learning_rate": 1.1118397085610201e-05,
+      "loss": 0.08556642532348632,
+      "step": 1525
+    },
+    {
+      "epoch": 2.540983606557377,
+      "grad_norm": 0.062474410980939865,
+      "learning_rate": 1.0936247723132968e-05,
+      "loss": 0.08463016510009766,
+      "step": 1550
+    },
+    {
+      "epoch": 2.581967213114754,
+      "grad_norm": 0.20876172184944153,
+      "learning_rate": 1.0754098360655738e-05,
+      "loss": 0.1799280548095703,
+      "step": 1575
+    },
+    {
+      "epoch": 2.6229508196721314,
+      "grad_norm": 6.137902736663818,
+      "learning_rate": 1.0571948998178507e-05,
+      "loss": 0.12623875617980956,
+      "step": 1600
+    },
+    {
+      "epoch": 2.663934426229508,
+      "grad_norm": 17.05773162841797,
+      "learning_rate": 1.0389799635701277e-05,
+      "loss": 0.09255536079406738,
+      "step": 1625
+    },
+    {
+      "epoch": 2.7049180327868854,
+      "grad_norm": 1.2578394412994385,
+      "learning_rate": 1.0207650273224044e-05,
+      "loss": 0.0888406753540039,
+      "step": 1650
+    },
+    {
+      "epoch": 2.7459016393442623,
+      "grad_norm": 15.845796585083008,
+      "learning_rate": 1.0025500910746812e-05,
+      "loss": 0.10764387130737305,
+      "step": 1675
+    },
+    {
+      "epoch": 2.7868852459016393,
+      "grad_norm": 12.588105201721191,
+      "learning_rate": 9.843351548269582e-06,
+      "loss": 0.12151247024536133,
+      "step": 1700
+    },
+    {
+      "epoch": 2.8278688524590163,
+      "grad_norm": 7.840113162994385,
+      "learning_rate": 9.66120218579235e-06,
+      "loss": 0.1787535858154297,
+      "step": 1725
+    },
+    {
+      "epoch": 2.8688524590163933,
+      "grad_norm": 5.082641124725342,
+      "learning_rate": 9.47905282331512e-06,
+      "loss": 0.07576138019561768,
+      "step": 1750
+    },
+    {
+      "epoch": 2.9098360655737707,
+      "grad_norm": 14.185094833374023,
+      "learning_rate": 9.296903460837888e-06,
+      "loss": 0.1186930274963379,
+      "step": 1775
+    },
+    {
+      "epoch": 2.9508196721311473,
+      "grad_norm": 31.60809898376465,
+      "learning_rate": 9.114754098360656e-06,
+      "loss": 0.10553586959838868,
+      "step": 1800
+    },
+    {
+      "epoch": 2.9918032786885247,
+      "grad_norm": 2.9622690677642822,
+      "learning_rate": 8.932604735883426e-06,
+      "loss": 0.054716997146606446,
+      "step": 1825
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9414587332053743,
+      "eval_f1": 0.6903553299492385,
+      "eval_loss": 0.24261149764060974,
+      "eval_precision": 0.6974358974358974,
+      "eval_recall": 0.6834170854271356,
+      "eval_roc_auc": 0.9521560054916492,
+      "eval_runtime": 8.6527,
+      "eval_samples_per_second": 240.849,
+      "eval_steps_per_second": 7.628,
+      "step": 1830
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 3050,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 2
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3849183184389120.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

transformer/checkpoint-1830/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26170ff2d75562c83f88182ac9301ad3566752c384b38d15219d8c3352efbebb
+size 5201

transformer/checkpoint-610/config.json CHANGED Viewed

@@ -32,7 +32,7 @@
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
-  "transformers_version": "5.9.0",
   "type_vocab_size": 1,
   "use_cache": false,
   "vocab_size": 250002

   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
+  "transformers_version": "5.10.2",
   "type_vocab_size": 1,
   "use_cache": false,
   "vocab_size": 250002

transformer/checkpoint-610/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8c2e8002a8b39d6b2b729d256b3d4cff3d522204ecb453b2bd5c433f9bd4944f
 size 1112205008

 version https://git-lfs.github.com/spec/v1
+oid sha256:150736722d2137e368c215a6ded5ca83348b547235eed16e8939af8b89077765
 size 1112205008

transformer/checkpoint-610/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:36fd23804b528193a6fc5999a821ef8809fb31a6efd5c61fe763007795ad7dff
 size 2224532875

 version https://git-lfs.github.com/spec/v1
+oid sha256:0e116ee1524d3a0af2639c7796fdc33da882323ef9133d8950b493efc3fdc234
 size 2224532875

transformer/checkpoint-610/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fafd9c24dc9711309db2e4113a63ff7120e22ca104346dfb40523f00ae210f76
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:f79ebe41a952d58a414acbb1200490974edd9f70a35228ee802fd1f53139fa66
 size 14645

transformer/checkpoint-610/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50d9d499a5525a1f496c3b9a272dbba833f43becb5d780497724ade85d68372c
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:88e49d8c13a6eacfd8373ea54c57924180b7dfff65f37e60feb7ea51f503d158
 size 1383

transformer/checkpoint-610/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d364349216cf58d042027a258508346e7afb967d9966c7e61a3b5de011c04767
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:3342a44ed126fda993f7f2d332ee7ff352916f58e467cf3c50397c3413bfcc8a
 size 1465

transformer/checkpoint-610/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-  "best_global_step": 305,
-  "best_metric": 0.7721518987341772,
-  "best_model_checkpoint": "/content/agri-utilization-classifier/transformer/checkpoint-305",
-  "epoch": 2.0,
   "eval_steps": 500,
   "global_step": 610,
   "is_hyper_param_search": false,
@@ -10,202 +10,189 @@
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.08196721311475409,
-      "grad_norm": 6.055062770843506,
-      "learning_rate": 3.157894736842105e-06,
-      "loss": 0.62972900390625,
       "step": 25
     },
     {
-      "epoch": 0.16393442622950818,
-      "grad_norm": 10.6914701461792,
-      "learning_rate": 6.447368421052632e-06,
-      "loss": 0.44850738525390627,
       "step": 50
     },
     {
-      "epoch": 0.2459016393442623,
-      "grad_norm": 6.670228481292725,
-      "learning_rate": 9.736842105263159e-06,
-      "loss": 0.3566379165649414,
       "step": 75
     },
     {
-      "epoch": 0.32786885245901637,
-      "grad_norm": 2.589911937713623,
-      "learning_rate": 1.3026315789473684e-05,
-      "loss": 0.2718839645385742,
       "step": 100
     },
     {
-      "epoch": 0.4098360655737705,
-      "grad_norm": 22.02676773071289,
-      "learning_rate": 1.6315789473684213e-05,
-      "loss": 0.1922766876220703,
       "step": 125
     },
     {
-      "epoch": 0.4918032786885246,
-      "grad_norm": 2.6362855434417725,
-      "learning_rate": 1.960526315789474e-05,
-      "loss": 0.1837622833251953,
       "step": 150
     },
     {
-      "epoch": 0.5737704918032787,
-      "grad_norm": 3.478484630584717,
-      "learning_rate": 1.9679533867443555e-05,
-      "loss": 0.18766048431396484,
       "step": 175
     },
     {
-      "epoch": 0.6557377049180327,
-      "grad_norm": 8.077605247497559,
-      "learning_rate": 1.9315367807720323e-05,
-      "loss": 0.23830581665039063,
       "step": 200
     },
     {
-      "epoch": 0.7377049180327869,
-      "grad_norm": 0.7427046298980713,
-      "learning_rate": 1.8951201747997088e-05,
-      "loss": 0.30742517471313474,
       "step": 225
     },
     {
-      "epoch": 0.819672131147541,
-      "grad_norm": 36.34975051879883,
-      "learning_rate": 1.8587035688273852e-05,
-      "loss": 0.22336017608642578,
       "step": 250
     },
     {
-      "epoch": 0.9016393442622951,
-      "grad_norm": 5.215510845184326,
-      "learning_rate": 1.822286962855062e-05,
-      "loss": 0.13779294967651368,
       "step": 275
     },
     {
-      "epoch": 0.9836065573770492,
-      "grad_norm": 3.551121950149536,
-      "learning_rate": 1.7858703568827385e-05,
-      "loss": 0.19200111389160157,
       "step": 300
     },
     {
-      "epoch": 1.0,
-      "eval_accuracy": 0.9631901840490797,
-      "eval_f1": 0.7721518987341772,
-      "eval_loss": 0.1292734444141388,
-      "eval_precision": 0.7721518987341772,
-      "eval_recall": 0.7721518987341772,
-      "eval_roc_auc": 0.9563720589684741,
-      "eval_runtime": 3.3396,
-      "eval_samples_per_second": 292.853,
-      "eval_steps_per_second": 9.283,
-      "step": 305
-    },
-    {
-      "epoch": 1.0655737704918034,
-      "grad_norm": 0.5402449369430542,
-      "learning_rate": 1.7494537509104153e-05,
-      "loss": 0.1241053295135498,
       "step": 325
     },
     {
-      "epoch": 1.1475409836065573,
-      "grad_norm": 4.476892948150635,
-      "learning_rate": 1.7130371449380918e-05,
-      "loss": 0.20724605560302733,
       "step": 350
     },
     {
-      "epoch": 1.2295081967213115,
-      "grad_norm": 0.46729782223701477,
-      "learning_rate": 1.6766205389657686e-05,
-      "loss": 0.13567353248596192,
       "step": 375
     },
     {
-      "epoch": 1.3114754098360657,
-      "grad_norm": 0.1852118819952011,
-      "learning_rate": 1.640203932993445e-05,
-      "loss": 0.13295170783996582,
       "step": 400
     },
     {
-      "epoch": 1.3934426229508197,
-      "grad_norm": 1.2681413888931274,
-      "learning_rate": 1.603787327021122e-05,
-      "loss": 0.2027936363220215,
       "step": 425
     },
     {
-      "epoch": 1.4754098360655736,
-      "grad_norm": 7.484091281890869,
-      "learning_rate": 1.5673707210487983e-05,
-      "loss": 0.12364128112792969,
       "step": 450
     },
     {
-      "epoch": 1.5573770491803278,
-      "grad_norm": 0.46489500999450684,
-      "learning_rate": 1.530954115076475e-05,
-      "loss": 0.14407362937927246,
       "step": 475
     },
     {
-      "epoch": 1.639344262295082,
-      "grad_norm": 0.20967872440814972,
-      "learning_rate": 1.4945375091041516e-05,
-      "loss": 0.12458925247192383,
       "step": 500
     },
     {
-      "epoch": 1.721311475409836,
-      "grad_norm": 0.1643747240304947,
-      "learning_rate": 1.4581209031318282e-05,
-      "loss": 0.21631996154785157,
       "step": 525
     },
     {
-      "epoch": 1.8032786885245902,
-      "grad_norm": 7.073329448699951,
-      "learning_rate": 1.4217042971595047e-05,
-      "loss": 0.16043865203857421,
       "step": 550
     },
     {
-      "epoch": 1.8852459016393444,
-      "grad_norm": 1.744958758354187,
-      "learning_rate": 1.3852876911871815e-05,
-      "loss": 0.0966644287109375,
       "step": 575
     },
     {
-      "epoch": 1.9672131147540983,
-      "grad_norm": 12.79035472869873,
-      "learning_rate": 1.3488710852148582e-05,
-      "loss": 0.15884541511535644,
       "step": 600
     },
     {
-      "epoch": 2.0,
-      "eval_accuracy": 0.9611451942740287,
-      "eval_f1": 0.7432432432432432,
-      "eval_loss": 0.13287827372550964,
-      "eval_precision": 0.7971014492753623,
-      "eval_recall": 0.6962025316455697,
-      "eval_roc_auc": 0.9594697343039381,
-      "eval_runtime": 3.2739,
-      "eval_samples_per_second": 298.727,
-      "eval_steps_per_second": 9.469,
       "step": 610
     }
   ],
   "logging_steps": 25,
-  "max_steps": 1525,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 5,
   "save_steps": 500,
@@ -216,7 +203,7 @@
         "early_stopping_threshold": 0.0
       },
       "attributes": {
-        "early_stopping_patience_counter": 1
       }
     },
     "TrainerControl": {
@@ -230,7 +217,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1283192616990720.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
+  "best_global_step": 610,
+  "best_metric": 0.6933962264150944,
+  "best_model_checkpoint": "/content/agri-utilization-classifier/transformer/checkpoint-610",
+  "epoch": 1.0,
   "eval_steps": 500,
   "global_step": 610,
   "is_hyper_param_search": false,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.040983606557377046,
+      "grad_norm": 3.1041932106018066,
+      "learning_rate": 1.573770491803279e-06,
+      "loss": 0.526744384765625,
       "step": 25
     },
     {
+      "epoch": 0.08196721311475409,
+      "grad_norm": 4.816498279571533,
+      "learning_rate": 3.213114754098361e-06,
+      "loss": 0.46380462646484377,
       "step": 50
     },
     {
+      "epoch": 0.12295081967213115,
+      "grad_norm": 5.105863571166992,
+      "learning_rate": 4.8524590163934435e-06,
+      "loss": 0.3628129577636719,
       "step": 75
     },
     {
+      "epoch": 0.16393442622950818,
+      "grad_norm": 3.479628324508667,
+      "learning_rate": 6.491803278688526e-06,
+      "loss": 0.3321057891845703,
       "step": 100
     },
     {
+      "epoch": 0.20491803278688525,
+      "grad_norm": 5.271286487579346,
+      "learning_rate": 8.131147540983607e-06,
+      "loss": 0.29200584411621094,
       "step": 125
     },
     {
+      "epoch": 0.2459016393442623,
+      "grad_norm": 2.9103591442108154,
+      "learning_rate": 9.770491803278689e-06,
+      "loss": 0.20765865325927735,
       "step": 150
     },
     {
+      "epoch": 0.28688524590163933,
+      "grad_norm": 5.441774845123291,
+      "learning_rate": 1.1409836065573771e-05,
+      "loss": 0.22107566833496095,
       "step": 175
     },
     {
+      "epoch": 0.32786885245901637,
+      "grad_norm": 17.181110382080078,
+      "learning_rate": 1.3049180327868853e-05,
+      "loss": 0.22224016189575196,
       "step": 200
     },
     {
+      "epoch": 0.36885245901639346,
+      "grad_norm": 5.543371677398682,
+      "learning_rate": 1.4688524590163935e-05,
+      "loss": 0.20201002120971678,
       "step": 225
     },
     {
+      "epoch": 0.4098360655737705,
+      "grad_norm": 5.812751770019531,
+      "learning_rate": 1.6327868852459016e-05,
+      "loss": 0.2299608612060547,
       "step": 250
     },
     {
+      "epoch": 0.45081967213114754,
+      "grad_norm": 2.845670461654663,
+      "learning_rate": 1.79672131147541e-05,
+      "loss": 0.21673511505126952,
       "step": 275
     },
     {
+      "epoch": 0.4918032786885246,
+      "grad_norm": 18.98938751220703,
+      "learning_rate": 1.9606557377049183e-05,
+      "loss": 0.21523273468017579,
       "step": 300
     },
     {
+      "epoch": 0.5327868852459017,
+      "grad_norm": 5.82402229309082,
+      "learning_rate": 1.9861566484517306e-05,
+      "loss": 0.15432929039001464,
       "step": 325
     },
     {
+      "epoch": 0.5737704918032787,
+      "grad_norm": 0.48278993368148804,
+      "learning_rate": 1.9679417122040073e-05,
+      "loss": 0.16572830200195313,
       "step": 350
     },
     {
+      "epoch": 0.6147540983606558,
+      "grad_norm": 5.946134567260742,
+      "learning_rate": 1.9497267759562843e-05,
+      "loss": 0.17543071746826172,
       "step": 375
     },
     {
+      "epoch": 0.6557377049180327,
+      "grad_norm": 13.494661331176758,
+      "learning_rate": 1.9315118397085614e-05,
+      "loss": 0.15327459335327148,
       "step": 400
     },
     {
+      "epoch": 0.6967213114754098,
+      "grad_norm": 9.058329582214355,
+      "learning_rate": 1.913296903460838e-05,
+      "loss": 0.19322505950927735,
       "step": 425
     },
     {
+      "epoch": 0.7377049180327869,
+      "grad_norm": 9.420262336730957,
+      "learning_rate": 1.895081967213115e-05,
+      "loss": 0.18702877044677735,
       "step": 450
     },
     {
+      "epoch": 0.7786885245901639,
+      "grad_norm": 0.29203546047210693,
+      "learning_rate": 1.8768670309653917e-05,
+      "loss": 0.13424430847167967,
       "step": 475
     },
     {
+      "epoch": 0.819672131147541,
+      "grad_norm": 5.464226245880127,
+      "learning_rate": 1.8586520947176687e-05,
+      "loss": 0.1403522300720215,
       "step": 500
     },
     {
+      "epoch": 0.860655737704918,
+      "grad_norm": 0.3305734395980835,
+      "learning_rate": 1.8404371584699454e-05,
+      "loss": 0.1768626403808594,
       "step": 525
     },
     {
+      "epoch": 0.9016393442622951,
+      "grad_norm": 6.791965007781982,
+      "learning_rate": 1.8222222222222224e-05,
+      "loss": 0.22005313873291016,
       "step": 550
     },
     {
+      "epoch": 0.9426229508196722,
+      "grad_norm": 3.971740484237671,
+      "learning_rate": 1.804007285974499e-05,
+      "loss": 0.17844413757324218,
       "step": 575
     },
     {
+      "epoch": 0.9836065573770492,
+      "grad_norm": 1.6787421703338623,
+      "learning_rate": 1.785792349726776e-05,
+      "loss": 0.16104537963867188,
       "step": 600
     },
     {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9376199616122841,
+      "eval_f1": 0.6933962264150944,
+      "eval_loss": 0.17767289280891418,
+      "eval_precision": 0.6533333333333333,
+      "eval_recall": 0.7386934673366834,
+      "eval_roc_auc": 0.9544433040534235,
+      "eval_runtime": 8.7237,
+      "eval_samples_per_second": 238.89,
+      "eval_steps_per_second": 7.566,
       "step": 610
     }
   ],
   "logging_steps": 25,
+  "max_steps": 3050,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 5,
   "save_steps": 500,
         "early_stopping_threshold": 0.0
       },
       "attributes": {
+        "early_stopping_patience_counter": 0
       }
     },
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 1283061061463040.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

transformer/checkpoint-610/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c60366894b25ead0379e8d97e61f1123e1ad4786f5e41a8bc70f2d7bc8901f5
-size 5329

 version https://git-lfs.github.com/spec/v1
+oid sha256:26170ff2d75562c83f88182ac9301ad3566752c384b38d15219d8c3352efbebb
+size 5201

transformer/config.json CHANGED Viewed

@@ -31,16 +31,16 @@
   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
-  "threshold": 0.4710787534713745,
   "tie_word_embeddings": true,
-  "transformers_version": "5.9.0",
   "type_vocab_size": 1,
   "use_cache": false,
   "validation_threshold_report": {
-    "f1": 0.829268292682927,
-    "precision": 0.8,
-    "recall": 0.8607594936708861,
-    "threshold": 0.4710787534713745
   },
   "vocab_size": 250002
 }

   "pad_token_id": 1,
   "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
+  "threshold": 0.5436205267906189,
   "tie_word_embeddings": true,
+  "transformers_version": "5.10.2",
   "type_vocab_size": 1,
   "use_cache": false,
   "validation_threshold_report": {
+    "f1": 0.6983372921615203,
+    "precision": 0.6621621621621622,
+    "recall": 0.7386934673366834,
+    "threshold": 0.5436205267906189
   },
   "vocab_size": 250002
 }

transformer/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:49a18c813f49f0f53eef5e1646a8e80f88eb366c956b09301312f1a23e9fe977
 size 1112205008

 version https://git-lfs.github.com/spec/v1
+oid sha256:150736722d2137e368c215a6ded5ca83348b547235eed16e8939af8b89077765
 size 1112205008

transformer/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

transformer/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c60366894b25ead0379e8d97e61f1123e1ad4786f5e41a8bc70f2d7bc8901f5
-size 5329

 version https://git-lfs.github.com/spec/v1
+oid sha256:26170ff2d75562c83f88182ac9301ad3566752c384b38d15219d8c3352efbebb
+size 5201

transformer/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff