lgsilvaesilva committed on May 29

Commit

57dcd10

verified ·

1 Parent(s): b813f7b

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because the commit contains too many changes. See the raw diff for the complete change set.

Files changed (50) hide show

.gitattributes +6 -0
README.md +86 -47
REPORT.md +54 -34
baselines/embedding-lightgbm/embedding-lightgbm.joblib +2 -2
baselines/embedding-lightgbm/test_predictions.csv +0 -0
baselines/embedding-lightgbm/validation_predictions.csv +0 -0
baselines/embedding-logistic/embedding-logistic.joblib +2 -2
baselines/embedding-logistic/test_predictions.csv +0 -0
baselines/embedding-logistic/validation_predictions.csv +0 -0
baselines/embedding-svm/embedding-svm.joblib +2 -2
baselines/embedding-svm/test_predictions.csv +0 -0
baselines/embedding-svm/validation_predictions.csv +0 -0
report.json +759 -206
transformer/checkpoint-1135/config.json +39 -0
transformer/checkpoint-1135/model.safetensors +3 -0
transformer/checkpoint-1135/optimizer.pt +3 -0
transformer/checkpoint-1135/rng_state.pth +3 -0
transformer/checkpoint-1135/scaler.pt +3 -0
transformer/checkpoint-1135/scheduler.pt +3 -0
transformer/checkpoint-1135/tokenizer.json +3 -0
transformer/checkpoint-1135/tokenizer_config.json +15 -0
transformer/checkpoint-1135/trainer_state.json +423 -0
transformer/checkpoint-1135/training_args.bin +3 -0
transformer/checkpoint-227/config.json +21 -19
transformer/checkpoint-227/model.safetensors +2 -2
transformer/checkpoint-227/optimizer.pt +2 -2
transformer/checkpoint-227/rng_state.pth +1 -1
transformer/checkpoint-227/scaler.pt +1 -1
transformer/checkpoint-227/tokenizer.json +0 -0
transformer/checkpoint-227/tokenizer_config.json +9 -9
transformer/checkpoint-227/trainer_state.json +29 -29
transformer/checkpoint-454/config.json +21 -19
transformer/checkpoint-454/model.safetensors +2 -2
transformer/checkpoint-454/optimizer.pt +2 -2
transformer/checkpoint-454/rng_state.pth +1 -1
transformer/checkpoint-454/scaler.pt +1 -1
transformer/checkpoint-454/tokenizer.json +0 -0
transformer/checkpoint-454/tokenizer_config.json +9 -9
transformer/checkpoint-454/trainer_state.json +56 -56
transformer/checkpoint-681/config.json +21 -19
transformer/checkpoint-681/model.safetensors +2 -2
transformer/checkpoint-681/optimizer.pt +2 -2
transformer/checkpoint-681/rng_state.pth +1 -1
transformer/checkpoint-681/scaler.pt +1 -1
transformer/checkpoint-681/tokenizer.json +0 -0
transformer/checkpoint-681/tokenizer_config.json +9 -9
transformer/checkpoint-681/trainer_state.json +86 -86
transformer/checkpoint-908/config.json +21 -19
transformer/checkpoint-908/model.safetensors +2 -2
transformer/checkpoint-908/optimizer.pt +2 -2

.gitattributes CHANGED Viewed

@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+transformer/checkpoint-1135/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+transformer/checkpoint-227/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+transformer/checkpoint-454/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+transformer/checkpoint-681/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+transformer/checkpoint-908/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+transformer/tokenizer.json filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 library_name: transformers
 pipeline_tag: text-classification
-base_model: distilbert/distilbert-base-multilingual-cased
 tags:
 - text-classification
 - binary-classification
@@ -17,10 +17,11 @@ It includes the Transformer model, any configured TF-IDF or sentence-embedding b
 - Dataset: `faodl/amis-agri-wheat`
 - Dataset subset: ``
 - Text column: `chunk_text`
 - Label column: `label`
-- Transformer: `distilbert/distilbert-base-multilingual-cased`
-- Generated at: `2026-05-19T20:24:29.088047+00:00`
 ## Dataset Summary
@@ -30,6 +31,25 @@ It includes the Transformer model, any configured TF-IDF or sentence-embedding b
 | validation | 759 | 486 | 273 | 396 | 636.7 |
 | test | 762 | 470 | 292 | 397 | 643.3 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
@@ -38,14 +58,14 @@ It includes the Transformer model, any configured TF-IDF or sentence-embedding b
 | logistic_tfidf | 0.470 | 0.797 | 0.688 | 0.860 | 0.764 | 0.888 | 0.827 |
 | xgboost_tfidf | 0.500 | 0.835 | 0.773 | 0.805 | 0.789 | 0.910 | 0.831 |
 | xgboost_tfidf | 0.520 | 0.835 | 0.777 | 0.798 | 0.787 | 0.910 | 0.831 |
-| embedding-logistic_sentence_embeddings | 0.500 | 0.795 | 0.711 | 0.784 | 0.746 | 0.880 | 0.825 |
-| embedding-logistic_sentence_embeddings | 0.564 | 0.799 | 0.746 | 0.723 | 0.734 | 0.880 | 0.825 |
-| embedding-svm_sentence_embeddings | 0.500 | 0.811 | 0.794 | 0.685 | 0.735 | 0.884 | 0.828 |
-| embedding-svm_sentence_embeddings | 0.406 | 0.801 | 0.716 | 0.795 | 0.753 | 0.884 | 0.828 |
-| embedding-lightgbm_sentence_embeddings | 0.500 | 0.807 | 0.756 | 0.733 | 0.744 | 0.888 | 0.823 |
-| embedding-lightgbm_sentence_embeddings | 0.540 | 0.806 | 0.761 | 0.719 | 0.739 | 0.888 | 0.823 |
-| transformer | 0.500 | 0.881 | 0.823 | 0.877 | 0.849 | 0.944 | 0.905 |
-| transformer | 0.581 | 0.881 | 0.830 | 0.866 | 0.848 | 0.944 | 0.905 |
 ## Confusion Matrices on Test Split
@@ -83,67 +103,67 @@ Rows are true labels and columns are predicted labels.
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 377 | 93 |
-| RELEVANT | 63 | 229 |
-### embedding-logistic_sentence_embeddings at threshold 0.564
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 398 | 72 |
-| RELEVANT | 81 | 211 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 418 | 52 |
-| RELEVANT | 92 | 200 |
-### embedding-svm_sentence_embeddings at threshold 0.406
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 378 | 92 |
-| RELEVANT | 60 | 232 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 401 | 69 |
-| RELEVANT | 78 | 214 |
-### embedding-lightgbm_sentence_embeddings at threshold 0.540
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 404 | 66 |
-| RELEVANT | 82 | 210 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 415 | 55 |
-| RELEVANT | 36 | 256 |
-### transformer at threshold 0.581
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 418 | 52 |
-| RELEVANT | 39 | 253 |
 ## Validation-Tuned Thresholds
 - `logistic_tfidf`: threshold `0.470` (validation F1 `0.779`); test F1 change vs 0.5: `+0.005`.
 - `xgboost_tfidf`: threshold `0.520` (validation F1 `0.822`); test F1 change vs 0.5: `-0.001`.
-- `embedding-logistic_sentence_embeddings`: threshold `0.564` (validation F1 `0.730`); test F1 change vs 0.5: `-0.012`.
-- `embedding-svm_sentence_embeddings`: threshold `0.406` (validation F1 `0.734`); test F1 change vs 0.5: `+0.018`.
-- `embedding-lightgbm_sentence_embeddings`: threshold `0.540` (validation F1 `0.748`); test F1 change vs 0.5: `-0.005`.
-- `transformer`: threshold `0.581` (validation F1 `0.878`); test F1 change vs 0.5: `-0.002`.
 ## Artifacts
@@ -159,7 +179,7 @@ Rows are true labels and columns are predicted labels.
 Install the runtime dependencies:
 ```bash
-pip install transformers torch huggingface_hub pandas joblib scikit-learn xgboost sentence-transformers lightgbm
 ```
 ### Transformer
@@ -168,7 +188,7 @@ pip install transformers torch huggingface_hub pandas joblib scikit-learn xgboos
 import torch
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
-MODEL_ID = "faodl/agri-wheat-classifier"
 texts = [
     "Rice export prices increased after new procurement rules were announced.",
@@ -205,7 +225,7 @@ import json
 import joblib
 from huggingface_hub import hf_hub_download
-MODEL_ID = "faodl/agri-wheat-classifier"
 BASELINE = "logistic"
 texts = [
@@ -246,10 +266,11 @@ Available embedding baseline names in this run: "embedding-logistic", "embedding
 ```python
 import joblib
 from huggingface_hub import hf_hub_download
-from sentence_transformers import SentenceTransformer
-MODEL_ID = "faodl/agri-wheat-classifier"
 BASELINE = "embedding-logistic"
 texts = [
@@ -263,13 +284,31 @@ model_path = hf_hub_download(
     filename=f"baselines/{BASELINE}/{BASELINE}.joblib",
 )
 artifact = joblib.load(model_path)
-embedding_model = SentenceTransformer(artifact["embedding_model_name"])
-embeddings = embedding_model.encode(
-    texts,
-    batch_size=artifact.get("embedding_batch_size", 64),
-    convert_to_numpy=True,
-    normalize_embeddings=artifact.get("normalize_embeddings", True),
-)
 probabilities = artifact["classifier"].predict_proba(embeddings)[:, 1]
 threshold = artifact["validation_best_threshold"]["threshold"]

 ---
 library_name: transformers
 pipeline_tag: text-classification
+base_model: FacebookAI/xlm-roberta-base
 tags:
 - text-classification
 - binary-classification
 - Dataset: `faodl/amis-agri-wheat`
 - Dataset subset: ``
+- Dataset revision: `main`
 - Text column: `chunk_text`
 - Label column: `label`
+- Transformer: `FacebookAI/xlm-roberta-base`
+- Generated at: `2026-05-29T18:13:08.384805+00:00`
 ## Dataset Summary
 | validation | 759 | 486 | 273 | 396 | 636.7 |
 | test | 762 | 470 | 292 | 397 | 643.3 |
+## Threshold Comparison on Validation Split
+Validation metrics document threshold selection and tuning behavior; test metrics remain the primary estimate of out-of-sample performance.
+| Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
+| --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
+| logistic_tfidf | 0.500 | 0.818 | 0.718 | 0.813 | 0.763 | 0.907 | 0.867 |
+| logistic_tfidf | 0.470 | 0.823 | 0.709 | 0.864 | 0.779 | 0.907 | 0.867 |
+| xgboost_tfidf | 0.500 | 0.868 | 0.808 | 0.832 | 0.819 | 0.935 | 0.892 |
+| xgboost_tfidf | 0.520 | 0.871 | 0.816 | 0.828 | 0.822 | 0.935 | 0.892 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.783 | 0.658 | 0.824 | 0.732 | 0.862 | 0.780 |
+| embedding-logistic_sentence_embeddings | 0.521 | 0.791 | 0.673 | 0.813 | 0.736 | 0.862 | 0.780 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.804 | 0.714 | 0.758 | 0.735 | 0.869 | 0.792 |
+| embedding-svm_sentence_embeddings | 0.473 | 0.805 | 0.704 | 0.791 | 0.745 | 0.869 | 0.792 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.791 | 0.694 | 0.747 | 0.720 | 0.868 | 0.786 |
+| embedding-lightgbm_sentence_embeddings | 0.433 | 0.800 | 0.693 | 0.795 | 0.741 | 0.868 | 0.786 |
+| transformer | 0.500 | 0.925 | 0.894 | 0.897 | 0.896 | 0.956 | 0.914 |
+| transformer | 0.203 | 0.926 | 0.883 | 0.916 | 0.899 | 0.956 | 0.914 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | logistic_tfidf | 0.470 | 0.797 | 0.688 | 0.860 | 0.764 | 0.888 | 0.827 |
 | xgboost_tfidf | 0.500 | 0.835 | 0.773 | 0.805 | 0.789 | 0.910 | 0.831 |
 | xgboost_tfidf | 0.520 | 0.835 | 0.777 | 0.798 | 0.787 | 0.910 | 0.831 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.782 | 0.699 | 0.757 | 0.727 | 0.877 | 0.821 |
+| embedding-logistic_sentence_embeddings | 0.521 | 0.789 | 0.713 | 0.750 | 0.731 | 0.877 | 0.821 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.818 | 0.778 | 0.733 | 0.755 | 0.883 | 0.824 |
+| embedding-svm_sentence_embeddings | 0.473 | 0.812 | 0.758 | 0.750 | 0.754 | 0.883 | 0.824 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.798 | 0.740 | 0.729 | 0.734 | 0.892 | 0.847 |
+| embedding-lightgbm_sentence_embeddings | 0.433 | 0.806 | 0.735 | 0.771 | 0.753 | 0.892 | 0.847 |
+| transformer | 0.500 | 0.885 | 0.862 | 0.832 | 0.847 | 0.943 | 0.915 |
+| transformer | 0.203 | 0.890 | 0.854 | 0.860 | 0.857 | 0.943 | 0.915 |
 ## Confusion Matrices on Test Split
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 375 | 95 |
+| RELEVANT | 71 | 221 |
+### embedding-logistic_sentence_embeddings at threshold 0.521
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 382 | 88 |
+| RELEVANT | 73 | 219 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 409 | 61 |
+| RELEVANT | 78 | 214 |
+### embedding-svm_sentence_embeddings at threshold 0.473
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 400 | 70 |
+| RELEVANT | 73 | 219 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 395 | 75 |
+| RELEVANT | 79 | 213 |
+### embedding-lightgbm_sentence_embeddings at threshold 0.433
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 389 | 81 |
+| RELEVANT | 67 | 225 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 431 | 39 |
+| RELEVANT | 49 | 243 |
+### transformer at threshold 0.203
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 427 | 43 |
+| RELEVANT | 41 | 251 |
 ## Validation-Tuned Thresholds
 - `logistic_tfidf`: threshold `0.470` (validation F1 `0.779`); test F1 change vs 0.5: `+0.005`.
 - `xgboost_tfidf`: threshold `0.520` (validation F1 `0.822`); test F1 change vs 0.5: `-0.001`.
+- `embedding-logistic_sentence_embeddings`: threshold `0.521` (validation F1 `0.736`); test F1 change vs 0.5: `+0.004`.
+- `embedding-svm_sentence_embeddings`: threshold `0.473` (validation F1 `0.745`); test F1 change vs 0.5: `-0.001`.
+- `embedding-lightgbm_sentence_embeddings`: threshold `0.433` (validation F1 `0.741`); test F1 change vs 0.5: `+0.018`.
+- `transformer`: threshold `0.203` (validation F1 `0.899`); test F1 change vs 0.5: `+0.010`.
 ## Artifacts
 Install the runtime dependencies:
 ```bash
+pip install transformers torch huggingface_hub pandas joblib scikit-learn xgboost lightgbm
 ```
 ### Transformer
 import torch
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
+MODEL_ID = "YOUR_USERNAME/YOUR_MODEL_REPO"
 texts = [
     "Rice export prices increased after new procurement rules were announced.",
 import joblib
 from huggingface_hub import hf_hub_download
+MODEL_ID = "YOUR_USERNAME/YOUR_MODEL_REPO"
 BASELINE = "logistic"
 texts = [
 ```python
 import joblib
+import torch
 from huggingface_hub import hf_hub_download
+from transformers import AutoModel, AutoTokenizer
+MODEL_ID = "YOUR_USERNAME/YOUR_MODEL_REPO"
 BASELINE = "embedding-logistic"
 texts = [
     filename=f"baselines/{BASELINE}/{BASELINE}.joblib",
 )
 artifact = joblib.load(model_path)
+tokenizer = AutoTokenizer.from_pretrained(artifact["embedding_model_name"])
+encoder = AutoModel.from_pretrained(artifact["embedding_model_name"])
+encoder.eval()
+encoded_batches = []
+batch_size = artifact.get("embedding_batch_size", 64)
+for start in range(0, len(texts), batch_size):
+    batch_texts = texts[start : start + batch_size]
+    inputs = tokenizer(
+        batch_texts,
+        padding=True,
+        truncation=True,
+        max_length=artifact.get("embedding_max_length", 256),
+        return_tensors="pt",
+    )
+    with torch.no_grad():
+        outputs = encoder(**inputs)
+    token_embeddings = outputs.last_hidden_state
+    attention_mask = inputs["attention_mask"].unsqueeze(-1).to(token_embeddings.dtype)
+    embeddings = (token_embeddings * attention_mask).sum(dim=1)
+    embeddings = embeddings / attention_mask.sum(dim=1).clamp(min=1e-9)
+    if artifact.get("normalize_embeddings", True):
+        embeddings = torch.nn.functional.normalize(embeddings, p=2, dim=1)
+    encoded_batches.append(embeddings)
+embeddings = torch.cat(encoded_batches).numpy()
 probabilities = artifact["classifier"].predict_proba(embeddings)[:, 1]
 threshold = artifact["validation_best_threshold"]["threshold"]

REPORT.md CHANGED Viewed

@@ -2,10 +2,11 @@
 - Dataset: `faodl/amis-agri-wheat`
 - Dataset subset: ``
 - Text column: `chunk_text`
 - Label column: `label`
-- Transformer: `distilbert/distilbert-base-multilingual-cased`
-- Generated at: `2026-05-19T20:24:29.088047+00:00`
 ## Dataset Summary
@@ -15,6 +16,25 @@
 | validation | 759 | 486 | 273 | 396 | 636.7 |
 | test | 762 | 470 | 292 | 397 | 643.3 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
@@ -23,14 +43,14 @@
 | logistic_tfidf | 0.470 | 0.797 | 0.688 | 0.860 | 0.764 | 0.888 | 0.827 |
 | xgboost_tfidf | 0.500 | 0.835 | 0.773 | 0.805 | 0.789 | 0.910 | 0.831 |
 | xgboost_tfidf | 0.520 | 0.835 | 0.777 | 0.798 | 0.787 | 0.910 | 0.831 |
-| embedding-logistic_sentence_embeddings | 0.500 | 0.795 | 0.711 | 0.784 | 0.746 | 0.880 | 0.825 |
-| embedding-logistic_sentence_embeddings | 0.564 | 0.799 | 0.746 | 0.723 | 0.734 | 0.880 | 0.825 |
-| embedding-svm_sentence_embeddings | 0.500 | 0.811 | 0.794 | 0.685 | 0.735 | 0.884 | 0.828 |
-| embedding-svm_sentence_embeddings | 0.406 | 0.801 | 0.716 | 0.795 | 0.753 | 0.884 | 0.828 |
-| embedding-lightgbm_sentence_embeddings | 0.500 | 0.807 | 0.756 | 0.733 | 0.744 | 0.888 | 0.823 |
-| embedding-lightgbm_sentence_embeddings | 0.540 | 0.806 | 0.761 | 0.719 | 0.739 | 0.888 | 0.823 |
-| transformer | 0.500 | 0.881 | 0.823 | 0.877 | 0.849 | 0.944 | 0.905 |
-| transformer | 0.581 | 0.881 | 0.830 | 0.866 | 0.848 | 0.944 | 0.905 |
 ## Confusion Matrices on Test Split
@@ -68,67 +88,67 @@ Rows are true labels and columns are predicted labels.
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 377 | 93 |
-| RELEVANT | 63 | 229 |
-### embedding-logistic_sentence_embeddings at threshold 0.564
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 398 | 72 |
-| RELEVANT | 81 | 211 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 418 | 52 |
-| RELEVANT | 92 | 200 |
-### embedding-svm_sentence_embeddings at threshold 0.406
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 378 | 92 |
-| RELEVANT | 60 | 232 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 401 | 69 |
-| RELEVANT | 78 | 214 |
-### embedding-lightgbm_sentence_embeddings at threshold 0.540
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 404 | 66 |
-| RELEVANT | 82 | 210 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 415 | 55 |
-| RELEVANT | 36 | 256 |
-### transformer at threshold 0.581
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
-| NOT_RELEVANT | 418 | 52 |
-| RELEVANT | 39 | 253 |
 ## Validation-Tuned Thresholds
 - `logistic_tfidf`: threshold `0.470` (validation F1 `0.779`); test F1 change vs 0.5: `+0.005`.
 - `xgboost_tfidf`: threshold `0.520` (validation F1 `0.822`); test F1 change vs 0.5: `-0.001`.
-- `embedding-logistic_sentence_embeddings`: threshold `0.564` (validation F1 `0.730`); test F1 change vs 0.5: `-0.012`.
-- `embedding-svm_sentence_embeddings`: threshold `0.406` (validation F1 `0.734`); test F1 change vs 0.5: `+0.018`.
-- `embedding-lightgbm_sentence_embeddings`: threshold `0.540` (validation F1 `0.748`); test F1 change vs 0.5: `-0.005`.
-- `transformer`: threshold `0.581` (validation F1 `0.878`); test F1 change vs 0.5: `-0.002`.
 ## Artifacts

 - Dataset: `faodl/amis-agri-wheat`
 - Dataset subset: ``
+- Dataset revision: `main`
 - Text column: `chunk_text`
 - Label column: `label`
+- Transformer: `FacebookAI/xlm-roberta-base`
+- Generated at: `2026-05-29T18:13:08.384805+00:00`
 ## Dataset Summary
 | validation | 759 | 486 | 273 | 396 | 636.7 |
 | test | 762 | 470 | 292 | 397 | 643.3 |
+## Threshold Comparison on Validation Split
+Validation metrics document threshold selection and tuning behavior; test metrics remain the primary estimate of out-of-sample performance.
+| Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
+| --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
+| logistic_tfidf | 0.500 | 0.818 | 0.718 | 0.813 | 0.763 | 0.907 | 0.867 |
+| logistic_tfidf | 0.470 | 0.823 | 0.709 | 0.864 | 0.779 | 0.907 | 0.867 |
+| xgboost_tfidf | 0.500 | 0.868 | 0.808 | 0.832 | 0.819 | 0.935 | 0.892 |
+| xgboost_tfidf | 0.520 | 0.871 | 0.816 | 0.828 | 0.822 | 0.935 | 0.892 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.783 | 0.658 | 0.824 | 0.732 | 0.862 | 0.780 |
+| embedding-logistic_sentence_embeddings | 0.521 | 0.791 | 0.673 | 0.813 | 0.736 | 0.862 | 0.780 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.804 | 0.714 | 0.758 | 0.735 | 0.869 | 0.792 |
+| embedding-svm_sentence_embeddings | 0.473 | 0.805 | 0.704 | 0.791 | 0.745 | 0.869 | 0.792 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.791 | 0.694 | 0.747 | 0.720 | 0.868 | 0.786 |
+| embedding-lightgbm_sentence_embeddings | 0.433 | 0.800 | 0.693 | 0.795 | 0.741 | 0.868 | 0.786 |
+| transformer | 0.500 | 0.925 | 0.894 | 0.897 | 0.896 | 0.956 | 0.914 |
+| transformer | 0.203 | 0.926 | 0.883 | 0.916 | 0.899 | 0.956 | 0.914 |
 ## Threshold Comparison on Test Split
 | Model | Threshold | Accuracy | Precision | Recall | F1 | ROC AUC | Average precision |
 | logistic_tfidf | 0.470 | 0.797 | 0.688 | 0.860 | 0.764 | 0.888 | 0.827 |
 | xgboost_tfidf | 0.500 | 0.835 | 0.773 | 0.805 | 0.789 | 0.910 | 0.831 |
 | xgboost_tfidf | 0.520 | 0.835 | 0.777 | 0.798 | 0.787 | 0.910 | 0.831 |
+| embedding-logistic_sentence_embeddings | 0.500 | 0.782 | 0.699 | 0.757 | 0.727 | 0.877 | 0.821 |
+| embedding-logistic_sentence_embeddings | 0.521 | 0.789 | 0.713 | 0.750 | 0.731 | 0.877 | 0.821 |
+| embedding-svm_sentence_embeddings | 0.500 | 0.818 | 0.778 | 0.733 | 0.755 | 0.883 | 0.824 |
+| embedding-svm_sentence_embeddings | 0.473 | 0.812 | 0.758 | 0.750 | 0.754 | 0.883 | 0.824 |
+| embedding-lightgbm_sentence_embeddings | 0.500 | 0.798 | 0.740 | 0.729 | 0.734 | 0.892 | 0.847 |
+| embedding-lightgbm_sentence_embeddings | 0.433 | 0.806 | 0.735 | 0.771 | 0.753 | 0.892 | 0.847 |
+| transformer | 0.500 | 0.885 | 0.862 | 0.832 | 0.847 | 0.943 | 0.915 |
+| transformer | 0.203 | 0.890 | 0.854 | 0.860 | 0.857 | 0.943 | 0.915 |
 ## Confusion Matrices on Test Split
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 375 | 95 |
+| RELEVANT | 71 | 221 |
+### embedding-logistic_sentence_embeddings at threshold 0.521
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 382 | 88 |
+| RELEVANT | 73 | 219 |
 ### embedding-svm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 409 | 61 |
+| RELEVANT | 78 | 214 |
+### embedding-svm_sentence_embeddings at threshold 0.473
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 400 | 70 |
+| RELEVANT | 73 | 219 |
 ### embedding-lightgbm_sentence_embeddings at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 395 | 75 |
+| RELEVANT | 79 | 213 |
+### embedding-lightgbm_sentence_embeddings at threshold 0.433
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 389 | 81 |
+| RELEVANT | 67 | 225 |
 ### transformer at threshold 0.500
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 431 | 39 |
+| RELEVANT | 49 | 243 |
+### transformer at threshold 0.203
 | True / Predicted | NOT_RELEVANT | RELEVANT |
 | --- | ---: | ---: |
+| NOT_RELEVANT | 427 | 43 |
+| RELEVANT | 41 | 251 |
 ## Validation-Tuned Thresholds
 - `logistic_tfidf`: threshold `0.470` (validation F1 `0.779`); test F1 change vs 0.5: `+0.005`.
 - `xgboost_tfidf`: threshold `0.520` (validation F1 `0.822`); test F1 change vs 0.5: `-0.001`.
+- `embedding-logistic_sentence_embeddings`: threshold `0.521` (validation F1 `0.736`); test F1 change vs 0.5: `+0.004`.
+- `embedding-svm_sentence_embeddings`: threshold `0.473` (validation F1 `0.745`); test F1 change vs 0.5: `-0.001`.
+- `embedding-lightgbm_sentence_embeddings`: threshold `0.433` (validation F1 `0.741`); test F1 change vs 0.5: `+0.018`.
+- `transformer`: threshold `0.203` (validation F1 `0.899`); test F1 change vs 0.5: `+0.010`.
 ## Artifacts

baselines/embedding-lightgbm/embedding-lightgbm.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b3f56f59c1281405d56efca4d691933dd542cee67012f1c7345dd76701fba6d7
-size 1444644

 version https://git-lfs.github.com/spec/v1
+oid sha256:3463bed6fbc93713eabd1e10f2dbb63b05f5ce1533a4ea9aaab45a753bcb5c21
+size 1444574

baselines/embedding-lightgbm/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-lightgbm/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-logistic/embedding-logistic.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8675c256f2bd7cc388d6bc6a3c61e5930f5c33b4275649c9d831f344e8412fa4
-size 4287

 version https://git-lfs.github.com/spec/v1
+oid sha256:645213b2f532b79aa9381ce2c83e1e1d47957dba20521077adcc302ac5c6a27b
+size 4361

baselines/embedding-logistic/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-logistic/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-svm/embedding-svm.joblib CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:61cbe1c99c38b69262a096054e3563b97479585fffafff10400538e65b20fdcb
-size 11696

 version https://git-lfs.github.com/spec/v1
+oid sha256:c464a859cf16feb638dfa769b9156542b9e1a35d82c9ab9035abf8ec110c44d6
+size 11770

baselines/embedding-svm/test_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

baselines/embedding-svm/validation_predictions.csv CHANGED Viewed

The diff for this file is too large to render. See raw diff

report.json CHANGED Viewed

@@ -1,8 +1,9 @@
 {
-  "created_at": "2026-05-19T20:24:29.088047+00:00",
   "config": {
     "hf_dataset": "faodl/amis-agri-wheat",
     "hf_subset": null,
     "train_split": "train",
     "validation_split": "validation",
     "test_split": "test",
@@ -10,7 +11,7 @@
     "label_col": "label",
     "group_col": "id",
     "id_col": "chunk_id",
-    "model_name": "distilbert/distilbert-base-multilingual-cased",
     "output_dir": "/content/agri-wheat-classifier",
     "max_length": 256,
     "learning_rate": 2e-05,
@@ -37,8 +38,8 @@
     "embedding_batch_size": 64,
     "positive_label_name": "RELEVANT",
     "negative_label_name": "NOT_RELEVANT",
-    "push_to_hub": true,
-    "hub_model_id": "faodl/agri-wheat-classifier",
     "hub_private_repo": false
   },
   "dataset_summary": {
@@ -85,6 +86,98 @@
         "precision": 0.7087087087087087,
         "recall": 0.8644688644688645
       },
       "test_default_0_5": {
         "threshold": 0.5,
         "accuracy": 0.8031496062992126,
@@ -189,6 +282,98 @@
         "precision": 0.8158844765342961,
         "recall": 0.8278388278388278
       },
       "test_default_0_5": {
         "threshold": 0.5,
         "accuracy": 0.8346456692913385,
@@ -289,102 +474,194 @@
       "artifact_dir": "/content/agri-wheat-classifier/baselines/embedding-logistic",
       "artifact_file": "/content/agri-wheat-classifier/baselines/embedding-logistic/embedding-logistic.joblib",
       "validation_best_threshold": {
-        "threshold": 0.563937513505343,
-        "f1": 0.7301038062283736,
-        "precision": 0.6918032786885245,
-        "recall": 0.7728937728937729
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.7952755905511811,
-        "precision": 0.7111801242236024,
-        "recall": 0.7842465753424658,
-        "f1": 0.745928338762215,
         "confusion_matrix": [
           [
-            377,
-            93
           ],
           [
-            63,
-            229
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.8568181818181818,
-            "recall": 0.8021276595744681,
-            "f1-score": 0.8285714285714286,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.7111801242236024,
-            "recall": 0.7842465753424658,
-            "f1-score": 0.745928338762215,
             "support": 292.0
           },
-          "accuracy": 0.7952755905511811,
           "macro avg": {
-            "precision": 0.7839991530208921,
-            "recall": 0.7931871174584669,
-            "f1-score": 0.7872498836668218,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8010093723462433,
-            "recall": 0.7952755905511811,
-            "f1-score": 0.7969024230277404,
             "support": 762.0
           }
         },
-        "roc_auc": 0.8801005537744098,
-        "average_precision": 0.8246628238347572
       },
       "test_optimal_threshold": {
-        "threshold": 0.563937513505343,
-        "accuracy": 0.7992125984251969,
-        "precision": 0.7455830388692579,
-        "recall": 0.7226027397260274,
-        "f1": 0.7339130434782609,
         "confusion_matrix": [
           [
-            398,
-            72
           ],
           [
-            81,
-            211
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.8308977035490606,
-            "recall": 0.8468085106382979,
-            "f1-score": 0.8387776606954689,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.7455830388692579,
-            "recall": 0.7226027397260274,
-            "f1-score": 0.7339130434782609,
             "support": 292.0
           },
-          "accuracy": 0.7992125984251969,
           "macro avg": {
-            "precision": 0.7882403712091592,
-            "recall": 0.7847056251821627,
-            "f1-score": 0.7863453520868648,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.7982049449053567,
-            "recall": 0.7992125984251969,
-            "f1-score": 0.7985933191896621,
             "support": 762.0
           }
         },
-        "roc_auc": 0.8801005537744098,
-        "average_precision": 0.8246628238347572
       }
     },
     {
@@ -394,102 +671,194 @@
       "artifact_dir": "/content/agri-wheat-classifier/baselines/embedding-svm",
       "artifact_file": "/content/agri-wheat-classifier/baselines/embedding-svm/embedding-svm.joblib",
       "validation_best_threshold": {
-        "threshold": 0.40634467461913637,
-        "f1": 0.7335526315789473,
-        "precision": 0.6656716417910448,
-        "recall": 0.8168498168498168
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.8110236220472441,
-        "precision": 0.7936507936507936,
-        "recall": 0.684931506849315,
-        "f1": 0.7352941176470589,
         "confusion_matrix": [
           [
-            418,
-            52
           ],
           [
-            92,
-            200
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.8196078431372549,
-            "recall": 0.8893617021276595,
-            "f1-score": 0.8530612244897959,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.7936507936507936,
-            "recall": 0.684931506849315,
-            "f1-score": 0.7352941176470589,
             "support": 292.0
           },
-          "accuracy": 0.8110236220472441,
           "macro avg": {
-            "precision": 0.8066293183940243,
-            "recall": 0.7871466044884873,
-            "f1-score": 0.7941776710684274,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8096610472710519,
-            "recall": 0.8110236220472441,
-            "f1-score": 0.8079326218676448,
             "support": 762.0
           }
         },
-        "roc_auc": 0.8844068784610901,
-        "average_precision": 0.8275847340102567
       },
       "test_optimal_threshold": {
-        "threshold": 0.40634467461913637,
-        "accuracy": 0.800524934383202,
-        "precision": 0.7160493827160493,
-        "recall": 0.7945205479452054,
-        "f1": 0.7532467532467533,
         "confusion_matrix": [
           [
-            378,
-            92
           ],
           [
-            60,
-            232
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.863013698630137,
-            "recall": 0.8042553191489362,
-            "f1-score": 0.8325991189427313,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.7160493827160493,
-            "recall": 0.7945205479452054,
-            "f1-score": 0.7532467532467533,
             "support": 292.0
           },
-          "accuracy": 0.800524934383202,
           "macro avg": {
-            "precision": 0.7895315406730932,
-            "recall": 0.7993879335470708,
-            "f1-score": 0.7929229360947423,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8066966641853685,
-            "recall": 0.800524934383202,
-            "f1-score": 0.802191125788892,
             "support": 762.0
           }
         },
-        "roc_auc": 0.8844068784610901,
-        "average_precision": 0.8275847340102567
       }
     },
     {
@@ -499,205 +868,389 @@
       "artifact_dir": "/content/agri-wheat-classifier/baselines/embedding-lightgbm",
       "artifact_file": "/content/agri-wheat-classifier/baselines/embedding-lightgbm/embedding-lightgbm.joblib",
       "validation_best_threshold": {
-        "threshold": 0.5404668230512064,
-        "f1": 0.7482014388489209,
-        "precision": 0.734982332155477,
-        "recall": 0.7619047619047619
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.8070866141732284,
-        "precision": 0.7561837455830389,
-        "recall": 0.7328767123287672,
-        "f1": 0.7443478260869565,
         "confusion_matrix": [
           [
-            401,
-            69
           ],
           [
-            78,
-            214
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.837160751565762,
-            "recall": 0.8531914893617021,
-            "f1-score": 0.845100105374078,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.7561837455830389,
-            "recall": 0.7328767123287672,
-            "f1-score": 0.7443478260869565,
             "support": 292.0
           },
-          "accuracy": 0.8070866141732284,
           "macro avg": {
-            "precision": 0.7966722485744004,
-            "recall": 0.7930341008452346,
-            "f1-score": 0.7947239657305172,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8061301928427238,
-            "recall": 0.8070866141732284,
-            "f1-score": 0.8064916203979107,
             "support": 762.0
           }
         },
-        "roc_auc": 0.8878825415330808,
-        "average_precision": 0.8230959168683762
       },
       "test_optimal_threshold": {
-        "threshold": 0.5404668230512064,
         "accuracy": 0.8057742782152231,
-        "precision": 0.7608695652173914,
-        "recall": 0.7191780821917808,
-        "f1": 0.7394366197183099,
         "confusion_matrix": [
           [
-            404,
-            66
           ],
           [
-            82,
-            210
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.831275720164609,
-            "recall": 0.8595744680851064,
-            "f1-score": 0.8451882845188284,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.7608695652173914,
-            "recall": 0.7191780821917808,
-            "f1-score": 0.7394366197183099,
             "support": 292.0
           },
           "accuracy": 0.8057742782152231,
           "macro avg": {
-            "precision": 0.7960726426910002,
-            "recall": 0.7893762751384437,
-            "f1-score": 0.7923124521185692,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8042959337543892,
             "recall": 0.8057742782152231,
-            "f1-score": 0.80466402451653,
             "support": 762.0
           }
         },
-        "roc_auc": 0.8878825415330808,
-        "average_precision": 0.8230959168683762
       }
     },
     {
       "model_type": "transformer",
-      "model_name": "distilbert/distilbert-base-multilingual-cased",
       "artifact_dir": "/content/agri-wheat-classifier/transformer",
       "validation_best_threshold": {
-        "threshold": 0.5806344747543335,
-        "f1": 0.8776978417266188,
-        "precision": 0.8621908127208481,
-        "recall": 0.8937728937728938
       },
       "test_default_0_5": {
         "threshold": 0.5,
-        "accuracy": 0.8805774278215223,
-        "precision": 0.8231511254019293,
-        "recall": 0.8767123287671232,
-        "f1": 0.8490878938640133,
         "confusion_matrix": [
           [
-            415,
-            55
           ],
           [
-            36,
-            256
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9201773835920177,
-            "recall": 0.8829787234042553,
-            "f1-score": 0.9011943539630836,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.8231511254019293,
-            "recall": 0.8767123287671232,
-            "f1-score": 0.8490878938640133,
             "support": 292.0
           },
-          "accuracy": 0.8805774278215223,
           "macro avg": {
-            "precision": 0.8716642544969735,
-            "recall": 0.8798455260856892,
-            "f1-score": 0.8751411239135485,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8829967177238999,
-            "recall": 0.8805774278215223,
-            "f1-score": 0.8812270490432298,
             "support": 762.0
           }
         },
-        "roc_auc": 0.9439886330515885,
-        "average_precision": 0.905280557562998
       },
       "test_optimal_threshold": {
-        "threshold": 0.5806344747543335,
-        "accuracy": 0.8805774278215223,
-        "precision": 0.8295081967213115,
-        "recall": 0.8664383561643836,
-        "f1": 0.847571189279732,
         "confusion_matrix": [
           [
-            418,
-            52
           ],
           [
-            39,
-            253
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
-            "precision": 0.9146608315098468,
-            "recall": 0.8893617021276595,
-            "f1-score": 0.9018338727076591,
             "support": 470.0
           },
           "RELEVANT": {
-            "precision": 0.8295081967213115,
-            "recall": 0.8664383561643836,
-            "f1-score": 0.847571189279732,
             "support": 292.0
           },
-          "accuracy": 0.8805774278215223,
           "macro avg": {
-            "precision": 0.8720845141155791,
-            "recall": 0.8779000291460215,
-            "f1-score": 0.8747025309936955,
             "support": 762.0
           },
           "weighted avg": {
-            "precision": 0.8820301630606968,
-            "recall": 0.8805774278215223,
-            "f1-score": 0.8810402984806845,
             "support": 762.0
           }
         },
-        "roc_auc": 0.9439886330515885,
-        "average_precision": 0.905280557562998
       }
     }
   ]

 {
+  "created_at": "2026-05-29T18:13:08.384805+00:00",
   "config": {
     "hf_dataset": "faodl/amis-agri-wheat",
     "hf_subset": null,
+    "hf_revision": "main",
     "train_split": "train",
     "validation_split": "validation",
     "test_split": "test",
     "label_col": "label",
     "group_col": "id",
     "id_col": "chunk_id",
+    "model_name": "FacebookAI/xlm-roberta-base",
     "output_dir": "/content/agri-wheat-classifier",
     "max_length": 256,
     "learning_rate": 2e-05,
     "embedding_batch_size": 64,
     "positive_label_name": "RELEVANT",
     "negative_label_name": "NOT_RELEVANT",
+    "push_to_hub": false,
+    "hub_model_id": null,
     "hub_private_repo": false
   },
   "dataset_summary": {
         "precision": 0.7087087087087087,
         "recall": 0.8644688644688645
       },
+      "validation_default_0_5": {
+        "threshold": 0.5,
+        "accuracy": 0.8181818181818182,
+        "precision": 0.7184466019417476,
+        "recall": 0.8131868131868132,
+        "f1": 0.7628865979381443,
+        "confusion_matrix": [
+          [
+            399,
+            87
+          ],
+          [
+            51,
+            222
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.8866666666666667,
+            "recall": 0.8209876543209876,
+            "f1-score": 0.8525641025641025,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.7184466019417476,
+            "recall": 0.8131868131868132,
+            "f1-score": 0.7628865979381443,
+            "support": 273.0
+          },
+          "accuracy": 0.8181818181818182,
+          "macro avg": {
+            "precision": 0.8025566343042072,
+            "recall": 0.8170872337539004,
+            "f1-score": 0.8077253502511235,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8261606354810239,
+            "recall": 0.8181818181818182,
+            "f1-score": 0.8203085574219594,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.9070908515352959,
+        "average_precision": 0.8669161076776083
+      },
+      "validation_optimal_threshold": {
+        "threshold": 0.46961394282689456,
+        "accuracy": 0.8234519104084321,
+        "precision": 0.7087087087087087,
+        "recall": 0.8644688644688645,
+        "f1": 0.7788778877887789,
+        "confusion_matrix": [
+          [
+            389,
+            97
+          ],
+          [
+            37,
+            236
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.9131455399061033,
+            "recall": 0.8004115226337448,
+            "f1-score": 0.8530701754385965,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.7087087087087087,
+            "recall": 0.8644688644688645,
+            "f1-score": 0.7788778877887789,
+            "support": 273.0
+          },
+          "accuracy": 0.8234519104084321,
+          "macro avg": {
+            "precision": 0.810927124307406,
+            "recall": 0.8324401935513046,
+            "f1-score": 0.8159740316136876,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8396129247323368,
+            "recall": 0.8234519104084321,
+            "f1-score": 0.8263844118965672,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.9070908515352959,
+        "average_precision": 0.8669161076776083
+      },
       "test_default_0_5": {
         "threshold": 0.5,
         "accuracy": 0.8031496062992126,
         "precision": 0.8158844765342961,
         "recall": 0.8278388278388278
       },
+      "validation_default_0_5": {
+        "threshold": 0.5,
+        "accuracy": 0.8682476943346509,
+        "precision": 0.8078291814946619,
+        "recall": 0.8315018315018315,
+        "f1": 0.8194945848375451,
+        "confusion_matrix": [
+          [
+            432,
+            54
+          ],
+          [
+            46,
+            227
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.9037656903765691,
+            "recall": 0.8888888888888888,
+            "f1-score": 0.8962655601659751,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.8078291814946619,
+            "recall": 0.8315018315018315,
+            "f1-score": 0.8194945848375451,
+            "support": 273.0
+          },
+          "accuracy": 0.8682476943346509,
+          "macro avg": {
+            "precision": 0.8557974359356155,
+            "recall": 0.8601953601953602,
+            "f1-score": 0.8578800725017601,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8692588828340648,
+            "recall": 0.8682476943346509,
+            "f1-score": 0.8686522844549588,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.9346915087655827,
+        "average_precision": 0.8916128406855647
+      },
+      "validation_optimal_threshold": {
+        "threshold": 0.5195086002349854,
+        "accuracy": 0.8708827404479579,
+        "precision": 0.8158844765342961,
+        "recall": 0.8278388278388278,
+        "f1": 0.8218181818181818,
+        "confusion_matrix": [
+          [
+            435,
+            51
+          ],
+          [
+            47,
+            226
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.9024896265560166,
+            "recall": 0.8950617283950617,
+            "f1-score": 0.8987603305785123,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.8158844765342961,
+            "recall": 0.8278388278388278,
+            "f1-score": 0.8218181818181818,
+            "support": 273.0
+          },
+          "accuracy": 0.8708827404479579,
+          "macro avg": {
+            "precision": 0.8591870515451563,
+            "recall": 0.8614502781169447,
+            "f1-score": 0.8602892561983471,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8713391575758721,
+            "recall": 0.8708827404479579,
+            "f1-score": 0.8710854865579982,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.9346915087655827,
+        "average_precision": 0.8916128406855647
+      },
       "test_default_0_5": {
         "threshold": 0.5,
         "accuracy": 0.8346456692913385,
       "artifact_dir": "/content/agri-wheat-classifier/baselines/embedding-logistic",
       "artifact_file": "/content/agri-wheat-classifier/baselines/embedding-logistic/embedding-logistic.joblib",
       "validation_best_threshold": {
+        "threshold": 0.521271516877752,
+        "f1": 0.7363184079601991,
+        "precision": 0.6727272727272727,
+        "recall": 0.8131868131868132
+      },
+      "validation_default_0_5": {
+        "threshold": 0.5,
+        "accuracy": 0.782608695652174,
+        "precision": 0.6578947368421053,
+        "recall": 0.8241758241758241,
+        "f1": 0.7317073170731707,
+        "confusion_matrix": [
+          [
+            369,
+            117
+          ],
+          [
+            48,
+            225
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.8848920863309353,
+            "recall": 0.7592592592592593,
+            "f1-score": 0.8172757475083057,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.6578947368421053,
+            "recall": 0.8241758241758241,
+            "f1-score": 0.7317073170731707,
+            "support": 273.0
+          },
+          "accuracy": 0.782608695652174,
+          "macro avg": {
+            "precision": 0.7713934115865203,
+            "recall": 0.7917175417175417,
+            "f1-score": 0.7744915322907382,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8032448183329766,
+            "recall": 0.782608695652174,
+            "f1-score": 0.7864981697628618,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.8619213434028248,
+        "average_precision": 0.7798827839342581
+      },
+      "validation_optimal_threshold": {
+        "threshold": 0.521271516877752,
+        "accuracy": 0.7905138339920948,
+        "precision": 0.6727272727272727,
+        "recall": 0.8131868131868132,
+        "f1": 0.736318407960199,
+        "confusion_matrix": [
+          [
+            378,
+            108
+          ],
+          [
+            51,
+            222
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.8811188811188811,
+            "recall": 0.7777777777777778,
+            "f1-score": 0.8262295081967214,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.6727272727272727,
+            "recall": 0.8131868131868132,
+            "f1-score": 0.736318407960199,
+            "support": 273.0
+          },
+          "accuracy": 0.7905138339920948,
+          "macro avg": {
+            "precision": 0.7769230769230769,
+            "recall": 0.7954822954822955,
+            "f1-score": 0.7812739580784602,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8061637966776306,
+            "recall": 0.7905138339920948,
+            "f1-score": 0.7938899424989999,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.8619213434028248,
+        "average_precision": 0.7798827839342581
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.7821522309711286,
+        "precision": 0.6993670886075949,
+        "recall": 0.7568493150684932,
+        "f1": 0.7269736842105263,
         "confusion_matrix": [
           [
+            375,
+            95
           ],
           [
+            71,
+            221
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.8408071748878924,
+            "recall": 0.7978723404255319,
+            "f1-score": 0.8187772925764192,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.6993670886075949,
+            "recall": 0.7568493150684932,
+            "f1-score": 0.7269736842105263,
             "support": 292.0
           },
+          "accuracy": 0.7821522309711286,
           "macro avg": {
+            "precision": 0.7700871317477436,
+            "recall": 0.7773608277470125,
+            "f1-score": 0.7728754883934728,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.7866070368382246,
+            "recall": 0.7821522309711286,
+            "f1-score": 0.783597957087127,
             "support": 762.0
           }
         },
+        "roc_auc": 0.8769309239288836,
+        "average_precision": 0.8205790680541594
       },
       "test_optimal_threshold": {
+        "threshold": 0.521271516877752,
+        "accuracy": 0.7887139107611548,
+        "precision": 0.7133550488599348,
+        "recall": 0.75,
+        "f1": 0.7312186978297162,
         "confusion_matrix": [
           [
+            382,
+            88
           ],
           [
+            73,
+            219
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.8395604395604396,
+            "recall": 0.8127659574468085,
+            "f1-score": 0.825945945945946,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.7133550488599348,
+            "recall": 0.75,
+            "f1-score": 0.7312186978297162,
             "support": 292.0
           },
+          "accuracy": 0.7887139107611548,
           "macro avg": {
+            "precision": 0.7764577442101872,
+            "recall": 0.7813829787234042,
+            "f1-score": 0.778582321887831,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.7911982688458105,
+            "recall": 0.7887139107611548,
+            "f1-score": 0.7896462655654485,
             "support": 762.0
           }
         },
+        "roc_auc": 0.8769309239288836,
+        "average_precision": 0.8205790680541594
       }
     },
     {
       "artifact_dir": "/content/agri-wheat-classifier/baselines/embedding-svm",
       "artifact_file": "/content/agri-wheat-classifier/baselines/embedding-svm/embedding-svm.joblib",
       "validation_best_threshold": {
+        "threshold": 0.47291079297616506,
+        "f1": 0.7448275862068966,
+        "precision": 0.7035830618892508,
+        "recall": 0.7912087912087912
+      },
+      "validation_default_0_5": {
+        "threshold": 0.5,
+        "accuracy": 0.8036890645586298,
+        "precision": 0.7137931034482758,
+        "recall": 0.7582417582417582,
+        "f1": 0.7353463587921847,
+        "confusion_matrix": [
+          [
+            403,
+            83
+          ],
+          [
+            66,
+            207
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.8592750533049041,
+            "recall": 0.8292181069958847,
+            "f1-score": 0.8439790575916231,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.7137931034482758,
+            "recall": 0.7582417582417582,
+            "f1-score": 0.7353463587921847,
+            "support": 273.0
+          },
+          "accuracy": 0.8036890645586298,
+          "macro avg": {
+            "precision": 0.78653407837659,
+            "recall": 0.7937299326188214,
+            "f1-score": 0.7896627081919039,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8069475535541011,
+            "recall": 0.8036890645586298,
+            "f1-score": 0.8049056362843152,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.8689835541687394,
+        "average_precision": 0.7918617140757781
+      },
+      "validation_optimal_threshold": {
+        "threshold": 0.47291079297616506,
+        "accuracy": 0.8050065876152833,
+        "precision": 0.7035830618892508,
+        "recall": 0.7912087912087912,
+        "f1": 0.7448275862068966,
+        "confusion_matrix": [
+          [
+            395,
+            91
+          ],
+          [
+            57,
+            216
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.8738938053097345,
+            "recall": 0.8127572016460906,
+            "f1-score": 0.8422174840085288,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.7035830618892508,
+            "recall": 0.7912087912087912,
+            "f1-score": 0.7448275862068966,
+            "support": 273.0
+          },
+          "accuracy": 0.8050065876152833,
+          "macro avg": {
+            "precision": 0.7887384335994927,
+            "recall": 0.8019829964274409,
+            "f1-score": 0.7935225351077126,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8126357908778609,
+            "recall": 0.8050065876152833,
+            "f1-score": 0.8071879160245424,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.8689835541687394,
+        "average_precision": 0.7918617140757781
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.8175853018372703,
+        "precision": 0.7781818181818182,
+        "recall": 0.7328767123287672,
+        "f1": 0.7548500881834215,
         "confusion_matrix": [
           [
+            409,
+            61
           ],
           [
+            78,
+            214
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.839835728952772,
+            "recall": 0.8702127659574468,
+            "f1-score": 0.8547544409613375,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.7781818181818182,
+            "recall": 0.7328767123287672,
+            "f1-score": 0.7548500881834215,
             "support": 292.0
           },
+          "accuracy": 0.8175853018372703,
           "macro avg": {
+            "precision": 0.8090087735672951,
+            "recall": 0.801544739143107,
+            "f1-score": 0.8048022645723795,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.8162098208883121,
+            "recall": 0.8175853018372703,
+            "f1-score": 0.8164708832039208,
             "support": 762.0
           }
         },
+        "roc_auc": 0.8834814922763043,
+        "average_precision": 0.8241931351812108
       },
       "test_optimal_threshold": {
+        "threshold": 0.47291079297616506,
+        "accuracy": 0.8123359580052494,
+        "precision": 0.7577854671280276,
+        "recall": 0.75,
+        "f1": 0.7538726333907056,
         "confusion_matrix": [
           [
+            400,
+            70
           ],
           [
+            73,
+            219
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.8456659619450317,
+            "recall": 0.851063829787234,
+            "f1-score": 0.848356309650053,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.7577854671280276,
+            "recall": 0.75,
+            "f1-score": 0.7538726333907056,
             "support": 292.0
           },
+          "accuracy": 0.8123359580052494,
           "macro avg": {
+            "precision": 0.8017257145365297,
+            "recall": 0.800531914893617,
+            "f1-score": 0.8011144715203793,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.8119899718051824,
+            "recall": 0.8123359580052494,
+            "f1-score": 0.8121499665165498,
             "support": 762.0
           }
         },
+        "roc_auc": 0.8834814922763043,
+        "average_precision": 0.8241931351812108
       }
     },
     {
       "artifact_dir": "/content/agri-wheat-classifier/baselines/embedding-lightgbm",
       "artifact_file": "/content/agri-wheat-classifier/baselines/embedding-lightgbm/embedding-lightgbm.joblib",
       "validation_best_threshold": {
+        "threshold": 0.4330901925282479,
+        "f1": 0.7406143344709898,
+        "precision": 0.6932907348242812,
+        "recall": 0.7948717948717948
+      },
+      "validation_default_0_5": {
+        "threshold": 0.5,
+        "accuracy": 0.7905138339920948,
+        "precision": 0.6938775510204082,
+        "recall": 0.7472527472527473,
+        "f1": 0.7195767195767195,
+        "confusion_matrix": [
+          [
+            396,
+            90
+          ],
+          [
+            69,
+            204
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.8516129032258064,
+            "recall": 0.8148148148148148,
+            "f1-score": 0.832807570977918,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.6938775510204082,
+            "recall": 0.7472527472527473,
+            "f1-score": 0.7195767195767195,
+            "support": 273.0
+          },
+          "accuracy": 0.7905138339920948,
+          "macro avg": {
+            "precision": 0.7727452271231072,
+            "recall": 0.7810337810337811,
+            "f1-score": 0.7761921452773188,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.7948780532230743,
+            "recall": 0.7905138339920948,
+            "f1-score": 0.7920802686952735,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.8684408869594056,
+        "average_precision": 0.7857728796203002
+      },
+      "validation_optimal_threshold": {
+        "threshold": 0.4330901925282479,
+        "accuracy": 0.7997364953886693,
+        "precision": 0.6932907348242812,
+        "recall": 0.7948717948717948,
+        "f1": 0.7406143344709898,
+        "confusion_matrix": [
+          [
+            390,
+            96
+          ],
+          [
+            56,
+            217
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.874439461883408,
+            "recall": 0.8024691358024691,
+            "f1-score": 0.8369098712446352,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.6932907348242812,
+            "recall": 0.7948717948717948,
+            "f1-score": 0.7406143344709898,
+            "support": 273.0
+          },
+          "accuracy": 0.7997364953886693,
+          "macro avg": {
+            "precision": 0.7838650983538447,
+            "recall": 0.7986704653371319,
+            "f1-score": 0.7887621028578125,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.8092832003720225,
+            "recall": 0.7997364953886693,
+            "f1-score": 0.8022739271877114,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.8684408869594056,
+        "average_precision": 0.7857728796203002
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.7979002624671916,
+        "precision": 0.7395833333333334,
+        "recall": 0.7294520547945206,
+        "f1": 0.7344827586206897,
         "confusion_matrix": [
           [
+            395,
+            75
           ],
           [
+            79,
+            213
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.8333333333333334,
+            "recall": 0.8404255319148937,
+            "f1-score": 0.836864406779661,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.7395833333333334,
+            "recall": 0.7294520547945206,
+            "f1-score": 0.7344827586206897,
             "support": 292.0
           },
+          "accuracy": 0.7979002624671916,
           "macro avg": {
+            "precision": 0.7864583333333334,
+            "recall": 0.7849387933547072,
+            "f1-score": 0.7856735827001753,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.7974081364829396,
+            "recall": 0.7979002624671916,
+            "f1-score": 0.7976315442305539,
             "support": 762.0
           }
         },
+        "roc_auc": 0.8918245409501604,
+        "average_precision": 0.8474870908097023
       },
       "test_optimal_threshold": {
+        "threshold": 0.4330901925282479,
         "accuracy": 0.8057742782152231,
+        "precision": 0.7352941176470589,
+        "recall": 0.7705479452054794,
+        "f1": 0.7525083612040134,
         "confusion_matrix": [
           [
+            389,
+            81
           ],
           [
+            67,
+            225
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.8530701754385965,
+            "recall": 0.8276595744680851,
+            "f1-score": 0.8401727861771058,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.7352941176470589,
+            "recall": 0.7705479452054794,
+            "f1-score": 0.7525083612040134,
             "support": 292.0
           },
           "accuracy": 0.8057742782152231,
           "macro avg": {
+            "precision": 0.7941821465428277,
+            "recall": 0.7991037598367823,
+            "f1-score": 0.7963405736905596,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.8079381427940704,
             "recall": 0.8057742782152231,
+            "f1-score": 0.8065795944551334,
             "support": 762.0
           }
         },
+        "roc_auc": 0.8918245409501604,
+        "average_precision": 0.8474870908097023
       }
     },
     {
       "model_type": "transformer",
+      "model_name": "FacebookAI/xlm-roberta-base",
       "artifact_dir": "/content/agri-wheat-classifier/transformer",
       "validation_best_threshold": {
+        "threshold": 0.2030746340751648,
+        "f1": 0.8992805755395683,
+        "precision": 0.8833922261484098,
+        "recall": 0.9157509157509157
+      },
+      "validation_default_0_5": {
+        "threshold": 0.5,
+        "accuracy": 0.924901185770751,
+        "precision": 0.8941605839416058,
+        "recall": 0.8974358974358975,
+        "f1": 0.8957952468007313,
+        "confusion_matrix": [
+          [
+            457,
+            29
+          ],
+          [
+            28,
+            245
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.9422680412371134,
+            "recall": 0.9403292181069959,
+            "f1-score": 0.94129763130793,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.8941605839416058,
+            "recall": 0.8974358974358975,
+            "f1-score": 0.8957952468007313,
+            "support": 273.0
+          },
+          "accuracy": 0.924901185770751,
+          "macro avg": {
+            "precision": 0.9182143125893596,
+            "recall": 0.9188825577714467,
+            "f1-score": 0.9185464390543306,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.9249645684549348,
+            "recall": 0.924901185770751,
+            "f1-score": 0.9249311609911115,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.9563906600943638,
+        "average_precision": 0.914270669615161
+      },
+      "validation_optimal_threshold": {
+        "threshold": 0.2030746340751648,
+        "accuracy": 0.9262187088274044,
+        "precision": 0.8833922261484098,
+        "recall": 0.9157509157509157,
+        "f1": 0.8992805755395683,
+        "confusion_matrix": [
+          [
+            453,
+            33
+          ],
+          [
+            23,
+            250
+          ]
+        ],
+        "classification_report": {
+          "NOT_RELEVANT": {
+            "precision": 0.9516806722689075,
+            "recall": 0.9320987654320988,
+            "f1-score": 0.9417879417879418,
+            "support": 486.0
+          },
+          "RELEVANT": {
+            "precision": 0.8833922261484098,
+            "recall": 0.9157509157509157,
+            "f1-score": 0.8992805755395683,
+            "support": 273.0
+          },
+          "accuracy": 0.9262187088274044,
+          "macro avg": {
+            "precision": 0.9175364492086586,
+            "recall": 0.9239248405915073,
+            "f1-score": 0.920534258663755,
+            "support": 759.0
+          },
+          "weighted avg": {
+            "precision": 0.9271184248500723,
+            "recall": 0.9262187088274044,
+            "f1-score": 0.9264987310029535,
+            "support": 759.0
+          }
+        },
+        "roc_auc": 0.9563906600943638,
+        "average_precision": 0.914270669615161
       },
       "test_default_0_5": {
         "threshold": 0.5,
+        "accuracy": 0.884514435695538,
+        "precision": 0.8617021276595744,
+        "recall": 0.8321917808219178,
+        "f1": 0.8466898954703833,
         "confusion_matrix": [
           [
+            431,
+            39
           ],
           [
+            49,
+            243
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.8979166666666667,
+            "recall": 0.9170212765957447,
+            "f1-score": 0.9073684210526316,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.8617021276595744,
+            "recall": 0.8321917808219178,
+            "f1-score": 0.8466898954703833,
             "support": 292.0
           },
+          "accuracy": 0.884514435695538,
           "macro avg": {
+            "precision": 0.8798093971631206,
+            "recall": 0.8746065287088313,
+            "f1-score": 0.8770291582615075,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.8840391792781221,
+            "recall": 0.884514435695538,
+            "f1-score": 0.8841162826405365,
             "support": 762.0
           }
         },
+        "roc_auc": 0.9430960361410667,
+        "average_precision": 0.9145930239314757
       },
       "test_optimal_threshold": {
+        "threshold": 0.2030746340751648,
+        "accuracy": 0.889763779527559,
+        "precision": 0.8537414965986394,
+        "recall": 0.8595890410958904,
+        "f1": 0.856655290102389,
         "confusion_matrix": [
           [
+            427,
+            43
           ],
           [
+            41,
+            251
           ]
         ],
         "classification_report": {
           "NOT_RELEVANT": {
+            "precision": 0.9123931623931624,
+            "recall": 0.9085106382978724,
+            "f1-score": 0.9104477611940298,
             "support": 470.0
           },
           "RELEVANT": {
+            "precision": 0.8537414965986394,
+            "recall": 0.8595890410958904,
+            "f1-score": 0.856655290102389,
             "support": 292.0
           },
+          "accuracy": 0.889763779527559,
           "macro avg": {
+            "precision": 0.8830673294959008,
+            "recall": 0.8840498396968814,
+            "f1-score": 0.8835515256482094,
             "support": 762.0
           },
           "weighted avg": {
+            "precision": 0.8899177209075971,
+            "recall": 0.889763779527559,
+            "f1-score": 0.8898343733216425,
             "support": 762.0
           }
         },
+        "roc_auc": 0.9430960361410667,
+        "average_precision": 0.9145930239314757
       }
     }
   ]

transformer/checkpoint-1135/config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "add_cross_attention": false,
+  "architectures": [
+    "XLMRobertaForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "dtype": "float32",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "NOT_RELEVANT",
+    "1": "RELEVANT"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
+  "label2id": {
+    "NOT_RELEVANT": 0,
+    "RELEVANT": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "tie_word_embeddings": true,
+  "transformers_version": "5.9.0",
+  "type_vocab_size": 1,
+  "use_cache": false,
+  "vocab_size": 250002
+}

transformer/checkpoint-1135/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49e9acb9da03ba022fefe40028a1df7f7fa4ccef569677e26812cafd225ef8ae
+size 1112205008

transformer/checkpoint-1135/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4cb1db50ca28d52ccaa8a7b730432372aa61a6a1769b32667328207c647b3a82
+size 2224532875

transformer/checkpoint-1135/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7ce43043e72e4492ea95f56e147b44a9c5f8c96c4094efb5609bed070ff06c7
+size 14645

transformer/checkpoint-1135/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e3e475419c2177afcc69f2e211ad481cd1b96ff1a6e3f24aee6b25a1983c6e1
+size 1383

transformer/checkpoint-1135/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06462f15ba58fbb78a4dc0cc4e0eca4e82f972fc107ff3f7ac0f4c4d6c6eba6e
+size 1465

transformer/checkpoint-1135/tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc02d42fb2a10276563109e2287cc0dbe6b595d5b3b3401c7cfeffc0b7e20270
+size 17098351

transformer/checkpoint-1135/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "add_prefix_space": true,
+  "backend": "tokenizers",
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "is_local": false,
+  "local_files_only": false,
+  "mask_token": "<mask>",
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
+}

transformer/checkpoint-1135/trainer_state.json ADDED Viewed

	@@ -0,0 +1,423 @@

+{
+  "best_global_step": 908,
+  "best_metric": 0.8957952468007313,
+  "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-908",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 1135,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.11013215859030837,
+      "grad_norm": 3.4615602493286133,
+      "learning_rate": 4.247787610619469e-06,
+      "loss": 0.7144061279296875,
+      "step": 25
+    },
+    {
+      "epoch": 0.22026431718061673,
+      "grad_norm": 6.50156307220459,
+      "learning_rate": 8.672566371681418e-06,
+      "loss": 0.6882943725585937,
+      "step": 50
+    },
+    {
+      "epoch": 0.3303964757709251,
+      "grad_norm": 4.099428176879883,
+      "learning_rate": 1.3097345132743363e-05,
+      "loss": 0.6711004638671875,
+      "step": 75
+    },
+    {
+      "epoch": 0.44052863436123346,
+      "grad_norm": 7.663174629211426,
+      "learning_rate": 1.7522123893805313e-05,
+      "loss": 0.681163330078125,
+      "step": 100
+    },
+    {
+      "epoch": 0.5506607929515418,
+      "grad_norm": 10.003649711608887,
+      "learning_rate": 1.9784735812133072e-05,
+      "loss": 0.672431640625,
+      "step": 125
+    },
+    {
+      "epoch": 0.6607929515418502,
+      "grad_norm": 4.136000633239746,
+      "learning_rate": 1.929549902152642e-05,
+      "loss": 0.6405279541015625,
+      "step": 150
+    },
+    {
+      "epoch": 0.7709251101321586,
+      "grad_norm": 8.746106147766113,
+      "learning_rate": 1.8806262230919768e-05,
+      "loss": 0.6329603576660157,
+      "step": 175
+    },
+    {
+      "epoch": 0.8810572687224669,
+      "grad_norm": 6.302291393280029,
+      "learning_rate": 1.8317025440313113e-05,
+      "loss": 0.48342845916748045,
+      "step": 200
+    },
+    {
+      "epoch": 0.9911894273127754,
+      "grad_norm": 9.206014633178711,
+      "learning_rate": 1.7827788649706457e-05,
+      "loss": 0.498061408996582,
+      "step": 225
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8434622467771639,
+      "eval_loss": 0.3247315287590027,
+      "eval_precision": 0.8481481481481481,
+      "eval_recall": 0.8388278388278388,
+      "eval_roc_auc": 0.9395378284267173,
+      "eval_runtime": 2.8582,
+      "eval_samples_per_second": 265.551,
+      "eval_steps_per_second": 8.397,
+      "step": 227
+    },
+    {
+      "epoch": 1.1013215859030836,
+      "grad_norm": 36.54235076904297,
+      "learning_rate": 1.7338551859099805e-05,
+      "loss": 0.34838932037353515,
+      "step": 250
+    },
+    {
+      "epoch": 1.2114537444933922,
+      "grad_norm": 11.171507835388184,
+      "learning_rate": 1.6849315068493153e-05,
+      "loss": 0.4250565719604492,
+      "step": 275
+    },
+    {
+      "epoch": 1.3215859030837005,
+      "grad_norm": 18.83371353149414,
+      "learning_rate": 1.6360078277886498e-05,
+      "loss": 0.3523222351074219,
+      "step": 300
+    },
+    {
+      "epoch": 1.4317180616740088,
+      "grad_norm": 12.578425407409668,
+      "learning_rate": 1.5870841487279843e-05,
+      "loss": 0.3326843643188477,
+      "step": 325
+    },
+    {
+      "epoch": 1.5418502202643172,
+      "grad_norm": 4.249295711517334,
+      "learning_rate": 1.538160469667319e-05,
+      "loss": 0.4222240447998047,
+      "step": 350
+    },
+    {
+      "epoch": 1.6519823788546255,
+      "grad_norm": 12.961797714233398,
+      "learning_rate": 1.4892367906066539e-05,
+      "loss": 0.3197017669677734,
+      "step": 375
+    },
+    {
+      "epoch": 1.7621145374449338,
+      "grad_norm": 15.027281761169434,
+      "learning_rate": 1.4403131115459884e-05,
+      "loss": 0.3585982894897461,
+      "step": 400
+    },
+    {
+      "epoch": 1.8722466960352424,
+      "grad_norm": 5.844873428344727,
+      "learning_rate": 1.391389432485323e-05,
+      "loss": 0.3265089416503906,
+      "step": 425
+    },
+    {
+      "epoch": 1.9823788546255505,
+      "grad_norm": 17.369247436523438,
+      "learning_rate": 1.3424657534246576e-05,
+      "loss": 0.30590789794921874,
+      "step": 450
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8571428571428571,
+      "eval_loss": 0.2787843644618988,
+      "eval_precision": 0.7919254658385093,
+      "eval_recall": 0.9340659340659341,
+      "eval_roc_auc": 0.959367792701126,
+      "eval_runtime": 2.7537,
+      "eval_samples_per_second": 275.624,
+      "eval_steps_per_second": 8.715,
+      "step": 454
+    },
+    {
+      "epoch": 2.092511013215859,
+      "grad_norm": 10.165802955627441,
+      "learning_rate": 1.2935420743639924e-05,
+      "loss": 0.3099861145019531,
+      "step": 475
+    },
+    {
+      "epoch": 2.202643171806167,
+      "grad_norm": 12.579766273498535,
+      "learning_rate": 1.2446183953033269e-05,
+      "loss": 0.24645326614379884,
+      "step": 500
+    },
+    {
+      "epoch": 2.3127753303964758,
+      "grad_norm": 16.500667572021484,
+      "learning_rate": 1.1956947162426615e-05,
+      "loss": 0.32091796875,
+      "step": 525
+    },
+    {
+      "epoch": 2.4229074889867843,
+      "grad_norm": 48.79829788208008,
+      "learning_rate": 1.1467710371819962e-05,
+      "loss": 0.28792179107666016,
+      "step": 550
+    },
+    {
+      "epoch": 2.5330396475770924,
+      "grad_norm": 3.1696665287017822,
+      "learning_rate": 1.097847358121331e-05,
+      "loss": 0.20424072265625,
+      "step": 575
+    },
+    {
+      "epoch": 2.643171806167401,
+      "grad_norm": 5.296319007873535,
+      "learning_rate": 1.0489236790606654e-05,
+      "loss": 0.3179521179199219,
+      "step": 600
+    },
+    {
+      "epoch": 2.753303964757709,
+      "grad_norm": 2.286626100540161,
+      "learning_rate": 1e-05,
+      "loss": 0.20801780700683595,
+      "step": 625
+    },
+    {
+      "epoch": 2.8634361233480177,
+      "grad_norm": 18.524463653564453,
+      "learning_rate": 9.510763209393347e-06,
+      "loss": 0.2919172477722168,
+      "step": 650
+    },
+    {
+      "epoch": 2.9735682819383262,
+      "grad_norm": 11.000245094299316,
+      "learning_rate": 9.021526418786694e-06,
+      "loss": 0.2509865570068359,
+      "step": 675
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9117259552042161,
+      "eval_f1": 0.8809946714031972,
+      "eval_loss": 0.2792136073112488,
+      "eval_precision": 0.8551724137931035,
+      "eval_recall": 0.9084249084249084,
+      "eval_roc_auc": 0.9613387298572483,
+      "eval_runtime": 2.7576,
+      "eval_samples_per_second": 275.236,
+      "eval_steps_per_second": 8.703,
+      "step": 681
+    },
+    {
+      "epoch": 3.0837004405286343,
+      "grad_norm": 7.4162092208862305,
+      "learning_rate": 8.53228962818004e-06,
+      "loss": 0.2622438621520996,
+      "step": 700
+    },
+    {
+      "epoch": 3.193832599118943,
+      "grad_norm": 28.406911849975586,
+      "learning_rate": 8.043052837573386e-06,
+      "loss": 0.25699047088623045,
+      "step": 725
+    },
+    {
+      "epoch": 3.303964757709251,
+      "grad_norm": 6.7196173667907715,
+      "learning_rate": 7.553816046966732e-06,
+      "loss": 0.24291038513183594,
+      "step": 750
+    },
+    {
+      "epoch": 3.4140969162995596,
+      "grad_norm": 2.39223575592041,
+      "learning_rate": 7.064579256360079e-06,
+      "loss": 0.19176918029785156,
+      "step": 775
+    },
+    {
+      "epoch": 3.5242290748898677,
+      "grad_norm": 0.3074190616607666,
+      "learning_rate": 6.5753424657534245e-06,
+      "loss": 0.1717354965209961,
+      "step": 800
+    },
+    {
+      "epoch": 3.6343612334801763,
+      "grad_norm": 38.88882064819336,
+      "learning_rate": 6.086105675146772e-06,
+      "loss": 0.21332130432128907,
+      "step": 825
+    },
+    {
+      "epoch": 3.744493392070485,
+      "grad_norm": 33.53501510620117,
+      "learning_rate": 5.596868884540117e-06,
+      "loss": 0.27872785568237307,
+      "step": 850
+    },
+    {
+      "epoch": 3.854625550660793,
+      "grad_norm": 6.368429183959961,
+      "learning_rate": 5.1076320939334645e-06,
+      "loss": 0.1715443801879883,
+      "step": 875
+    },
+    {
+      "epoch": 3.964757709251101,
+      "grad_norm": 15.106273651123047,
+      "learning_rate": 4.61839530332681e-06,
+      "loss": 0.1291443634033203,
+      "step": 900
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.924901185770751,
+      "eval_f1": 0.8957952468007313,
+      "eval_loss": 0.309478223323822,
+      "eval_precision": 0.8941605839416058,
+      "eval_recall": 0.8974358974358975,
+      "eval_roc_auc": 0.9563906600943638,
+      "eval_runtime": 2.7645,
+      "eval_samples_per_second": 274.553,
+      "eval_steps_per_second": 8.682,
+      "step": 908
+    },
+    {
+      "epoch": 4.07488986784141,
+      "grad_norm": 13.50270938873291,
+      "learning_rate": 4.129158512720156e-06,
+      "loss": 0.19201255798339845,
+      "step": 925
+    },
+    {
+      "epoch": 4.185022026431718,
+      "grad_norm": 9.977457046508789,
+      "learning_rate": 3.639921722113503e-06,
+      "loss": 0.19937816619873047,
+      "step": 950
+    },
+    {
+      "epoch": 4.295154185022026,
+      "grad_norm": 0.21389485895633698,
+      "learning_rate": 3.1506849315068495e-06,
+      "loss": 0.13615628242492675,
+      "step": 975
+    },
+    {
+      "epoch": 4.405286343612334,
+      "grad_norm": 20.24959373474121,
+      "learning_rate": 2.661448140900196e-06,
+      "loss": 0.16153732299804688,
+      "step": 1000
+    },
+    {
+      "epoch": 4.515418502202643,
+      "grad_norm": 0.8777796030044556,
+      "learning_rate": 2.1722113502935423e-06,
+      "loss": 0.2165633773803711,
+      "step": 1025
+    },
+    {
+      "epoch": 4.6255506607929515,
+      "grad_norm": 7.8306427001953125,
+      "learning_rate": 1.6829745596868884e-06,
+      "loss": 0.1584473419189453,
+      "step": 1050
+    },
+    {
+      "epoch": 4.73568281938326,
+      "grad_norm": 13.857385635375977,
+      "learning_rate": 1.1937377690802348e-06,
+      "loss": 0.14604366302490235,
+      "step": 1075
+    },
+    {
+      "epoch": 4.845814977973569,
+      "grad_norm": 4.830343723297119,
+      "learning_rate": 7.045009784735812e-07,
+      "loss": 0.16852569580078125,
+      "step": 1100
+    },
+    {
+      "epoch": 4.955947136563877,
+      "grad_norm": 9.196575164794922,
+      "learning_rate": 2.152641878669276e-07,
+      "loss": 0.1510540199279785,
+      "step": 1125
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.9183135704874835,
+      "eval_f1": 0.8908450704225352,
+      "eval_loss": 0.34406429529190063,
+      "eval_precision": 0.8576271186440678,
+      "eval_recall": 0.9267399267399268,
+      "eval_roc_auc": 0.9593037278222463,
+      "eval_runtime": 2.7389,
+      "eval_samples_per_second": 277.123,
+      "eval_steps_per_second": 8.763,
+      "step": 1135
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 1135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 2,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 1
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2382470606284800.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

transformer/checkpoint-1135/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad6f33c2b51fa383f7ec28e16f5b3fe2bf41c0a6a27a9c136fc4163f2fd2af84
+size 5265

transformer/checkpoint-227/config.json CHANGED Viewed

@@ -1,37 +1,39 @@
 {
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "bos_token_id": null,
-  "dim": 768,
-  "dropout": 0.1,
   "dtype": "float32",
-  "eos_token_id": null,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
-  "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
   "output_past": true,
-  "pad_token_id": 0,
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "tie_word_embeddings": true,
-  "transformers_version": "5.8.1",
   "use_cache": false,
-  "vocab_size": 119547
 }

 {
+  "add_cross_attention": false,
   "architectures": [
+    "XLMRobertaForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
   "dtype": "float32",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
   "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
+  "transformers_version": "5.9.0",
+  "type_vocab_size": 1,
   "use_cache": false,
+  "vocab_size": 250002
 }

transformer/checkpoint-227/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4cede1e3c0d6f010b726da8422a7c555e08c61be7af5f00f8477297b28a7b708
-size 541317368

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ae8505bd923cfe335983cca3cba49d4461527d3bb96fc02892a33697682353e
+size 1112205008

transformer/checkpoint-227/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf5feec4824c7c215d1b0de421e30f0d38d5700d2e1efc79099d80e32912708b
-size 1082698827

 version https://git-lfs.github.com/spec/v1
+oid sha256:db999a375a165b45e9dfd99aae3b7375b3b92a4981dbfefc3d6ac2fac61108d4
+size 2224532875

transformer/checkpoint-227/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5dd47edc976f1f1e4a848e1daffaaa533c0664f4d98fe31814a2b3deb4e4cd9c
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f255e472d4a5579c702ed63db6978307a2abcb0abd903d3ee59892545951936
 size 14645

transformer/checkpoint-227/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bac907eb00ed55aa1cc8c3b58662d1f1268807a09194ba0d2dcb1faee5f1ac0b
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:89f7ad9587099a5114861231d169a8ed0d5c9a53a0de53f61a918378c928e007
 size 1383

transformer/checkpoint-227/tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

transformer/checkpoint-227/tokenizer_config.json CHANGED Viewed

@@ -1,15 +1,15 @@
 {
   "backend": "tokenizers",
-  "cls_token": "[CLS]",
-  "do_lower_case": false,
   "is_local": false,
   "local_files_only": false,
-  "mask_token": "[MASK]",
   "model_max_length": 512,
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "strip_accents": null,
-  "tokenize_chinese_chars": true,
-  "tokenizer_class": "BertTokenizer",
-  "unk_token": "[UNK]"
 }

 {
+  "add_prefix_space": true,
   "backend": "tokenizers",
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
   "is_local": false,
   "local_files_only": false,
+  "mask_token": "<mask>",
   "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
 }

transformer/checkpoint-227/trainer_state.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "best_global_step": 227,
-  "best_metric": 0.8527397260273972,
   "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-227",
   "epoch": 1.0,
   "eval_steps": 500,
@@ -11,78 +11,78 @@
   "log_history": [
     {
       "epoch": 0.11013215859030837,
-      "grad_norm": 1.3902881145477295,
       "learning_rate": 4.247787610619469e-06,
-      "loss": 0.6896240234375,
       "step": 25
     },
     {
       "epoch": 0.22026431718061673,
-      "grad_norm": 1.9834767580032349,
       "learning_rate": 8.672566371681418e-06,
-      "loss": 0.6819134521484375,
       "step": 50
     },
     {
       "epoch": 0.3303964757709251,
-      "grad_norm": 1.3664361238479614,
       "learning_rate": 1.3097345132743363e-05,
-      "loss": 0.67228271484375,
       "step": 75
     },
     {
       "epoch": 0.44052863436123346,
-      "grad_norm": 3.0097296237945557,
       "learning_rate": 1.7522123893805313e-05,
-      "loss": 0.6490057373046875,
       "step": 100
     },
     {
       "epoch": 0.5506607929515418,
-      "grad_norm": 4.345597267150879,
       "learning_rate": 1.9784735812133072e-05,
-      "loss": 0.5840890502929688,
       "step": 125
     },
     {
       "epoch": 0.6607929515418502,
-      "grad_norm": 6.036681175231934,
       "learning_rate": 1.929549902152642e-05,
-      "loss": 0.4646404266357422,
       "step": 150
     },
     {
       "epoch": 0.7709251101321586,
-      "grad_norm": 17.463848114013672,
       "learning_rate": 1.8806262230919768e-05,
-      "loss": 0.4186407089233398,
       "step": 175
     },
     {
       "epoch": 0.8810572687224669,
-      "grad_norm": 4.881515026092529,
       "learning_rate": 1.8317025440313113e-05,
-      "loss": 0.408887939453125,
       "step": 200
     },
     {
       "epoch": 0.9911894273127754,
-      "grad_norm": 5.256113529205322,
       "learning_rate": 1.7827788649706457e-05,
-      "loss": 0.3965899658203125,
       "step": 225
     },
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.8866930171277997,
-      "eval_f1": 0.8527397260273972,
-      "eval_loss": 0.29110145568847656,
-      "eval_precision": 0.8006430868167203,
-      "eval_recall": 0.9120879120879121,
-      "eval_roc_auc": 0.9464116130782798,
-      "eval_runtime": 1.638,
-      "eval_samples_per_second": 463.383,
-      "eval_steps_per_second": 14.652,
       "step": 227
     }
   ],
@@ -112,7 +112,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 239898458966016.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
   "best_global_step": 227,
+  "best_metric": 0.8434622467771639,
   "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-227",
   "epoch": 1.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.11013215859030837,
+      "grad_norm": 3.4615602493286133,
       "learning_rate": 4.247787610619469e-06,
+      "loss": 0.7144061279296875,
       "step": 25
     },
     {
       "epoch": 0.22026431718061673,
+      "grad_norm": 6.50156307220459,
       "learning_rate": 8.672566371681418e-06,
+      "loss": 0.6882943725585937,
       "step": 50
     },
     {
       "epoch": 0.3303964757709251,
+      "grad_norm": 4.099428176879883,
       "learning_rate": 1.3097345132743363e-05,
+      "loss": 0.6711004638671875,
       "step": 75
     },
     {
       "epoch": 0.44052863436123346,
+      "grad_norm": 7.663174629211426,
       "learning_rate": 1.7522123893805313e-05,
+      "loss": 0.681163330078125,
       "step": 100
     },
     {
       "epoch": 0.5506607929515418,
+      "grad_norm": 10.003649711608887,
       "learning_rate": 1.9784735812133072e-05,
+      "loss": 0.672431640625,
       "step": 125
     },
     {
       "epoch": 0.6607929515418502,
+      "grad_norm": 4.136000633239746,
       "learning_rate": 1.929549902152642e-05,
+      "loss": 0.6405279541015625,
       "step": 150
     },
     {
       "epoch": 0.7709251101321586,
+      "grad_norm": 8.746106147766113,
       "learning_rate": 1.8806262230919768e-05,
+      "loss": 0.6329603576660157,
       "step": 175
     },
     {
       "epoch": 0.8810572687224669,
+      "grad_norm": 6.302291393280029,
       "learning_rate": 1.8317025440313113e-05,
+      "loss": 0.48342845916748045,
       "step": 200
     },
     {
       "epoch": 0.9911894273127754,
+      "grad_norm": 9.206014633178711,
       "learning_rate": 1.7827788649706457e-05,
+      "loss": 0.498061408996582,
       "step": 225
     },
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8434622467771639,
+      "eval_loss": 0.3247315287590027,
+      "eval_precision": 0.8481481481481481,
+      "eval_recall": 0.8388278388278388,
+      "eval_roc_auc": 0.9395378284267173,
+      "eval_runtime": 2.8582,
+      "eval_samples_per_second": 265.551,
+      "eval_steps_per_second": 8.397,
       "step": 227
     }
   ],
       "attributes": {}
     }
   },
+  "total_flos": 476494121256960.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

transformer/checkpoint-454/config.json CHANGED Viewed

@@ -1,37 +1,39 @@
 {
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "bos_token_id": null,
-  "dim": 768,
-  "dropout": 0.1,
   "dtype": "float32",
-  "eos_token_id": null,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
-  "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
   "output_past": true,
-  "pad_token_id": 0,
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "tie_word_embeddings": true,
-  "transformers_version": "5.8.1",
   "use_cache": false,
-  "vocab_size": 119547
 }

 {
+  "add_cross_attention": false,
   "architectures": [
+    "XLMRobertaForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
   "dtype": "float32",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
   "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
+  "transformers_version": "5.9.0",
+  "type_vocab_size": 1,
   "use_cache": false,
+  "vocab_size": 250002
 }

transformer/checkpoint-454/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c813472ffef86e6412f8bc455be06e22e7b3be9e5979717cf0f10884503488bf
-size 541317368

 version https://git-lfs.github.com/spec/v1
+oid sha256:97d244fdb253808bc25a95339c9095f5dc92925684865b678269c67b17b933be
+size 1112205008

transformer/checkpoint-454/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:931fbcf19ecce6eeb7f41c3218585f141d0c43a579e1061b55d655329bb3de67
-size 1082698827

 version https://git-lfs.github.com/spec/v1
+oid sha256:e0df3d9070e295427dc0c988c887e84b552089876eef56ca06d99d9a8875d76a
+size 2224532875

transformer/checkpoint-454/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1921ad234fe3b91fe6a72596cdd2262832556d8d9ae96f192b266b92568ee3cd
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:3a84aa11b3c29b368f323fea589aa91007265db407738674e6271fe471994e1a
 size 14645

transformer/checkpoint-454/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ac5aed5d012227ef149cfdb943aaec829a5038bc900759eb1618d705466b0691
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:e7207a60515ba26ba02a6e3b66fb20ca760789c077bc0a7b95de2554829d36af
 size 1383

transformer/checkpoint-454/tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

transformer/checkpoint-454/tokenizer_config.json CHANGED Viewed

@@ -1,15 +1,15 @@
 {
   "backend": "tokenizers",
-  "cls_token": "[CLS]",
-  "do_lower_case": false,
   "is_local": false,
   "local_files_only": false,
-  "mask_token": "[MASK]",
   "model_max_length": 512,
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "strip_accents": null,
-  "tokenize_chinese_chars": true,
-  "tokenizer_class": "BertTokenizer",
-  "unk_token": "[UNK]"
 }

 {
+  "add_prefix_space": true,
   "backend": "tokenizers",
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
   "is_local": false,
   "local_files_only": false,
+  "mask_token": "<mask>",
   "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
 }

transformer/checkpoint-454/trainer_state.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "best_global_step": 454,
-  "best_metric": 0.8765652951699463,
   "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-454",
   "epoch": 2.0,
   "eval_steps": 500,
@@ -11,154 +11,154 @@
   "log_history": [
     {
       "epoch": 0.11013215859030837,
-      "grad_norm": 1.3902881145477295,
       "learning_rate": 4.247787610619469e-06,
-      "loss": 0.6896240234375,
       "step": 25
     },
     {
       "epoch": 0.22026431718061673,
-      "grad_norm": 1.9834767580032349,
       "learning_rate": 8.672566371681418e-06,
-      "loss": 0.6819134521484375,
       "step": 50
     },
     {
       "epoch": 0.3303964757709251,
-      "grad_norm": 1.3664361238479614,
       "learning_rate": 1.3097345132743363e-05,
-      "loss": 0.67228271484375,
       "step": 75
     },
     {
       "epoch": 0.44052863436123346,
-      "grad_norm": 3.0097296237945557,
       "learning_rate": 1.7522123893805313e-05,
-      "loss": 0.6490057373046875,
       "step": 100
     },
     {
       "epoch": 0.5506607929515418,
-      "grad_norm": 4.345597267150879,
       "learning_rate": 1.9784735812133072e-05,
-      "loss": 0.5840890502929688,
       "step": 125
     },
     {
       "epoch": 0.6607929515418502,
-      "grad_norm": 6.036681175231934,
       "learning_rate": 1.929549902152642e-05,
-      "loss": 0.4646404266357422,
       "step": 150
     },
     {
       "epoch": 0.7709251101321586,
-      "grad_norm": 17.463848114013672,
       "learning_rate": 1.8806262230919768e-05,
-      "loss": 0.4186407089233398,
       "step": 175
     },
     {
       "epoch": 0.8810572687224669,
-      "grad_norm": 4.881515026092529,
       "learning_rate": 1.8317025440313113e-05,
-      "loss": 0.408887939453125,
       "step": 200
     },
     {
       "epoch": 0.9911894273127754,
-      "grad_norm": 5.256113529205322,
       "learning_rate": 1.7827788649706457e-05,
-      "loss": 0.3965899658203125,
       "step": 225
     },
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.8866930171277997,
-      "eval_f1": 0.8527397260273972,
-      "eval_loss": 0.29110145568847656,
-      "eval_precision": 0.8006430868167203,
-      "eval_recall": 0.9120879120879121,
-      "eval_roc_auc": 0.9464116130782798,
-      "eval_runtime": 1.638,
-      "eval_samples_per_second": 463.383,
-      "eval_steps_per_second": 14.652,
       "step": 227
     },
     {
       "epoch": 1.1013215859030836,
-      "grad_norm": 8.05300521850586,
       "learning_rate": 1.7338551859099805e-05,
-      "loss": 0.2900468635559082,
       "step": 250
     },
     {
       "epoch": 1.2114537444933922,
-      "grad_norm": 3.648190975189209,
       "learning_rate": 1.6849315068493153e-05,
-      "loss": 0.3152153396606445,
       "step": 275
     },
     {
       "epoch": 1.3215859030837005,
-      "grad_norm": 13.387518882751465,
       "learning_rate": 1.6360078277886498e-05,
-      "loss": 0.2970449638366699,
       "step": 300
     },
     {
       "epoch": 1.4317180616740088,
-      "grad_norm": 2.984701633453369,
       "learning_rate": 1.5870841487279843e-05,
-      "loss": 0.2916489791870117,
       "step": 325
     },
     {
       "epoch": 1.5418502202643172,
-      "grad_norm": 4.417141914367676,
       "learning_rate": 1.538160469667319e-05,
-      "loss": 0.2869120979309082,
       "step": 350
     },
     {
       "epoch": 1.6519823788546255,
-      "grad_norm": 3.330986499786377,
       "learning_rate": 1.4892367906066539e-05,
-      "loss": 0.3101354217529297,
       "step": 375
     },
     {
       "epoch": 1.7621145374449338,
-      "grad_norm": 5.084468364715576,
       "learning_rate": 1.4403131115459884e-05,
-      "loss": 0.30187932968139647,
       "step": 400
     },
     {
       "epoch": 1.8722466960352424,
-      "grad_norm": 6.020040512084961,
       "learning_rate": 1.391389432485323e-05,
-      "loss": 0.30431194305419923,
       "step": 425
     },
     {
       "epoch": 1.9823788546255505,
-      "grad_norm": 3.684113025665283,
       "learning_rate": 1.3424657534246576e-05,
-      "loss": 0.2970767021179199,
       "step": 450
     },
     {
       "epoch": 2.0,
-      "eval_accuracy": 0.9090909090909091,
-      "eval_f1": 0.8765652951699463,
-      "eval_loss": 0.255423367023468,
-      "eval_precision": 0.8566433566433567,
-      "eval_recall": 0.8974358974358975,
-      "eval_roc_auc": 0.9556633352929649,
-      "eval_runtime": 1.716,
-      "eval_samples_per_second": 442.313,
-      "eval_steps_per_second": 13.986,
       "step": 454
     }
   ],
@@ -188,7 +188,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 479796917932032.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
   "best_global_step": 454,
+  "best_metric": 0.8571428571428571,
   "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-454",
   "epoch": 2.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.11013215859030837,
+      "grad_norm": 3.4615602493286133,
       "learning_rate": 4.247787610619469e-06,
+      "loss": 0.7144061279296875,
       "step": 25
     },
     {
       "epoch": 0.22026431718061673,
+      "grad_norm": 6.50156307220459,
       "learning_rate": 8.672566371681418e-06,
+      "loss": 0.6882943725585937,
       "step": 50
     },
     {
       "epoch": 0.3303964757709251,
+      "grad_norm": 4.099428176879883,
       "learning_rate": 1.3097345132743363e-05,
+      "loss": 0.6711004638671875,
       "step": 75
     },
     {
       "epoch": 0.44052863436123346,
+      "grad_norm": 7.663174629211426,
       "learning_rate": 1.7522123893805313e-05,
+      "loss": 0.681163330078125,
       "step": 100
     },
     {
       "epoch": 0.5506607929515418,
+      "grad_norm": 10.003649711608887,
       "learning_rate": 1.9784735812133072e-05,
+      "loss": 0.672431640625,
       "step": 125
     },
     {
       "epoch": 0.6607929515418502,
+      "grad_norm": 4.136000633239746,
       "learning_rate": 1.929549902152642e-05,
+      "loss": 0.6405279541015625,
       "step": 150
     },
     {
       "epoch": 0.7709251101321586,
+      "grad_norm": 8.746106147766113,
       "learning_rate": 1.8806262230919768e-05,
+      "loss": 0.6329603576660157,
       "step": 175
     },
     {
       "epoch": 0.8810572687224669,
+      "grad_norm": 6.302291393280029,
       "learning_rate": 1.8317025440313113e-05,
+      "loss": 0.48342845916748045,
       "step": 200
     },
     {
       "epoch": 0.9911894273127754,
+      "grad_norm": 9.206014633178711,
       "learning_rate": 1.7827788649706457e-05,
+      "loss": 0.498061408996582,
       "step": 225
     },
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8434622467771639,
+      "eval_loss": 0.3247315287590027,
+      "eval_precision": 0.8481481481481481,
+      "eval_recall": 0.8388278388278388,
+      "eval_roc_auc": 0.9395378284267173,
+      "eval_runtime": 2.8582,
+      "eval_samples_per_second": 265.551,
+      "eval_steps_per_second": 8.397,
       "step": 227
     },
     {
       "epoch": 1.1013215859030836,
+      "grad_norm": 36.54235076904297,
       "learning_rate": 1.7338551859099805e-05,
+      "loss": 0.34838932037353515,
       "step": 250
     },
     {
       "epoch": 1.2114537444933922,
+      "grad_norm": 11.171507835388184,
       "learning_rate": 1.6849315068493153e-05,
+      "loss": 0.4250565719604492,
       "step": 275
     },
     {
       "epoch": 1.3215859030837005,
+      "grad_norm": 18.83371353149414,
       "learning_rate": 1.6360078277886498e-05,
+      "loss": 0.3523222351074219,
       "step": 300
     },
     {
       "epoch": 1.4317180616740088,
+      "grad_norm": 12.578425407409668,
       "learning_rate": 1.5870841487279843e-05,
+      "loss": 0.3326843643188477,
       "step": 325
     },
     {
       "epoch": 1.5418502202643172,
+      "grad_norm": 4.249295711517334,
       "learning_rate": 1.538160469667319e-05,
+      "loss": 0.4222240447998047,
       "step": 350
     },
     {
       "epoch": 1.6519823788546255,
+      "grad_norm": 12.961797714233398,
       "learning_rate": 1.4892367906066539e-05,
+      "loss": 0.3197017669677734,
       "step": 375
     },
     {
       "epoch": 1.7621145374449338,
+      "grad_norm": 15.027281761169434,
       "learning_rate": 1.4403131115459884e-05,
+      "loss": 0.3585982894897461,
       "step": 400
     },
     {
       "epoch": 1.8722466960352424,
+      "grad_norm": 5.844873428344727,
       "learning_rate": 1.391389432485323e-05,
+      "loss": 0.3265089416503906,
       "step": 425
     },
     {
       "epoch": 1.9823788546255505,
+      "grad_norm": 17.369247436523438,
       "learning_rate": 1.3424657534246576e-05,
+      "loss": 0.30590789794921874,
       "step": 450
     },
     {
       "epoch": 2.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8571428571428571,
+      "eval_loss": 0.2787843644618988,
+      "eval_precision": 0.7919254658385093,
+      "eval_recall": 0.9340659340659341,
+      "eval_roc_auc": 0.959367792701126,
+      "eval_runtime": 2.7537,
+      "eval_samples_per_second": 275.624,
+      "eval_steps_per_second": 8.715,
       "step": 454
     }
   ],
       "attributes": {}
     }
   },
+  "total_flos": 952988242513920.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

transformer/checkpoint-681/config.json CHANGED Viewed

@@ -1,37 +1,39 @@
 {
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "bos_token_id": null,
-  "dim": 768,
-  "dropout": 0.1,
   "dtype": "float32",
-  "eos_token_id": null,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
-  "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
   "output_past": true,
-  "pad_token_id": 0,
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "tie_word_embeddings": true,
-  "transformers_version": "5.8.1",
   "use_cache": false,
-  "vocab_size": 119547
 }

 {
+  "add_cross_attention": false,
   "architectures": [
+    "XLMRobertaForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
   "dtype": "float32",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
   "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
+  "transformers_version": "5.9.0",
+  "type_vocab_size": 1,
   "use_cache": false,
+  "vocab_size": 250002
 }

transformer/checkpoint-681/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:03dbde438b6b09e9c569ccf3d52d3026870a20fcbed088f82020a5c58d757b9c
-size 541317368

 version https://git-lfs.github.com/spec/v1
+oid sha256:99cd43daccc55ad1ce995212b80d2c417997816e8fff5663abf8e22826766c90
+size 1112205008

transformer/checkpoint-681/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:98bc3e69e944d0fdfd57444f651c232fe90a0c01c77fc9485b1e89c9b1da6e44
-size 1082698827

 version https://git-lfs.github.com/spec/v1
+oid sha256:b8ab5e9309c0a4d78dde38e471c4fdefdfb6af708e8fdac20851e3a7ba69f922
+size 2224532875

transformer/checkpoint-681/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e9be3f1c7f8a91518af8a97c2e068378aafd12649996efa700161802b694aaf3
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ef666104b20bd014bb99759c12ba2ab3544d8d6a6c794765b50a125425e2514
 size 14645

transformer/checkpoint-681/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:08bb78a60da8a2d1603090739ac594effe08f188234024d60472cddbc5a648e9
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:7821ac2948192ae5dfdbf609f2c5b345a33913b1a653a84c34869f001e99d2aa
 size 1383

transformer/checkpoint-681/tokenizer.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

transformer/checkpoint-681/tokenizer_config.json CHANGED Viewed

@@ -1,15 +1,15 @@
 {
   "backend": "tokenizers",
-  "cls_token": "[CLS]",
-  "do_lower_case": false,
   "is_local": false,
   "local_files_only": false,
-  "mask_token": "[MASK]",
   "model_max_length": 512,
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "strip_accents": null,
-  "tokenize_chinese_chars": true,
-  "tokenizer_class": "BertTokenizer",
-  "unk_token": "[UNK]"
 }

 {
+  "add_prefix_space": true,
   "backend": "tokenizers",
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
   "is_local": false,
   "local_files_only": false,
+  "mask_token": "<mask>",
   "model_max_length": 512,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "XLMRobertaTokenizer",
+  "unk_token": "<unk>"
 }

transformer/checkpoint-681/trainer_state.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
-  "best_global_step": 454,
-  "best_metric": 0.8765652951699463,
-  "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-454",
   "epoch": 3.0,
   "eval_steps": 500,
   "global_step": 681,
@@ -11,230 +11,230 @@
   "log_history": [
     {
       "epoch": 0.11013215859030837,
-      "grad_norm": 1.3902881145477295,
       "learning_rate": 4.247787610619469e-06,
-      "loss": 0.6896240234375,
       "step": 25
     },
     {
       "epoch": 0.22026431718061673,
-      "grad_norm": 1.9834767580032349,
       "learning_rate": 8.672566371681418e-06,
-      "loss": 0.6819134521484375,
       "step": 50
     },
     {
       "epoch": 0.3303964757709251,
-      "grad_norm": 1.3664361238479614,
       "learning_rate": 1.3097345132743363e-05,
-      "loss": 0.67228271484375,
       "step": 75
     },
     {
       "epoch": 0.44052863436123346,
-      "grad_norm": 3.0097296237945557,
       "learning_rate": 1.7522123893805313e-05,
-      "loss": 0.6490057373046875,
       "step": 100
     },
     {
       "epoch": 0.5506607929515418,
-      "grad_norm": 4.345597267150879,
       "learning_rate": 1.9784735812133072e-05,
-      "loss": 0.5840890502929688,
       "step": 125
     },
     {
       "epoch": 0.6607929515418502,
-      "grad_norm": 6.036681175231934,
       "learning_rate": 1.929549902152642e-05,
-      "loss": 0.4646404266357422,
       "step": 150
     },
     {
       "epoch": 0.7709251101321586,
-      "grad_norm": 17.463848114013672,
       "learning_rate": 1.8806262230919768e-05,
-      "loss": 0.4186407089233398,
       "step": 175
     },
     {
       "epoch": 0.8810572687224669,
-      "grad_norm": 4.881515026092529,
       "learning_rate": 1.8317025440313113e-05,
-      "loss": 0.408887939453125,
       "step": 200
     },
     {
       "epoch": 0.9911894273127754,
-      "grad_norm": 5.256113529205322,
       "learning_rate": 1.7827788649706457e-05,
-      "loss": 0.3965899658203125,
       "step": 225
     },
     {
       "epoch": 1.0,
-      "eval_accuracy": 0.8866930171277997,
-      "eval_f1": 0.8527397260273972,
-      "eval_loss": 0.29110145568847656,
-      "eval_precision": 0.8006430868167203,
-      "eval_recall": 0.9120879120879121,
-      "eval_roc_auc": 0.9464116130782798,
-      "eval_runtime": 1.638,
-      "eval_samples_per_second": 463.383,
-      "eval_steps_per_second": 14.652,
       "step": 227
     },
     {
       "epoch": 1.1013215859030836,
-      "grad_norm": 8.05300521850586,
       "learning_rate": 1.7338551859099805e-05,
-      "loss": 0.2900468635559082,
       "step": 250
     },
     {
       "epoch": 1.2114537444933922,
-      "grad_norm": 3.648190975189209,
       "learning_rate": 1.6849315068493153e-05,
-      "loss": 0.3152153396606445,
       "step": 275
     },
     {
       "epoch": 1.3215859030837005,
-      "grad_norm": 13.387518882751465,
       "learning_rate": 1.6360078277886498e-05,
-      "loss": 0.2970449638366699,
       "step": 300
     },
     {
       "epoch": 1.4317180616740088,
-      "grad_norm": 2.984701633453369,
       "learning_rate": 1.5870841487279843e-05,
-      "loss": 0.2916489791870117,
       "step": 325
     },
     {
       "epoch": 1.5418502202643172,
-      "grad_norm": 4.417141914367676,
       "learning_rate": 1.538160469667319e-05,
-      "loss": 0.2869120979309082,
       "step": 350
     },
     {
       "epoch": 1.6519823788546255,
-      "grad_norm": 3.330986499786377,
       "learning_rate": 1.4892367906066539e-05,
-      "loss": 0.3101354217529297,
       "step": 375
     },
     {
       "epoch": 1.7621145374449338,
-      "grad_norm": 5.084468364715576,
       "learning_rate": 1.4403131115459884e-05,
-      "loss": 0.30187932968139647,
       "step": 400
     },
     {
       "epoch": 1.8722466960352424,
-      "grad_norm": 6.020040512084961,
       "learning_rate": 1.391389432485323e-05,
-      "loss": 0.30431194305419923,
       "step": 425
     },
     {
       "epoch": 1.9823788546255505,
-      "grad_norm": 3.684113025665283,
       "learning_rate": 1.3424657534246576e-05,
-      "loss": 0.2970767021179199,
       "step": 450
     },
     {
       "epoch": 2.0,
-      "eval_accuracy": 0.9090909090909091,
-      "eval_f1": 0.8765652951699463,
-      "eval_loss": 0.255423367023468,
-      "eval_precision": 0.8566433566433567,
-      "eval_recall": 0.8974358974358975,
-      "eval_roc_auc": 0.9556633352929649,
-      "eval_runtime": 1.716,
-      "eval_samples_per_second": 442.313,
-      "eval_steps_per_second": 13.986,
       "step": 454
     },
     {
       "epoch": 2.092511013215859,
-      "grad_norm": 5.848704814910889,
       "learning_rate": 1.2935420743639924e-05,
-      "loss": 0.2515826416015625,
       "step": 475
     },
     {
       "epoch": 2.202643171806167,
-      "grad_norm": 6.936087131500244,
       "learning_rate": 1.2446183953033269e-05,
-      "loss": 0.2454897689819336,
       "step": 500
     },
     {
       "epoch": 2.3127753303964758,
-      "grad_norm": 8.904288291931152,
       "learning_rate": 1.1956947162426615e-05,
-      "loss": 0.24430061340332032,
       "step": 525
     },
     {
       "epoch": 2.4229074889867843,
-      "grad_norm": 9.340006828308105,
       "learning_rate": 1.1467710371819962e-05,
-      "loss": 0.25365222930908204,
       "step": 550
     },
     {
       "epoch": 2.5330396475770924,
-      "grad_norm": 10.99807071685791,
       "learning_rate": 1.097847358121331e-05,
-      "loss": 0.20383157730102539,
       "step": 575
     },
     {
       "epoch": 2.643171806167401,
-      "grad_norm": 0.9036199450492859,
       "learning_rate": 1.0489236790606654e-05,
-      "loss": 0.2450111961364746,
       "step": 600
     },
     {
       "epoch": 2.753303964757709,
-      "grad_norm": 11.331809043884277,
       "learning_rate": 1e-05,
-      "loss": 0.2072979736328125,
       "step": 625
     },
     {
       "epoch": 2.8634361233480177,
-      "grad_norm": 11.751481056213379,
       "learning_rate": 9.510763209393347e-06,
-      "loss": 0.19760629653930664,
       "step": 650
     },
     {
       "epoch": 2.9735682819383262,
-      "grad_norm": 10.376523971557617,
       "learning_rate": 9.021526418786694e-06,
-      "loss": 0.17518287658691406,
       "step": 675
     },
     {
       "epoch": 3.0,
-      "eval_accuracy": 0.8774703557312253,
-      "eval_f1": 0.8426395939086294,
-      "eval_loss": 0.3243195116519928,
-      "eval_precision": 0.7830188679245284,
-      "eval_recall": 0.9120879120879121,
-      "eval_roc_auc": 0.9531158142269252,
-      "eval_runtime": 1.6443,
-      "eval_samples_per_second": 461.6,
-      "eval_steps_per_second": 14.596,
       "step": 681
     }
   ],
@@ -250,7 +250,7 @@
         "early_stopping_threshold": 0.0
       },
       "attributes": {
-        "early_stopping_patience_counter": 1
       }
     },
     "TrainerControl": {
@@ -264,7 +264,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 719695376898048.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

 {
+  "best_global_step": 681,
+  "best_metric": 0.8809946714031972,
+  "best_model_checkpoint": "/content/agri-wheat-classifier/transformer/checkpoint-681",
   "epoch": 3.0,
   "eval_steps": 500,
   "global_step": 681,
   "log_history": [
     {
       "epoch": 0.11013215859030837,
+      "grad_norm": 3.4615602493286133,
       "learning_rate": 4.247787610619469e-06,
+      "loss": 0.7144061279296875,
       "step": 25
     },
     {
       "epoch": 0.22026431718061673,
+      "grad_norm": 6.50156307220459,
       "learning_rate": 8.672566371681418e-06,
+      "loss": 0.6882943725585937,
       "step": 50
     },
     {
       "epoch": 0.3303964757709251,
+      "grad_norm": 4.099428176879883,
       "learning_rate": 1.3097345132743363e-05,
+      "loss": 0.6711004638671875,
       "step": 75
     },
     {
       "epoch": 0.44052863436123346,
+      "grad_norm": 7.663174629211426,
       "learning_rate": 1.7522123893805313e-05,
+      "loss": 0.681163330078125,
       "step": 100
     },
     {
       "epoch": 0.5506607929515418,
+      "grad_norm": 10.003649711608887,
       "learning_rate": 1.9784735812133072e-05,
+      "loss": 0.672431640625,
       "step": 125
     },
     {
       "epoch": 0.6607929515418502,
+      "grad_norm": 4.136000633239746,
       "learning_rate": 1.929549902152642e-05,
+      "loss": 0.6405279541015625,
       "step": 150
     },
     {
       "epoch": 0.7709251101321586,
+      "grad_norm": 8.746106147766113,
       "learning_rate": 1.8806262230919768e-05,
+      "loss": 0.6329603576660157,
       "step": 175
     },
     {
       "epoch": 0.8810572687224669,
+      "grad_norm": 6.302291393280029,
       "learning_rate": 1.8317025440313113e-05,
+      "loss": 0.48342845916748045,
       "step": 200
     },
     {
       "epoch": 0.9911894273127754,
+      "grad_norm": 9.206014633178711,
       "learning_rate": 1.7827788649706457e-05,
+      "loss": 0.498061408996582,
       "step": 225
     },
     {
       "epoch": 1.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8434622467771639,
+      "eval_loss": 0.3247315287590027,
+      "eval_precision": 0.8481481481481481,
+      "eval_recall": 0.8388278388278388,
+      "eval_roc_auc": 0.9395378284267173,
+      "eval_runtime": 2.8582,
+      "eval_samples_per_second": 265.551,
+      "eval_steps_per_second": 8.397,
       "step": 227
     },
     {
       "epoch": 1.1013215859030836,
+      "grad_norm": 36.54235076904297,
       "learning_rate": 1.7338551859099805e-05,
+      "loss": 0.34838932037353515,
       "step": 250
     },
     {
       "epoch": 1.2114537444933922,
+      "grad_norm": 11.171507835388184,
       "learning_rate": 1.6849315068493153e-05,
+      "loss": 0.4250565719604492,
       "step": 275
     },
     {
       "epoch": 1.3215859030837005,
+      "grad_norm": 18.83371353149414,
       "learning_rate": 1.6360078277886498e-05,
+      "loss": 0.3523222351074219,
       "step": 300
     },
     {
       "epoch": 1.4317180616740088,
+      "grad_norm": 12.578425407409668,
       "learning_rate": 1.5870841487279843e-05,
+      "loss": 0.3326843643188477,
       "step": 325
     },
     {
       "epoch": 1.5418502202643172,
+      "grad_norm": 4.249295711517334,
       "learning_rate": 1.538160469667319e-05,
+      "loss": 0.4222240447998047,
       "step": 350
     },
     {
       "epoch": 1.6519823788546255,
+      "grad_norm": 12.961797714233398,
       "learning_rate": 1.4892367906066539e-05,
+      "loss": 0.3197017669677734,
       "step": 375
     },
     {
       "epoch": 1.7621145374449338,
+      "grad_norm": 15.027281761169434,
       "learning_rate": 1.4403131115459884e-05,
+      "loss": 0.3585982894897461,
       "step": 400
     },
     {
       "epoch": 1.8722466960352424,
+      "grad_norm": 5.844873428344727,
       "learning_rate": 1.391389432485323e-05,
+      "loss": 0.3265089416503906,
       "step": 425
     },
     {
       "epoch": 1.9823788546255505,
+      "grad_norm": 17.369247436523438,
       "learning_rate": 1.3424657534246576e-05,
+      "loss": 0.30590789794921874,
       "step": 450
     },
     {
       "epoch": 2.0,
+      "eval_accuracy": 0.8880105401844532,
+      "eval_f1": 0.8571428571428571,
+      "eval_loss": 0.2787843644618988,
+      "eval_precision": 0.7919254658385093,
+      "eval_recall": 0.9340659340659341,
+      "eval_roc_auc": 0.959367792701126,
+      "eval_runtime": 2.7537,
+      "eval_samples_per_second": 275.624,
+      "eval_steps_per_second": 8.715,
       "step": 454
     },
     {
       "epoch": 2.092511013215859,
+      "grad_norm": 10.165802955627441,
       "learning_rate": 1.2935420743639924e-05,
+      "loss": 0.3099861145019531,
       "step": 475
     },
     {
       "epoch": 2.202643171806167,
+      "grad_norm": 12.579766273498535,
       "learning_rate": 1.2446183953033269e-05,
+      "loss": 0.24645326614379884,
       "step": 500
     },
     {
       "epoch": 2.3127753303964758,
+      "grad_norm": 16.500667572021484,
       "learning_rate": 1.1956947162426615e-05,
+      "loss": 0.32091796875,
       "step": 525
     },
     {
       "epoch": 2.4229074889867843,
+      "grad_norm": 48.79829788208008,
       "learning_rate": 1.1467710371819962e-05,
+      "loss": 0.28792179107666016,
       "step": 550
     },
     {
       "epoch": 2.5330396475770924,
+      "grad_norm": 3.1696665287017822,
       "learning_rate": 1.097847358121331e-05,
+      "loss": 0.20424072265625,
       "step": 575
     },
     {
       "epoch": 2.643171806167401,
+      "grad_norm": 5.296319007873535,
       "learning_rate": 1.0489236790606654e-05,
+      "loss": 0.3179521179199219,
       "step": 600
     },
     {
       "epoch": 2.753303964757709,
+      "grad_norm": 2.286626100540161,
       "learning_rate": 1e-05,
+      "loss": 0.20801780700683595,
       "step": 625
     },
     {
       "epoch": 2.8634361233480177,
+      "grad_norm": 18.524463653564453,
       "learning_rate": 9.510763209393347e-06,
+      "loss": 0.2919172477722168,
       "step": 650
     },
     {
       "epoch": 2.9735682819383262,
+      "grad_norm": 11.000245094299316,
       "learning_rate": 9.021526418786694e-06,
+      "loss": 0.2509865570068359,
       "step": 675
     },
     {
       "epoch": 3.0,
+      "eval_accuracy": 0.9117259552042161,
+      "eval_f1": 0.8809946714031972,
+      "eval_loss": 0.2792136073112488,
+      "eval_precision": 0.8551724137931035,
+      "eval_recall": 0.9084249084249084,
+      "eval_roc_auc": 0.9613387298572483,
+      "eval_runtime": 2.7576,
+      "eval_samples_per_second": 275.236,
+      "eval_steps_per_second": 8.703,
       "step": 681
     }
   ],
         "early_stopping_threshold": 0.0
       },
       "attributes": {
+        "early_stopping_patience_counter": 0
       }
     },
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 1429482363770880.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

transformer/checkpoint-908/config.json CHANGED Viewed

@@ -1,37 +1,39 @@
 {
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "bos_token_id": null,
-  "dim": 768,
-  "dropout": 0.1,
   "dtype": "float32",
-  "eos_token_id": null,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
-  "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
   "output_past": true,
-  "pad_token_id": 0,
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "tie_word_embeddings": true,
-  "transformers_version": "5.8.1",
   "use_cache": false,
-  "vocab_size": 119547
 }

 {
+  "add_cross_attention": false,
   "architectures": [
+    "XLMRobertaForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
   "dtype": "float32",
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "NOT_RELEVANT",
     "1": "RELEVANT"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
   "label2id": {
     "NOT_RELEVANT": 0,
     "RELEVANT": 1
   },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 514,
+  "model_type": "xlm-roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
   "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "tie_word_embeddings": true,
+  "transformers_version": "5.9.0",
+  "type_vocab_size": 1,
   "use_cache": false,
+  "vocab_size": 250002
 }

transformer/checkpoint-908/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cda5d1601a665324d26d288eb6116f925bca8729dea7e932524e9bac11b6f5e4
-size 541317368

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e5c530095532c2b7b2533294a4f71b74527ec3d50e89f8da1c71b1e8f7e6e45
+size 1112205008

transformer/checkpoint-908/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d5fd9ef5917c9829fb094dcd22189d2d57d1ca5b11470f33e337d67b2d1d616
-size 1082698827

 version https://git-lfs.github.com/spec/v1
+oid sha256:ac9ab63cee4c17da8e692806f4f7e83a5a4d99a2383f4d3c0421bd39157d1743
+size 2224532875