robo-noct committed on Jun 30, 2025

Commit

aa31af5

verified ·

1 Parent(s): e56d0dd

Upload folder using huggingface_hub

Browse files

Files changed (18) hide show

README.md +37 -0
checkpoint-84/config.json +53 -0
checkpoint-84/model.safetensors +3 -0
checkpoint-84/optimizer.pt +3 -0
checkpoint-84/rng_state.pth +3 -0
checkpoint-84/scheduler.pt +3 -0
checkpoint-84/trainer_state.json +684 -0
checkpoint-84/training_args.bin +3 -0
config.json +53 -0
model.safetensors +3 -0
runs/Jun30_23-40-29_r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k/events.out.tfevents.1751326832.r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k.114.0 +2 -2
runs/Jun30_23-40-29_r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k/events.out.tfevents.1751327028.r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k.114.1 +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +56 -0
training_args.bin +3 -0
training_params.json +30 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,37 @@

+---
+library_name: transformers
+tags:
+- autotrain
+- text-classification
+base_model: google/mobilebert-uncased
+widget:
+- text: "I love AutoTrain"
+---
+# Model Trained Using AutoTrain
+- Problem type: Text Classification
+## Validation Metrics
+loss: 1.7558108568191528
+f1_macro: 0.3432320638995863
+f1_micro: 0.35714285714285715
+f1_weighted: 0.3432320638995863
+precision_macro: 0.6085343228200372
+precision_micro: 0.35714285714285715
+precision_weighted: 0.6085343228200372
+recall_macro: 0.35714285714285715
+recall_micro: 0.35714285714285715
+recall_weighted: 0.35714285714285715
+accuracy: 0.35714285714285715

checkpoint-84/config.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "_name_or_path": "google/mobilebert-uncased",
+  "_num_labels": 7,
+  "architectures": [
+    "MobileBertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_activation": false,
+  "classifier_dropout": null,
+  "embedding_size": 128,
+  "hidden_act": "relu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 512,
+  "id2label": {
+    "0": "anniversary",
+    "1": "baby",
+    "2": "birthday",
+    "3": "get_well",
+    "4": "holiday",
+    "5": "promotion",
+    "6": "wedding"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 512,
+  "intra_bottleneck_size": 128,
+  "key_query_shared_bottleneck": true,
+  "label2id": {
+    "anniversary": 0,
+    "baby": 1,
+    "birthday": 2,
+    "get_well": 3,
+    "holiday": 4,
+    "promotion": 5,
+    "wedding": 6
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "mobilebert",
+  "normalization_type": "no_norm",
+  "num_attention_heads": 4,
+  "num_feedforward_networks": 4,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.0",
+  "trigram_input": true,
+  "true_hidden_size": 128,
+  "type_vocab_size": 2,
+  "use_bottleneck": true,
+  "use_bottleneck_attention": false,
+  "vocab_size": 30522
+}

checkpoint-84/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f3afca87ac473bfc430ab58b3fe58e985d3ac71f86c6748fd1e7e3432e743ae
+size 98480380

checkpoint-84/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e71e0bba8d7dc74a70ef2f96b0223c0e214fc6d5766120c470c3e8c6d881ac4
+size 197583069

checkpoint-84/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34f589ceff3622f09550f9b30eae034559a07be8bcd0c079a574e80fdf0f2936
+size 13990

checkpoint-84/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b176eedd19a752a5759156c376fae5bff5a174b7b100c0698e65f5e76ac4547e
+size 1064

checkpoint-84/trainer_state.json ADDED Viewed

	@@ -0,0 +1,684 @@

+{
+  "best_metric": 1.7558108568191528,
+  "best_model_checkpoint": "greetings/checkpoint-84",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 84,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.03571428571428571,
+      "grad_norm": 363697984.0,
+      "learning_rate": 5.555555555555556e-06,
+      "loss": 2329191.0,
+      "step": 1
+    },
+    {
+      "epoch": 0.07142857142857142,
+      "grad_norm": 332609952.0,
+      "learning_rate": 1.1111111111111112e-05,
+      "loss": 4540264.0,
+      "step": 2
+    },
+    {
+      "epoch": 0.10714285714285714,
+      "grad_norm": 366500000.0,
+      "learning_rate": 1.6666666666666667e-05,
+      "loss": 1966578.75,
+      "step": 3
+    },
+    {
+      "epoch": 0.14285714285714285,
+      "grad_norm": 367947328.0,
+      "learning_rate": 2.2222222222222223e-05,
+      "loss": 4571710.5,
+      "step": 4
+    },
+    {
+      "epoch": 0.17857142857142858,
+      "grad_norm": 174013440.0,
+      "learning_rate": 2.777777777777778e-05,
+      "loss": 2946220.5,
+      "step": 5
+    },
+    {
+      "epoch": 0.21428571428571427,
+      "grad_norm": 310462848.0,
+      "learning_rate": 3.3333333333333335e-05,
+      "loss": 4198167.5,
+      "step": 6
+    },
+    {
+      "epoch": 0.25,
+      "grad_norm": 295043232.0,
+      "learning_rate": 3.888888888888889e-05,
+      "loss": 2041447.375,
+      "step": 7
+    },
+    {
+      "epoch": 0.2857142857142857,
+      "grad_norm": 275529440.0,
+      "learning_rate": 4.4444444444444447e-05,
+      "loss": 3907286.5,
+      "step": 8
+    },
+    {
+      "epoch": 0.32142857142857145,
+      "grad_norm": 261926944.0,
+      "learning_rate": 5e-05,
+      "loss": 2561375.0,
+      "step": 9
+    },
+    {
+      "epoch": 0.35714285714285715,
+      "grad_norm": 198724384.0,
+      "learning_rate": 4.933333333333334e-05,
+      "loss": 684095.8125,
+      "step": 10
+    },
+    {
+      "epoch": 0.39285714285714285,
+      "grad_norm": 74599368.0,
+      "learning_rate": 4.866666666666667e-05,
+      "loss": 730185.5625,
+      "step": 11
+    },
+    {
+      "epoch": 0.42857142857142855,
+      "grad_norm": 141572384.0,
+      "learning_rate": 4.8e-05,
+      "loss": 1238386.5,
+      "step": 12
+    },
+    {
+      "epoch": 0.4642857142857143,
+      "grad_norm": 105069400.0,
+      "learning_rate": 4.7333333333333336e-05,
+      "loss": 329932.7188,
+      "step": 13
+    },
+    {
+      "epoch": 0.5,
+      "grad_norm": 78809056.0,
+      "learning_rate": 4.666666666666667e-05,
+      "loss": 502494.0312,
+      "step": 14
+    },
+    {
+      "epoch": 0.5357142857142857,
+      "grad_norm": 45120072.0,
+      "learning_rate": 4.600000000000001e-05,
+      "loss": 132410.2188,
+      "step": 15
+    },
+    {
+      "epoch": 0.5714285714285714,
+      "grad_norm": 14674872.0,
+      "learning_rate": 4.5333333333333335e-05,
+      "loss": 117778.0703,
+      "step": 16
+    },
+    {
+      "epoch": 0.6071428571428571,
+      "grad_norm": 12449395.0,
+      "learning_rate": 4.466666666666667e-05,
+      "loss": 36973.5859,
+      "step": 17
+    },
+    {
+      "epoch": 0.6428571428571429,
+      "grad_norm": 7055619.0,
+      "learning_rate": 4.4000000000000006e-05,
+      "loss": 17534.8203,
+      "step": 18
+    },
+    {
+      "epoch": 0.6785714285714286,
+      "grad_norm": 2371520.25,
+      "learning_rate": 4.3333333333333334e-05,
+      "loss": 8574.9141,
+      "step": 19
+    },
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 689186.875,
+      "learning_rate": 4.266666666666667e-05,
+      "loss": 960.9683,
+      "step": 20
+    },
+    {
+      "epoch": 0.75,
+      "grad_norm": 5261831.0,
+      "learning_rate": 4.2e-05,
+      "loss": 3616.8489,
+      "step": 21
+    },
+    {
+      "epoch": 0.7857142857142857,
+      "grad_norm": 391023.5625,
+      "learning_rate": 4.133333333333333e-05,
+      "loss": 1925.2124,
+      "step": 22
+    },
+    {
+      "epoch": 0.8214285714285714,
+      "grad_norm": 348153.03125,
+      "learning_rate": 4.066666666666667e-05,
+      "loss": 846.3534,
+      "step": 23
+    },
+    {
+      "epoch": 0.8571428571428571,
+      "grad_norm": 195729.609375,
+      "learning_rate": 4e-05,
+      "loss": 1115.4226,
+      "step": 24
+    },
+    {
+      "epoch": 0.8928571428571429,
+      "grad_norm": 213168.09375,
+      "learning_rate": 3.933333333333333e-05,
+      "loss": 549.3003,
+      "step": 25
+    },
+    {
+      "epoch": 0.9285714285714286,
+      "grad_norm": 174626.953125,
+      "learning_rate": 3.866666666666667e-05,
+      "loss": 1134.6808,
+      "step": 26
+    },
+    {
+      "epoch": 0.9642857142857143,
+      "grad_norm": 140094.015625,
+      "learning_rate": 3.8e-05,
+      "loss": 317.9678,
+      "step": 27
+    },
+    {
+      "epoch": 1.0,
+      "grad_norm": 18230.22265625,
+      "learning_rate": 3.733333333333334e-05,
+      "loss": 26.3715,
+      "step": 28
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.14285714285714285,
+      "eval_f1_macro": 0.036281179138321996,
+      "eval_f1_micro": 0.14285714285714285,
+      "eval_f1_weighted": 0.036281179138321996,
+      "eval_loss": 3.2450358867645264,
+      "eval_precision_macro": 0.02077922077922078,
+      "eval_precision_micro": 0.14285714285714285,
+      "eval_precision_weighted": 0.02077922077922078,
+      "eval_recall_macro": 0.14285714285714285,
+      "eval_recall_micro": 0.14285714285714285,
+      "eval_recall_weighted": 0.14285714285714285,
+      "eval_runtime": 4.5357,
+      "eval_samples_per_second": 12.346,
+      "eval_steps_per_second": 0.882,
+      "step": 28
+    },
+    {
+      "epoch": 1.0357142857142858,
+      "grad_norm": 44302.54296875,
+      "learning_rate": 3.6666666666666666e-05,
+      "loss": 57.2804,
+      "step": 29
+    },
+    {
+      "epoch": 1.0714285714285714,
+      "grad_norm": 59.95901870727539,
+      "learning_rate": 3.6e-05,
+      "loss": 3.1393,
+      "step": 30
+    },
+    {
+      "epoch": 1.1071428571428572,
+      "grad_norm": 16230.6044921875,
+      "learning_rate": 3.5333333333333336e-05,
+      "loss": 18.976,
+      "step": 31
+    },
+    {
+      "epoch": 1.1428571428571428,
+      "grad_norm": 10362.8798828125,
+      "learning_rate": 3.466666666666667e-05,
+      "loss": 5.5453,
+      "step": 32
+    },
+    {
+      "epoch": 1.1785714285714286,
+      "grad_norm": 55.348052978515625,
+      "learning_rate": 3.4000000000000007e-05,
+      "loss": 3.1038,
+      "step": 33
+    },
+    {
+      "epoch": 1.2142857142857142,
+      "grad_norm": 36.999446868896484,
+      "learning_rate": 3.3333333333333335e-05,
+      "loss": 2.6861,
+      "step": 34
+    },
+    {
+      "epoch": 1.25,
+      "grad_norm": 33.05454635620117,
+      "learning_rate": 3.266666666666667e-05,
+      "loss": 1.6557,
+      "step": 35
+    },
+    {
+      "epoch": 1.2857142857142856,
+      "grad_norm": 60.194175720214844,
+      "learning_rate": 3.2000000000000005e-05,
+      "loss": 2.6653,
+      "step": 36
+    },
+    {
+      "epoch": 1.3214285714285714,
+      "grad_norm": 24.14499282836914,
+      "learning_rate": 3.1333333333333334e-05,
+      "loss": 2.1868,
+      "step": 37
+    },
+    {
+      "epoch": 1.3571428571428572,
+      "grad_norm": 42.75698471069336,
+      "learning_rate": 3.066666666666667e-05,
+      "loss": 2.4374,
+      "step": 38
+    },
+    {
+      "epoch": 1.3928571428571428,
+      "grad_norm": 34.075408935546875,
+      "learning_rate": 3e-05,
+      "loss": 1.9931,
+      "step": 39
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 53.1582145690918,
+      "learning_rate": 2.9333333333333336e-05,
+      "loss": 2.0789,
+      "step": 40
+    },
+    {
+      "epoch": 1.4642857142857144,
+      "grad_norm": 35.603214263916016,
+      "learning_rate": 2.8666666666666668e-05,
+      "loss": 2.1585,
+      "step": 41
+    },
+    {
+      "epoch": 1.5,
+      "grad_norm": 25.19101333618164,
+      "learning_rate": 2.8000000000000003e-05,
+      "loss": 2.1399,
+      "step": 42
+    },
+    {
+      "epoch": 1.5357142857142856,
+      "grad_norm": 28.07346534729004,
+      "learning_rate": 2.733333333333333e-05,
+      "loss": 2.0334,
+      "step": 43
+    },
+    {
+      "epoch": 1.5714285714285714,
+      "grad_norm": 28.849031448364258,
+      "learning_rate": 2.6666666666666667e-05,
+      "loss": 2.0505,
+      "step": 44
+    },
+    {
+      "epoch": 1.6071428571428572,
+      "grad_norm": 27.37757682800293,
+      "learning_rate": 2.6000000000000002e-05,
+      "loss": 1.9464,
+      "step": 45
+    },
+    {
+      "epoch": 1.6428571428571428,
+      "grad_norm": 33.769561767578125,
+      "learning_rate": 2.5333333333333337e-05,
+      "loss": 1.9979,
+      "step": 46
+    },
+    {
+      "epoch": 1.6785714285714286,
+      "grad_norm": 28.812028884887695,
+      "learning_rate": 2.466666666666667e-05,
+      "loss": 2.0561,
+      "step": 47
+    },
+    {
+      "epoch": 1.7142857142857144,
+      "grad_norm": 30.845348358154297,
+      "learning_rate": 2.4e-05,
+      "loss": 2.1788,
+      "step": 48
+    },
+    {
+      "epoch": 1.75,
+      "grad_norm": 20.779951095581055,
+      "learning_rate": 2.3333333333333336e-05,
+      "loss": 2.0341,
+      "step": 49
+    },
+    {
+      "epoch": 1.7857142857142856,
+      "grad_norm": 33.18374252319336,
+      "learning_rate": 2.2666666666666668e-05,
+      "loss": 1.9194,
+      "step": 50
+    },
+    {
+      "epoch": 1.8214285714285714,
+      "grad_norm": 28.13947105407715,
+      "learning_rate": 2.2000000000000003e-05,
+      "loss": 2.0167,
+      "step": 51
+    },
+    {
+      "epoch": 1.8571428571428572,
+      "grad_norm": 18.270055770874023,
+      "learning_rate": 2.1333333333333335e-05,
+      "loss": 2.0225,
+      "step": 52
+    },
+    {
+      "epoch": 1.8928571428571428,
+      "grad_norm": 30.988462448120117,
+      "learning_rate": 2.0666666666666666e-05,
+      "loss": 1.9634,
+      "step": 53
+    },
+    {
+      "epoch": 1.9285714285714286,
+      "grad_norm": 30.876007080078125,
+      "learning_rate": 2e-05,
+      "loss": 2.1378,
+      "step": 54
+    },
+    {
+      "epoch": 1.9642857142857144,
+      "grad_norm": 19.88353729248047,
+      "learning_rate": 1.9333333333333333e-05,
+      "loss": 1.971,
+      "step": 55
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 28.21643829345703,
+      "learning_rate": 1.866666666666667e-05,
+      "loss": 1.8975,
+      "step": 56
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.19642857142857142,
+      "eval_f1_macro": 0.12244897959183673,
+      "eval_f1_micro": 0.19642857142857142,
+      "eval_f1_weighted": 0.12244897959183673,
+      "eval_loss": 1.9160802364349365,
+      "eval_precision_macro": 0.20477664750110572,
+      "eval_precision_micro": 0.19642857142857142,
+      "eval_precision_weighted": 0.20477664750110572,
+      "eval_recall_macro": 0.19642857142857142,
+      "eval_recall_micro": 0.19642857142857142,
+      "eval_recall_weighted": 0.19642857142857142,
+      "eval_runtime": 4.7496,
+      "eval_samples_per_second": 11.79,
+      "eval_steps_per_second": 0.842,
+      "step": 56
+    },
+    {
+      "epoch": 2.0357142857142856,
+      "grad_norm": 45.93918228149414,
+      "learning_rate": 1.8e-05,
+      "loss": 1.637,
+      "step": 57
+    },
+    {
+      "epoch": 2.0714285714285716,
+      "grad_norm": 29.07505226135254,
+      "learning_rate": 1.7333333333333336e-05,
+      "loss": 2.0992,
+      "step": 58
+    },
+    {
+      "epoch": 2.107142857142857,
+      "grad_norm": 19.287498474121094,
+      "learning_rate": 1.6666666666666667e-05,
+      "loss": 1.7994,
+      "step": 59
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 25.761016845703125,
+      "learning_rate": 1.6000000000000003e-05,
+      "loss": 1.8948,
+      "step": 60
+    },
+    {
+      "epoch": 2.1785714285714284,
+      "grad_norm": 30.0518798828125,
+      "learning_rate": 1.5333333333333334e-05,
+      "loss": 1.9301,
+      "step": 61
+    },
+    {
+      "epoch": 2.2142857142857144,
+      "grad_norm": 27.495458602905273,
+      "learning_rate": 1.4666666666666668e-05,
+      "loss": 1.9712,
+      "step": 62
+    },
+    {
+      "epoch": 2.25,
+      "grad_norm": 27.65778350830078,
+      "learning_rate": 1.4000000000000001e-05,
+      "loss": 1.9837,
+      "step": 63
+    },
+    {
+      "epoch": 2.2857142857142856,
+      "grad_norm": 26.54891014099121,
+      "learning_rate": 1.3333333333333333e-05,
+      "loss": 1.7548,
+      "step": 64
+    },
+    {
+      "epoch": 2.3214285714285716,
+      "grad_norm": 31.930673599243164,
+      "learning_rate": 1.2666666666666668e-05,
+      "loss": 1.9568,
+      "step": 65
+    },
+    {
+      "epoch": 2.357142857142857,
+      "grad_norm": 27.43727684020996,
+      "learning_rate": 1.2e-05,
+      "loss": 1.9759,
+      "step": 66
+    },
+    {
+      "epoch": 2.392857142857143,
+      "grad_norm": 21.30677032470703,
+      "learning_rate": 1.1333333333333334e-05,
+      "loss": 2.0283,
+      "step": 67
+    },
+    {
+      "epoch": 2.4285714285714284,
+      "grad_norm": 28.749021530151367,
+      "learning_rate": 1.0666666666666667e-05,
+      "loss": 1.8936,
+      "step": 68
+    },
+    {
+      "epoch": 2.4642857142857144,
+      "grad_norm": 26.132905960083008,
+      "learning_rate": 1e-05,
+      "loss": 1.8316,
+      "step": 69
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 17.647850036621094,
+      "learning_rate": 9.333333333333334e-06,
+      "loss": 1.6821,
+      "step": 70
+    },
+    {
+      "epoch": 2.5357142857142856,
+      "grad_norm": 19.563146591186523,
+      "learning_rate": 8.666666666666668e-06,
+      "loss": 1.7006,
+      "step": 71
+    },
+    {
+      "epoch": 2.571428571428571,
+      "grad_norm": 25.576669692993164,
+      "learning_rate": 8.000000000000001e-06,
+      "loss": 1.9317,
+      "step": 72
+    },
+    {
+      "epoch": 2.607142857142857,
+      "grad_norm": 21.140615463256836,
+      "learning_rate": 7.333333333333334e-06,
+      "loss": 1.7071,
+      "step": 73
+    },
+    {
+      "epoch": 2.642857142857143,
+      "grad_norm": 18.916963577270508,
+      "learning_rate": 6.666666666666667e-06,
+      "loss": 1.6799,
+      "step": 74
+    },
+    {
+      "epoch": 2.678571428571429,
+      "grad_norm": 21.43787956237793,
+      "learning_rate": 6e-06,
+      "loss": 1.7079,
+      "step": 75
+    },
+    {
+      "epoch": 2.7142857142857144,
+      "grad_norm": 32.862083435058594,
+      "learning_rate": 5.333333333333334e-06,
+      "loss": 1.7776,
+      "step": 76
+    },
+    {
+      "epoch": 2.75,
+      "grad_norm": 19.999584197998047,
+      "learning_rate": 4.666666666666667e-06,
+      "loss": 1.422,
+      "step": 77
+    },
+    {
+      "epoch": 2.7857142857142856,
+      "grad_norm": 31.127351760864258,
+      "learning_rate": 4.000000000000001e-06,
+      "loss": 2.0594,
+      "step": 78
+    },
+    {
+      "epoch": 2.821428571428571,
+      "grad_norm": 29.890186309814453,
+      "learning_rate": 3.3333333333333333e-06,
+      "loss": 1.5418,
+      "step": 79
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 26.948698043823242,
+      "learning_rate": 2.666666666666667e-06,
+      "loss": 1.8609,
+      "step": 80
+    },
+    {
+      "epoch": 2.892857142857143,
+      "grad_norm": 29.302663803100586,
+      "learning_rate": 2.0000000000000003e-06,
+      "loss": 1.8429,
+      "step": 81
+    },
+    {
+      "epoch": 2.928571428571429,
+      "grad_norm": 28.169702529907227,
+      "learning_rate": 1.3333333333333334e-06,
+      "loss": 1.7572,
+      "step": 82
+    },
+    {
+      "epoch": 2.9642857142857144,
+      "grad_norm": 32.628578186035156,
+      "learning_rate": 6.666666666666667e-07,
+      "loss": 1.693,
+      "step": 83
+    },
+    {
+      "epoch": 3.0,
+      "grad_norm": 25.8957462310791,
+      "learning_rate": 0.0,
+      "loss": 1.422,
+      "step": 84
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.35714285714285715,
+      "eval_f1_macro": 0.3432320638995863,
+      "eval_f1_micro": 0.35714285714285715,
+      "eval_f1_weighted": 0.3432320638995863,
+      "eval_loss": 1.7558108568191528,
+      "eval_precision_macro": 0.6085343228200372,
+      "eval_precision_micro": 0.35714285714285715,
+      "eval_precision_weighted": 0.6085343228200372,
+      "eval_recall_macro": 0.35714285714285715,
+      "eval_recall_micro": 0.35714285714285715,
+      "eval_recall_weighted": 0.35714285714285715,
+      "eval_runtime": 4.7032,
+      "eval_samples_per_second": 11.907,
+      "eval_steps_per_second": 0.85,
+      "step": 84
+    }
+  ],
+  "logging_steps": 1,
+  "max_steps": 84,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 5,
+        "early_stopping_threshold": 0.01
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 10536355307520.0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-84/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91985e71ce5cb37df961d9103170c821b998b7345c2051c8e5b5548a218e1985
+size 5368

config.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "_name_or_path": "google/mobilebert-uncased",
+  "_num_labels": 7,
+  "architectures": [
+    "MobileBertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_activation": false,
+  "classifier_dropout": null,
+  "embedding_size": 128,
+  "hidden_act": "relu",
+  "hidden_dropout_prob": 0.0,
+  "hidden_size": 512,
+  "id2label": {
+    "0": "anniversary",
+    "1": "baby",
+    "2": "birthday",
+    "3": "get_well",
+    "4": "holiday",
+    "5": "promotion",
+    "6": "wedding"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 512,
+  "intra_bottleneck_size": 128,
+  "key_query_shared_bottleneck": true,
+  "label2id": {
+    "anniversary": 0,
+    "baby": 1,
+    "birthday": 2,
+    "get_well": 3,
+    "holiday": 4,
+    "promotion": 5,
+    "wedding": 6
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "mobilebert",
+  "normalization_type": "no_norm",
+  "num_attention_heads": 4,
+  "num_feedforward_networks": 4,
+  "num_hidden_layers": 24,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.0",
+  "trigram_input": true,
+  "true_hidden_size": 128,
+  "type_vocab_size": 2,
+  "use_bottleneck": true,
+  "use_bottleneck_attention": false,
+  "vocab_size": 30522
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f3afca87ac473bfc430ab58b3fe58e985d3ac71f86c6748fd1e7e3432e743ae
+size 98480380

runs/Jun30_23-40-29_r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k/events.out.tfevents.1751326832.r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k.114.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4be9a5d099a3aa2d226fdf5428f8a3382440693ec98836cc61b1a71ebda352d3
-size 5620

 version https://git-lfs.github.com/spec/v1
+oid sha256:502aff7fdf42b72e4b74549c20e58c35d46838e38c75b550afc2c14f14ce8710
+size 25810

runs/Jun30_23-40-29_r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k/events.out.tfevents.1751327028.r-robo-noct-autotrain-advanced-kegy3hzm-59701-y966k.114.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1bceee9820d7a77eaafb097e463b608cabc2ec5e1a03f32d7e19a25256c4d81
+size 906

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "MobileBertTokenizer",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91985e71ce5cb37df961d9103170c821b998b7345c2051c8e5b5548a218e1985
+size 5368

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "greetings/autotrain-data",
+    "model": "google/mobilebert-uncased",
+    "lr": 5e-05,
+    "epochs": 3,
+    "max_seq_length": 128,
+    "batch_size": 8,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 1,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": -1,
+    "project_name": "greetings",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "push_to_hub": true,
+    "eval_strategy": "epoch",
+    "username": "robo-noct",
+    "log": "tensorboard",
+    "early_stopping_patience": 5,
+    "early_stopping_threshold": 0.01
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff