thilaksai77 committed on Apr 19, 2025

Commit

e041d61

verified ·

1 Parent(s): b6ce170

Upload folder using huggingface_hub

Browse files

Files changed (42) hide show

checkpoint-106/config.json +42 -0
checkpoint-106/model.safetensors +3 -0
checkpoint-106/optimizer.pt +3 -0
checkpoint-106/rng_state.pth +3 -0
checkpoint-106/scheduler.pt +3 -0
checkpoint-106/trainer_state.json +66 -0
checkpoint-106/training_args.bin +3 -0
checkpoint-159/config.json +42 -0
checkpoint-159/model.safetensors +3 -0
checkpoint-159/optimizer.pt +3 -0
checkpoint-159/rng_state.pth +3 -0
checkpoint-159/scheduler.pt +3 -0
checkpoint-159/trainer_state.json +82 -0
checkpoint-159/training_args.bin +3 -0
checkpoint-212/config.json +42 -0
checkpoint-212/model.safetensors +3 -0
checkpoint-212/optimizer.pt +3 -0
checkpoint-212/rng_state.pth +3 -0
checkpoint-212/scheduler.pt +3 -0
checkpoint-212/trainer_state.json +98 -0
checkpoint-212/training_args.bin +3 -0
checkpoint-265/config.json +42 -0
checkpoint-265/model.safetensors +3 -0
checkpoint-265/optimizer.pt +3 -0
checkpoint-265/rng_state.pth +3 -0
checkpoint-265/scheduler.pt +3 -0
checkpoint-265/trainer_state.json +114 -0
checkpoint-265/training_args.bin +3 -0
checkpoint-53/config.json +42 -0
checkpoint-53/model.safetensors +3 -0
checkpoint-53/optimizer.pt +3 -0
checkpoint-53/rng_state.pth +3 -0
checkpoint-53/scheduler.pt +3 -0
checkpoint-53/trainer_state.json +50 -0
checkpoint-53/training_args.bin +3 -0
config.json +42 -0
label_encoder.joblib +3 -0
model.safetensors +3 -0
special_tokens_map.json +7 -0
tokenizer.json +0 -0
tokenizer_config.json +56 -0
vocab.txt +0 -0

checkpoint-106/config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "vocab_size": 30522
+}

checkpoint-106/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6080ad8f680c96f69d7615cfc2f17cd3aa3a5d7d86a120fdd73fb3fbe5cd54bc
+size 267847948

checkpoint-106/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c2f6ed832b46410fc9808835f0e3b557805210aed2d25d701ec786bce49938fa
+size 535755130

checkpoint-106/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06e55bfc8723f269a626afca0be6f7def5753f3bb265436b94c5580b703cfcc7
+size 13990

checkpoint-106/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d454f75613eedad47305d0f5455c6623b5e20d207f2b824cc564f1776df73e4
+size 1064

checkpoint-106/trainer_state.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+  "best_global_step": 106,
+  "best_metric": 0.5238095238095238,
+  "best_model_checkpoint": "./emotion_classifier/checkpoint-106",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 106,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9433962264150944,
+      "grad_norm": 3.0282411575317383,
+      "learning_rate": 1.6301886792452833e-05,
+      "loss": 1.6377,
+      "step": 50
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.47619047619047616,
+      "eval_loss": 1.4806143045425415,
+      "eval_runtime": 2.5602,
+      "eval_samples_per_second": 41.012,
+      "eval_steps_per_second": 2.734,
+      "step": 53
+    },
+    {
+      "epoch": 1.8867924528301887,
+      "grad_norm": 5.8678812980651855,
+      "learning_rate": 1.2528301886792453e-05,
+      "loss": 1.4,
+      "step": 100
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3838814496994019,
+      "eval_runtime": 2.3279,
+      "eval_samples_per_second": 45.106,
+      "eval_steps_per_second": 3.007,
+      "step": 106
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 265,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 55641268408320.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-106/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9176974d5ca9307eaa01d489fefe68df96bb0a20f04f32ce3a207d3158a4f91d
+size 5240

checkpoint-159/config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "vocab_size": 30522
+}

checkpoint-159/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf7ac83f56b901c470482732a0102fa47de706dc56618c1d32811db881d4720d
+size 267847948

checkpoint-159/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6da379e7c982530b9c15753734b706ae5c65f64e41dd105d64481f302c5d5f24
+size 535755130

checkpoint-159/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32d32051101ec51c2b04c4ee6a6d2c7f40562e56836cbb02d6e6e3126490484d
+size 13990

checkpoint-159/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6f1da9e78fb7143f96c608378211ebe49e8b42e09cc551a079d15d8d54a1a44
+size 1064

checkpoint-159/trainer_state.json ADDED Viewed

	@@ -0,0 +1,82 @@

+{
+  "best_global_step": 106,
+  "best_metric": 0.5238095238095238,
+  "best_model_checkpoint": "./emotion_classifier/checkpoint-106",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 159,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9433962264150944,
+      "grad_norm": 3.0282411575317383,
+      "learning_rate": 1.6301886792452833e-05,
+      "loss": 1.6377,
+      "step": 50
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.47619047619047616,
+      "eval_loss": 1.4806143045425415,
+      "eval_runtime": 2.5602,
+      "eval_samples_per_second": 41.012,
+      "eval_steps_per_second": 2.734,
+      "step": 53
+    },
+    {
+      "epoch": 1.8867924528301887,
+      "grad_norm": 5.8678812980651855,
+      "learning_rate": 1.2528301886792453e-05,
+      "loss": 1.4,
+      "step": 100
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3838814496994019,
+      "eval_runtime": 2.3279,
+      "eval_samples_per_second": 45.106,
+      "eval_steps_per_second": 3.007,
+      "step": 106
+    },
+    {
+      "epoch": 2.830188679245283,
+      "grad_norm": 4.850906848907471,
+      "learning_rate": 8.754716981132076e-06,
+      "loss": 1.2805,
+      "step": 150
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3527458906173706,
+      "eval_runtime": 2.4197,
+      "eval_samples_per_second": 43.394,
+      "eval_steps_per_second": 2.893,
+      "step": 159
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 265,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 83461902612480.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-159/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9176974d5ca9307eaa01d489fefe68df96bb0a20f04f32ce3a207d3158a4f91d
+size 5240

checkpoint-212/config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "vocab_size": 30522
+}

checkpoint-212/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05db532e969998d68aab84e8793f077254f48699ddef1b716bee5218b010da1d
+size 267847948

checkpoint-212/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:86242dbcb65e37020fbbb309a71609d3bbb2b5c335006214af46fec7212439ec
+size 535755130

checkpoint-212/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2fed77b14fe062f6db72d68cedd6fd95bae3305b7a735eef3c85da43fd15d476
+size 13990

checkpoint-212/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4975515fea706f12828b41b6a19e58079c2d505f4d25932c978e5edb1c949651
+size 1064

checkpoint-212/trainer_state.json ADDED Viewed

	@@ -0,0 +1,98 @@

+{
+  "best_global_step": 212,
+  "best_metric": 0.5619047619047619,
+  "best_model_checkpoint": "./emotion_classifier/checkpoint-212",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 212,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9433962264150944,
+      "grad_norm": 3.0282411575317383,
+      "learning_rate": 1.6301886792452833e-05,
+      "loss": 1.6377,
+      "step": 50
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.47619047619047616,
+      "eval_loss": 1.4806143045425415,
+      "eval_runtime": 2.5602,
+      "eval_samples_per_second": 41.012,
+      "eval_steps_per_second": 2.734,
+      "step": 53
+    },
+    {
+      "epoch": 1.8867924528301887,
+      "grad_norm": 5.8678812980651855,
+      "learning_rate": 1.2528301886792453e-05,
+      "loss": 1.4,
+      "step": 100
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3838814496994019,
+      "eval_runtime": 2.3279,
+      "eval_samples_per_second": 45.106,
+      "eval_steps_per_second": 3.007,
+      "step": 106
+    },
+    {
+      "epoch": 2.830188679245283,
+      "grad_norm": 4.850906848907471,
+      "learning_rate": 8.754716981132076e-06,
+      "loss": 1.2805,
+      "step": 150
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3527458906173706,
+      "eval_runtime": 2.4197,
+      "eval_samples_per_second": 43.394,
+      "eval_steps_per_second": 2.893,
+      "step": 159
+    },
+    {
+      "epoch": 3.7735849056603774,
+      "grad_norm": 5.995235919952393,
+      "learning_rate": 4.981132075471698e-06,
+      "loss": 1.1901,
+      "step": 200
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.5619047619047619,
+      "eval_loss": 1.3129359483718872,
+      "eval_runtime": 2.3883,
+      "eval_samples_per_second": 43.964,
+      "eval_steps_per_second": 2.931,
+      "step": 212
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 265,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 111282536816640.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-212/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9176974d5ca9307eaa01d489fefe68df96bb0a20f04f32ce3a207d3158a4f91d
+size 5240

checkpoint-265/config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "vocab_size": 30522
+}

checkpoint-265/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91e89b6ec3ca68b80d5a63dd889e7abac68c35ff11edc084857cb6acd90e9fad
+size 267847948

checkpoint-265/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:672a5278e81c001a17230b84b8783e3f00d4d1bbda5d9c6ec4ef8c3768c7754c
+size 535755130

checkpoint-265/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:013d13e4b269a8648da58d2f40bf48e004388ea0631771b8c8e588ab75375092
+size 13990

checkpoint-265/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e4c4cef33a319fecd6991107d5735165ecc2806d559e7a9020ceb0f2dfce8ad
+size 1064

checkpoint-265/trainer_state.json ADDED Viewed

	@@ -0,0 +1,114 @@

+{
+  "best_global_step": 212,
+  "best_metric": 0.5619047619047619,
+  "best_model_checkpoint": "./emotion_classifier/checkpoint-212",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 265,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9433962264150944,
+      "grad_norm": 3.0282411575317383,
+      "learning_rate": 1.6301886792452833e-05,
+      "loss": 1.6377,
+      "step": 50
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.47619047619047616,
+      "eval_loss": 1.4806143045425415,
+      "eval_runtime": 2.5602,
+      "eval_samples_per_second": 41.012,
+      "eval_steps_per_second": 2.734,
+      "step": 53
+    },
+    {
+      "epoch": 1.8867924528301887,
+      "grad_norm": 5.8678812980651855,
+      "learning_rate": 1.2528301886792453e-05,
+      "loss": 1.4,
+      "step": 100
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3838814496994019,
+      "eval_runtime": 2.3279,
+      "eval_samples_per_second": 45.106,
+      "eval_steps_per_second": 3.007,
+      "step": 106
+    },
+    {
+      "epoch": 2.830188679245283,
+      "grad_norm": 4.850906848907471,
+      "learning_rate": 8.754716981132076e-06,
+      "loss": 1.2805,
+      "step": 150
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.5238095238095238,
+      "eval_loss": 1.3527458906173706,
+      "eval_runtime": 2.4197,
+      "eval_samples_per_second": 43.394,
+      "eval_steps_per_second": 2.893,
+      "step": 159
+    },
+    {
+      "epoch": 3.7735849056603774,
+      "grad_norm": 5.995235919952393,
+      "learning_rate": 4.981132075471698e-06,
+      "loss": 1.1901,
+      "step": 200
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.5619047619047619,
+      "eval_loss": 1.3129359483718872,
+      "eval_runtime": 2.3883,
+      "eval_samples_per_second": 43.964,
+      "eval_steps_per_second": 2.931,
+      "step": 212
+    },
+    {
+      "epoch": 4.716981132075472,
+      "grad_norm": 5.1387858390808105,
+      "learning_rate": 1.207547169811321e-06,
+      "loss": 1.1054,
+      "step": 250
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.5619047619047619,
+      "eval_loss": 1.3082963228225708,
+      "eval_runtime": 2.8874,
+      "eval_samples_per_second": 36.365,
+      "eval_steps_per_second": 2.424,
+      "step": 265
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 265,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 139103171020800.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-265/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9176974d5ca9307eaa01d489fefe68df96bb0a20f04f32ce3a207d3158a4f91d
+size 5240

checkpoint-53/config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "vocab_size": 30522
+}

checkpoint-53/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0592d0c1503f64aec1f8fdf55535d5502ee1897a730a515560a943cb1043447d
+size 267847948

checkpoint-53/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c2a8bfe652da492f8a075be57243a9e4d4308b34c37484ae24a09ca6a092775
+size 535755130

checkpoint-53/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8b182573f61d8bcf5eaefcbf8f98d8734b6db51b44ad36aed3a305c431539fa1
+size 13990

checkpoint-53/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b5f63d83bd91fc8f839183eaded51a51404df88223c86067e72107f7fcf1d3f
+size 1064

checkpoint-53/trainer_state.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "best_global_step": 53,
+  "best_metric": 0.47619047619047616,
+  "best_model_checkpoint": "./emotion_classifier/checkpoint-53",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 53,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9433962264150944,
+      "grad_norm": 3.0282411575317383,
+      "learning_rate": 1.6301886792452833e-05,
+      "loss": 1.6377,
+      "step": 50
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.47619047619047616,
+      "eval_loss": 1.4806143045425415,
+      "eval_runtime": 2.5602,
+      "eval_samples_per_second": 41.012,
+      "eval_steps_per_second": 2.734,
+      "step": 53
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 265,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 27820634204160.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-53/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9176974d5ca9307eaa01d489fefe68df96bb0a20f04f32ce3a207d3158a4f91d
+size 5240

config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5",
+    "6": "LABEL_6"
+  },
+  "initializer_range": 0.02,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5,
+    "LABEL_6": 6
+  },
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.3",
+  "vocab_size": 30522
+}

label_encoder.joblib ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fec0df84b82ac7d39a7922b4afdde8eac836d198673eb110dcf5ff29b6e6cb24
+size 608

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05db532e969998d68aab84e8793f077254f48699ddef1b716bee5218b010da1d
+size 267847948

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff