jkloip committed on Dec 23, 2023

Commit

b757da9

1 Parent(s): 5ff920b

Training in progress, epoch 5

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-3/checkpoint-134/config.json +25 -0
run-3/checkpoint-134/model.safetensors +3 -0
run-3/checkpoint-134/optimizer.pt +3 -0
run-3/checkpoint-134/rng_state.pth +3 -0
run-3/checkpoint-134/scheduler.pt +3 -0
run-3/checkpoint-134/special_tokens_map.json +7 -0
run-3/checkpoint-134/tokenizer.json +0 -0
run-3/checkpoint-134/tokenizer_config.json +55 -0
run-3/checkpoint-134/trainer_state.json +35 -0
run-3/checkpoint-134/training_args.bin +3 -0
run-3/checkpoint-134/vocab.txt +0 -0
run-3/checkpoint-268/config.json +25 -0
run-3/checkpoint-268/model.safetensors +3 -0
run-3/checkpoint-268/optimizer.pt +3 -0
run-3/checkpoint-268/rng_state.pth +3 -0
run-3/checkpoint-268/scheduler.pt +3 -0
run-3/checkpoint-268/special_tokens_map.json +7 -0
run-3/checkpoint-268/tokenizer.json +0 -0
run-3/checkpoint-268/tokenizer_config.json +55 -0
run-3/checkpoint-268/trainer_state.json +44 -0
run-3/checkpoint-268/training_args.bin +3 -0
run-3/checkpoint-268/vocab.txt +0 -0
run-3/checkpoint-402/config.json +25 -0
run-3/checkpoint-402/model.safetensors +3 -0
run-3/checkpoint-402/optimizer.pt +3 -0
run-3/checkpoint-402/rng_state.pth +3 -0
run-3/checkpoint-402/scheduler.pt +3 -0
run-3/checkpoint-402/special_tokens_map.json +7 -0
run-3/checkpoint-402/tokenizer.json +0 -0
run-3/checkpoint-402/tokenizer_config.json +55 -0
run-3/checkpoint-402/trainer_state.json +53 -0
run-3/checkpoint-402/training_args.bin +3 -0
run-3/checkpoint-402/vocab.txt +0 -0
run-3/checkpoint-536/config.json +25 -0
run-3/checkpoint-536/model.safetensors +3 -0
run-3/checkpoint-536/optimizer.pt +3 -0
run-3/checkpoint-536/rng_state.pth +3 -0
run-3/checkpoint-536/scheduler.pt +3 -0
run-3/checkpoint-536/special_tokens_map.json +7 -0
run-3/checkpoint-536/tokenizer.json +0 -0
run-3/checkpoint-536/tokenizer_config.json +55 -0
run-3/checkpoint-536/trainer_state.json +68 -0
run-3/checkpoint-536/training_args.bin +3 -0
run-3/checkpoint-536/vocab.txt +0 -0
run-3/checkpoint-670/config.json +25 -0
run-3/checkpoint-670/model.safetensors +3 -0
run-3/checkpoint-670/optimizer.pt +3 -0
run-3/checkpoint-670/rng_state.pth +3 -0
run-3/checkpoint-670/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c357968e0a3805db65c07d3c26ba48a78f6bd0bed57b7173d45b64ea9bb85388
+oid sha256:18c08b238185a665e6c765c8543a25da9deb3f4fa8c810fa3f5a10a7cefdf02b
 size 267832560

run-3/checkpoint-134/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-134/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c357968e0a3805db65c07d3c26ba48a78f6bd0bed57b7173d45b64ea9bb85388
+size 267832560

run-3/checkpoint-134/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3311991337ab90a77d3c3a714795c72c6a096e6e97f9b1ed4a95f02a4187c2fb
+size 535727290

run-3/checkpoint-134/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:672d05d07791b4671d0f7afa38c63a9ff85090cdc1d04cbad9ddfce0f46ec00d
+size 14308

run-3/checkpoint-134/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:adba1f7fc495a437f1201f5de22d3b69e0016f8d69c0e7f699f76582f591ca1d
+size 1064

run-3/checkpoint-134/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-134/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-134/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-134/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.5003634450667074,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-134",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 134,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.461589515209198,
+      "eval_matthews_correlation": 0.5003634450667074,
+      "eval_runtime": 0.7344,
+      "eval_samples_per_second": 1420.294,
+      "eval_steps_per_second": 89.875,
+      "step": 134
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.39643585629229e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 8
+  }
+}

run-3/checkpoint-134/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d067f40a1b69ace8d63eac7f97d640452b05211e150c858ed37e0bb442c21c6
+size 4792

run-3/checkpoint-134/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-268/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-268/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff4b456a35d5f5fe2929e52f56dc1932d473f4a7020bfd856dc9e2737b0225ed
+size 267832560

run-3/checkpoint-268/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7263d4956a17aacb83f241a32d19a027251ea180ffff3033bb6c4db4390edab2
+size 535727290

run-3/checkpoint-268/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:543eb2f41e910aede1a91d84ecba8220d76bd861ddd49309c8a6285aff0f9aca
+size 14308

run-3/checkpoint-268/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f30d13db5297df36df88f2cb9c9a8dae3813d321bf15bb00e436a6e486bae69
+size 1064

run-3/checkpoint-268/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-268/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-268/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-268/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.5294539646667358,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-268",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 268,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.461589515209198,
+      "eval_matthews_correlation": 0.5003634450667074,
+      "eval_runtime": 0.7344,
+      "eval_samples_per_second": 1420.294,
+      "eval_steps_per_second": 89.875,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.4695161283016205,
+      "eval_matthews_correlation": 0.5294539646667358,
+      "eval_runtime": 0.8028,
+      "eval_samples_per_second": 1299.154,
+      "eval_steps_per_second": 82.209,
+      "step": 268
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.39643585629229e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 8
+  }
+}

run-3/checkpoint-268/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d067f40a1b69ace8d63eac7f97d640452b05211e150c858ed37e0bb442c21c6
+size 4792

run-3/checkpoint-268/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-402/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-402/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1e0c758160eb243610bc9b5fbb75d997db3cd02ab7e91bbf884cb95aa63a4fcf
+size 267832560

run-3/checkpoint-402/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe59b45501434c3a13127695cf06458843f03f8df90a5c8bdbc4ae2cf9baa23b
+size 535727290

run-3/checkpoint-402/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:51731b36423511e6bbba899c1ecf4400783db1e30329c95ab76cb45afe42b280
+size 14308

run-3/checkpoint-402/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bbab540f7b7dd0b30df7a5b0680dae8208aa19a651310ca85f138502d00d09dd
+size 1064

run-3/checkpoint-402/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-402/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-402/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-402/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.5307774141574897,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-402",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 402,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.461589515209198,
+      "eval_matthews_correlation": 0.5003634450667074,
+      "eval_runtime": 0.7344,
+      "eval_samples_per_second": 1420.294,
+      "eval_steps_per_second": 89.875,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.4695161283016205,
+      "eval_matthews_correlation": 0.5294539646667358,
+      "eval_runtime": 0.8028,
+      "eval_samples_per_second": 1299.154,
+      "eval_steps_per_second": 82.209,
+      "step": 268
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.5461736917495728,
+      "eval_matthews_correlation": 0.5307774141574897,
+      "eval_runtime": 0.7708,
+      "eval_samples_per_second": 1353.061,
+      "eval_steps_per_second": 85.62,
+      "step": 402
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.39643585629229e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 8
+  }
+}

run-3/checkpoint-402/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d067f40a1b69ace8d63eac7f97d640452b05211e150c858ed37e0bb442c21c6
+size 4792

run-3/checkpoint-402/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-536/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-536/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd237df06af3bdaf8f0bae9d83c50dfabb167651af9c1cd482a209412f1121d3
+size 267832560

run-3/checkpoint-536/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df40308541c65aeb30f9a9d3c0c08d096c95d20d7e7a19588e0d9d8fa2992c9a
+size 535727290

run-3/checkpoint-536/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5b279552773eaceb1f4413113fbd71d8de8fb91e90760d113942025fc702866
+size 14308

run-3/checkpoint-536/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:125ab61c904d7d6bdbbae34a5e4413ed26f16770cfb0a40ee0dcdb552ed3c974
+size 1064

run-3/checkpoint-536/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-536/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-536/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-536/trainer_state.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "best_metric": 0.5452100835559165,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-536",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 536,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.461589515209198,
+      "eval_matthews_correlation": 0.5003634450667074,
+      "eval_runtime": 0.7344,
+      "eval_samples_per_second": 1420.294,
+      "eval_steps_per_second": 89.875,
+      "step": 134
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.4695161283016205,
+      "eval_matthews_correlation": 0.5294539646667358,
+      "eval_runtime": 0.8028,
+      "eval_samples_per_second": 1299.154,
+      "eval_steps_per_second": 82.209,
+      "step": 268
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.5461736917495728,
+      "eval_matthews_correlation": 0.5307774141574897,
+      "eval_runtime": 0.7708,
+      "eval_samples_per_second": 1353.061,
+      "eval_steps_per_second": 85.62,
+      "step": 402
+    },
+    {
+      "epoch": 3.73,
+      "learning_rate": 1.1155135754771483e-05,
+      "loss": 0.3108,
+      "step": 500
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.6153345704078674,
+      "eval_matthews_correlation": 0.5452100835559165,
+      "eval_runtime": 1.1255,
+      "eval_samples_per_second": 926.661,
+      "eval_steps_per_second": 58.638,
+      "step": 536
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 670,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 210172722962532.0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.39643585629229e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 8
+  }
+}

run-3/checkpoint-536/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d067f40a1b69ace8d63eac7f97d640452b05211e150c858ed37e0bb442c21c6
+size 4792

run-3/checkpoint-536/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-670/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-670/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:18c08b238185a665e6c765c8543a25da9deb3f4fa8c810fa3f5a10a7cefdf02b
+size 267832560

run-3/checkpoint-670/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9512b7910f1669173ffaf2fa83dc16c02303e93614ac64e47e0d5b051a264ca5
+size 535727290

run-3/checkpoint-670/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e340327c88a777fcc9ceef5f5a39f8264ab97fb7d31040e95b08a4454bed093
+size 14308

run-3/checkpoint-670/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d7f79e9f90e6f4bcadbfbd2bf23b381f22fdc5a0ce6ca1d2d782e864a09fc3f
+size 1064