dannychou committed on Dec 23, 2023

Commit

1d51f0b

1 Parent(s): 6e147d0

Training in progress, epoch 5

Browse files

Files changed (46) hide show

model.safetensors +1 -1
run-3/checkpoint-1072/config.json +25 -0
run-3/checkpoint-1072/model.safetensors +3 -0
run-3/checkpoint-1072/optimizer.pt +3 -0
run-3/checkpoint-1072/rng_state.pth +3 -0
run-3/checkpoint-1072/scheduler.pt +3 -0
run-3/checkpoint-1072/special_tokens_map.json +7 -0
run-3/checkpoint-1072/tokenizer.json +0 -0
run-3/checkpoint-1072/tokenizer_config.json +55 -0
run-3/checkpoint-1072/trainer_state.json +74 -0
run-3/checkpoint-1072/training_args.bin +3 -0
run-3/checkpoint-1072/vocab.txt +0 -0
run-3/checkpoint-268/config.json +25 -0
run-3/checkpoint-268/model.safetensors +3 -0
run-3/checkpoint-268/optimizer.pt +3 -0
run-3/checkpoint-268/rng_state.pth +3 -0
run-3/checkpoint-268/scheduler.pt +3 -0
run-3/checkpoint-268/special_tokens_map.json +7 -0
run-3/checkpoint-268/tokenizer.json +0 -0
run-3/checkpoint-268/tokenizer_config.json +55 -0
run-3/checkpoint-268/trainer_state.json +35 -0
run-3/checkpoint-268/training_args.bin +3 -0
run-3/checkpoint-268/vocab.txt +0 -0
run-3/checkpoint-536/config.json +25 -0
run-3/checkpoint-536/model.safetensors +3 -0
run-3/checkpoint-536/optimizer.pt +3 -0
run-3/checkpoint-536/rng_state.pth +3 -0
run-3/checkpoint-536/scheduler.pt +3 -0
run-3/checkpoint-536/special_tokens_map.json +7 -0
run-3/checkpoint-536/tokenizer.json +0 -0
run-3/checkpoint-536/tokenizer_config.json +55 -0
run-3/checkpoint-536/trainer_state.json +50 -0
run-3/checkpoint-536/training_args.bin +3 -0
run-3/checkpoint-536/vocab.txt +0 -0
run-3/checkpoint-804/config.json +25 -0
run-3/checkpoint-804/model.safetensors +3 -0
run-3/checkpoint-804/optimizer.pt +3 -0
run-3/checkpoint-804/rng_state.pth +3 -0
run-3/checkpoint-804/scheduler.pt +3 -0
run-3/checkpoint-804/special_tokens_map.json +7 -0
run-3/checkpoint-804/tokenizer.json +0 -0
run-3/checkpoint-804/tokenizer_config.json +55 -0
run-3/checkpoint-804/trainer_state.json +59 -0
run-3/checkpoint-804/training_args.bin +3 -0
run-3/checkpoint-804/vocab.txt +0 -0
runs/Dec23_02-10-12_067bf7a71e5c/events.out.tfevents.1703298490.067bf7a71e5c.178.5 +2 -2

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df9da5d86d23a16eca8727d004dfe63b540561578a05c9033bcea31d05e1767e
+oid sha256:d747f47ecdd25c1b091c915b2013ee4bdb18de77acfb25abbd5ceb5b8190e40a
 size 267832560

run-3/checkpoint-1072/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-1072/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:612692b245ca538d9a6e5f6279115ccea72532d92ce833a6eba9d47249f20e76
+size 267832560

run-3/checkpoint-1072/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc79440b5bd720145f5f7eb32edc941fd85898fc38b9a620a7e7cd431b4d2db1
+size 535727290

run-3/checkpoint-1072/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c427b597378496e52a675cc52b7e7854560eca517bcc1a9acff185bab072c6e7
+size 14308

run-3/checkpoint-1072/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:625ac2ebd4538e5d5db3ebd5483143d39404f7887dda5e6f5564668b9441bb7b
+size 1064

run-3/checkpoint-1072/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-1072/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-1072/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-1072/trainer_state.json ADDED Viewed

	@@ -0,0 +1,74 @@

+{
+  "best_metric": 0.5104242686414723,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-1072",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 1072,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.49783048033714294,
+      "eval_matthews_correlation": 0.4111094454070522,
+      "eval_runtime": 0.7234,
+      "eval_samples_per_second": 1441.791,
+      "eval_steps_per_second": 91.235,
+      "step": 268
+    },
+    {
+      "epoch": 1.87,
+      "learning_rate": 7.123299677400847e-06,
+      "loss": 0.4894,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5266438126564026,
+      "eval_matthews_correlation": 0.44722803398940786,
+      "eval_runtime": 0.7661,
+      "eval_samples_per_second": 1361.434,
+      "eval_steps_per_second": 86.15,
+      "step": 536
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.4729432761669159,
+      "eval_matthews_correlation": 0.5011490576561073,
+      "eval_runtime": 0.7179,
+      "eval_samples_per_second": 1452.841,
+      "eval_steps_per_second": 91.934,
+      "step": 804
+    },
+    {
+      "epoch": 3.73,
+      "learning_rate": 2.8832403456146286e-06,
+      "loss": 0.3212,
+      "step": 1000
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 0.5100820064544678,
+      "eval_matthews_correlation": 0.5104242686414723,
+      "eval_runtime": 0.8168,
+      "eval_samples_per_second": 1276.879,
+      "eval_steps_per_second": 80.8,
+      "step": 1072
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1340,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 190621621567536.0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.1363359009187065e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-3/checkpoint-1072/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b79499fe7d2034d8df2f65fc54dbfcd286a83e4c8aaa162c7b786314e484018d
+size 4792

run-3/checkpoint-1072/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-268/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-268/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df9da5d86d23a16eca8727d004dfe63b540561578a05c9033bcea31d05e1767e
+size 267832560

run-3/checkpoint-268/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a679603d9a76cfdbe2781eaf220b8313e1d6d44585e9153d707f8f52e61d3e77
+size 535727290

run-3/checkpoint-268/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b8cfe25a915f9cc83ad71e9d831288a4edb9a530a69cb0778e7d75bb45a8399
+size 14308

run-3/checkpoint-268/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c7de586a3166598384cec9203cee7749fbf217486c3e1d29520f587dfa87956c
+size 1064

run-3/checkpoint-268/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-268/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-268/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-268/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.4111094454070522,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-268",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 268,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.49783048033714294,
+      "eval_matthews_correlation": 0.4111094454070522,
+      "eval_runtime": 0.7234,
+      "eval_samples_per_second": 1441.791,
+      "eval_steps_per_second": 91.235,
+      "step": 268
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1340,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.1363359009187065e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-3/checkpoint-268/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b79499fe7d2034d8df2f65fc54dbfcd286a83e4c8aaa162c7b786314e484018d
+size 4792

run-3/checkpoint-268/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-536/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-536/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b344648de241011aa94f996e376817a0f10aba4078d77dba6e93a40c5e7916b5
+size 267832560

run-3/checkpoint-536/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2dc4362081b09b792adf0973ce8e55644289eebb37f9ea18418bdf05f5ae24e6
+size 535727290

run-3/checkpoint-536/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5eaf189c1b343d7c12f945cff87634b5508ec0a3a9be437fac5ba23414a097e1
+size 14308

run-3/checkpoint-536/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42eb6a22f790c1818f6be136a2bf2f7a3374076047162452f27ed2546d14018d
+size 1064

run-3/checkpoint-536/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-536/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-536/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-536/trainer_state.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "best_metric": 0.44722803398940786,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-536",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 536,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.49783048033714294,
+      "eval_matthews_correlation": 0.4111094454070522,
+      "eval_runtime": 0.7234,
+      "eval_samples_per_second": 1441.791,
+      "eval_steps_per_second": 91.235,
+      "step": 268
+    },
+    {
+      "epoch": 1.87,
+      "learning_rate": 7.123299677400847e-06,
+      "loss": 0.4894,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5266438126564026,
+      "eval_matthews_correlation": 0.44722803398940786,
+      "eval_runtime": 0.7661,
+      "eval_samples_per_second": 1361.434,
+      "eval_steps_per_second": 86.15,
+      "step": 536
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1340,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 95454144648720.0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.1363359009187065e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-3/checkpoint-536/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b79499fe7d2034d8df2f65fc54dbfcd286a83e4c8aaa162c7b786314e484018d
+size 4792

run-3/checkpoint-536/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-804/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.36.2",
+  "vocab_size": 30522
+}

run-3/checkpoint-804/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d6018f5193f2bd259e1a5abc21969c8bdcc49733862c8d736396bd9e7ac48d58
+size 267832560

run-3/checkpoint-804/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:21192d208e889d8d0fb1853a20d4782a456acc266cd685f883aa64a953ce599a
+size 535727290

run-3/checkpoint-804/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b41f2ce534f4fadba8f6290aab1b81abd8b58681428b6205d4ea30dd7c33ae74
+size 14308

run-3/checkpoint-804/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:82343c51c4eb7f4880e03f8be75b76daf228610277755fe29fbef7a7e4487f81
+size 1064

run-3/checkpoint-804/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-804/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-3/checkpoint-804/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-3/checkpoint-804/trainer_state.json ADDED Viewed

	@@ -0,0 +1,59 @@

+{
+  "best_metric": 0.5011490576561073,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-3/checkpoint-804",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 804,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.49783048033714294,
+      "eval_matthews_correlation": 0.4111094454070522,
+      "eval_runtime": 0.7234,
+      "eval_samples_per_second": 1441.791,
+      "eval_steps_per_second": 91.235,
+      "step": 268
+    },
+    {
+      "epoch": 1.87,
+      "learning_rate": 7.123299677400847e-06,
+      "loss": 0.4894,
+      "step": 500
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5266438126564026,
+      "eval_matthews_correlation": 0.44722803398940786,
+      "eval_runtime": 0.7661,
+      "eval_samples_per_second": 1361.434,
+      "eval_steps_per_second": 86.15,
+      "step": 536
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.4729432761669159,
+      "eval_matthews_correlation": 0.5011490576561073,
+      "eval_runtime": 0.7179,
+      "eval_samples_per_second": 1452.841,
+      "eval_steps_per_second": 91.934,
+      "step": 804
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 1340,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 95454144648720.0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.1363359009187065e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 32,
+    "seed": 20
+  }
+}

run-3/checkpoint-804/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b79499fe7d2034d8df2f65fc54dbfcd286a83e4c8aaa162c7b786314e484018d
+size 4792

run-3/checkpoint-804/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Dec23_02-10-12_067bf7a71e5c/events.out.tfevents.1703298490.067bf7a71e5c.178.5 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb0db4d47370b4ec1da67edc9cebc83883adb9feb1e0bd3e070d654e3e36abf0
-size 5177
+oid sha256:fa403654bf2ac2814fa4b732d50c2514e693e0ba8f4096cb5b9c2316901cc15f
+size 6693