Training in progress, step 500

Browse files

Files changed (9) hide show

config.json +104 -104
model.safetensors +1 -1
preprocessor_config.json +10 -10
runs/Aug30_20-40-57_zjh/events.out.tfevents.1756557678.zjh.6440.0 +3 -0
runs/Aug30_20-55-14_zjh/events.out.tfevents.1756558533.zjh.13840.0 +3 -0
special_tokens_map.json +30 -6
tokenizer_config.json +51 -51
training_args.bin +2 -2
vocab.json +34 -34

config.json CHANGED Viewed

@@ -1,104 +1,104 @@
-{
-  "activation_dropout": 0.1,
-  "apply_spec_augment": true,
-  "architectures": [
-    "UniSpeechSatForCTC"
-  ],
-  "attention_dropout": 0.1,
-  "bos_token_id": 1,
-  "classifier_proj_size": 256,
-  "codevector_dim": 256,
-  "contrastive_logits_temperature": 0.1,
-  "conv_bias": false,
-  "conv_dim": [
-    512,
-    512,
-    512,
-    512,
-    512,
-    512,
-    512
-  ],
-  "conv_kernel": [
-    10,
-    3,
-    3,
-    3,
-    3,
-    2,
-    2
-  ],
-  "conv_stride": [
-    5,
-    2,
-    2,
-    2,
-    2,
-    2,
-    2
-  ],
-  "ctc_loss_reduction": "mean",
-  "ctc_zero_infinity": false,
-  "diversity_loss_weight": 0.1,
-  "do_stable_layer_norm": false,
-  "eos_token_id": 2,
-  "feat_extract_activation": "gelu",
-  "feat_extract_dropout": 0.0,
-  "feat_extract_norm": "group",
-  "feat_proj_dropout": 0.1,
-  "feat_quantizer_dropout": 0.0,
-  "final_dropout": 0.1,
-  "hidden_act": "gelu",
-  "hidden_dropout": 0.1,
-  "hidden_dropout_prob": 0.1,
-  "hidden_size": 768,
-  "initializer_range": 0.02,
-  "intermediate_size": 3072,
-  "layer_norm_eps": 1e-05,
-  "layerdrop": 0.1,
-  "mask_feature_length": 10,
-  "mask_feature_min_masks": 0,
-  "mask_feature_prob": 0.0,
-  "mask_time_length": 10,
-  "mask_time_min_masks": 2,
-  "mask_time_prob": 0.05,
-  "model_type": "unispeech-sat",
-  "num_attention_heads": 12,
-  "num_clusters": 504,
-  "num_codevector_groups": 2,
-  "num_codevectors_per_group": 320,
-  "num_conv_pos_embedding_groups": 16,
-  "num_conv_pos_embeddings": 128,
-  "num_feat_extract_layers": 7,
-  "num_hidden_layers": 12,
-  "num_negatives": 100,
-  "pad_token_id": 0,
-  "proj_codevector_dim": 256,
-  "tdnn_dilation": [
-    1,
-    2,
-    3,
-    1,
-    1
-  ],
-  "tdnn_dim": [
-    512,
-    512,
-    512,
-    512,
-    1500
-  ],
-  "tdnn_kernel": [
-    5,
-    3,
-    3,
-    1,
-    1
-  ],
-  "tokenizer_class": "Wav2Vec2CTCTokenizer",
-  "torch_dtype": "float32",
-  "transformers_version": "4.55.4",
-  "use_weighted_layer_sum": false,
-  "vocab_size": 32,
-  "xvector_output_dim": 512
-}

+{
+  "activation_dropout": 0.1,
+  "apply_spec_augment": true,
+  "architectures": [
+    "UniSpeechSatForCTC"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 256,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "mean",
+  "ctc_zero_infinity": false,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_dropout": 0.0,
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.1,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.1,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "unispeech-sat",
+  "num_attention_heads": 12,
+  "num_clusters": 504,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 12,
+  "num_negatives": 100,
+  "pad_token_id": 0,
+  "proj_codevector_dim": 256,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "tokenizer_class": "Wav2Vec2CTCTokenizer",
+  "torch_dtype": "float32",
+  "transformers_version": "4.51.0",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32,
+  "xvector_output_dim": 512
+}

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:77defddc818ed32ce3fc8e7d34a9f0836438e896b2f1b688076e4f125929e98f
 size 377612176

 version https://git-lfs.github.com/spec/v1
+oid sha256:7449f5c3d4a726fea7d5e044718ce92bd6538d64d2f5a28ca5f8ce90ddb7f32e
 size 377612176

preprocessor_config.json CHANGED Viewed

@@ -1,10 +1,10 @@
-{
-  "do_normalize": true,
-  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
-  "feature_size": 1,
-  "padding_side": "right",
-  "padding_value": 0,
-  "processor_class": "Wav2Vec2Processor",
-  "return_attention_mask": false,
-  "sampling_rate": 16000
-}

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "processor_class": "Wav2Vec2Processor",
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

runs/Aug30_20-40-57_zjh/events.out.tfevents.1756557678.zjh.6440.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c95212c7b40f954547156bbacb653e80e4b6a82335b8e10fb6f3f10c115c026
+size 6454

runs/Aug30_20-55-14_zjh/events.out.tfevents.1756558533.zjh.13840.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7cb5b2b2c48ccb96efce9d3a70ac5db04f01c62bc6865c55d6be3e64ed3c7487
+size 7616

special_tokens_map.json CHANGED Viewed

@@ -1,6 +1,30 @@
-{
-  "bos_token": "<s>",
-  "eos_token": "</s>",
-  "pad_token": "<pad>",
-  "unk_token": "<unk>"
-}

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": true,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": true,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": true,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": true,
+    "normalized": false,
+    "rstrip": true,
+    "single_word": false
+  }
+}

tokenizer_config.json CHANGED Viewed

@@ -1,51 +1,51 @@
-{
-  "added_tokens_decoder": {
-    "0": {
-      "content": "<pad>",
-      "lstrip": true,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": false
-    },
-    "1": {
-      "content": "<s>",
-      "lstrip": true,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": false
-    },
-    "2": {
-      "content": "</s>",
-      "lstrip": true,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": false
-    },
-    "3": {
-      "content": "<unk>",
-      "lstrip": true,
-      "normalized": false,
-      "rstrip": true,
-      "single_word": false,
-      "special": false
-    }
-  },
-  "bos_token": "<s>",
-  "clean_up_tokenization_spaces": false,
-  "do_lower_case": false,
-  "do_normalize": true,
-  "eos_token": "</s>",
-  "extra_special_tokens": {},
-  "model_max_length": 1000000000000000019884624838656,
-  "pad_token": "<pad>",
-  "processor_class": "Wav2Vec2Processor",
-  "replace_word_delimiter_char": " ",
-  "return_attention_mask": false,
-  "target_lang": null,
-  "tokenizer_class": "Wav2Vec2CTCTokenizer",
-  "unk_token": "<unk>",
-  "word_delimiter_token": "|"
-}

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<pad>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": true,
+      "single_word": false,
+      "special": false
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": true,
+      "single_word": false,
+      "special": false
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": true,
+      "single_word": false,
+      "special": false
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": true,
+      "normalized": false,
+      "rstrip": true,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "do_lower_case": false,
+  "do_normalize": true,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "processor_class": "Wav2Vec2Processor",
+  "replace_word_delimiter_char": " ",
+  "return_attention_mask": false,
+  "target_lang": null,
+  "tokenizer_class": "Wav2Vec2CTCTokenizer",
+  "unk_token": "<unk>",
+  "word_delimiter_token": "|"
+}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06eb1c8779ef8e5e3734b6722b7314ecdd2a5ec4f7bbd188e009331c4f1d0a90
-size 5777

 version https://git-lfs.github.com/spec/v1
+oid sha256:c435b9d5561145c5daeafcfeba272f458bc3f34316d2c713bfd87c43ef17f3ea
+size 5713

vocab.json CHANGED Viewed

@@ -1,34 +1,34 @@
-{
-  "'": 27,
-  "</s>": 2,
-  "<pad>": 0,
-  "<s>": 1,
-  "<unk>": 3,
-  "A": 7,
-  "B": 24,
-  "C": 19,
-  "D": 14,
-  "E": 5,
-  "F": 20,
-  "G": 21,
-  "H": 11,
-  "I": 10,
-  "J": 29,
-  "K": 26,
-  "L": 15,
-  "M": 17,
-  "N": 9,
-  "O": 8,
-  "P": 23,
-  "Q": 30,
-  "R": 13,
-  "S": 12,
-  "T": 6,
-  "U": 16,
-  "V": 25,
-  "W": 18,
-  "X": 28,
-  "Y": 22,
-  "Z": 31,
-  "|": 4
-}

+{
+  "'": 27,
+  "</s>": 2,
+  "<pad>": 0,
+  "<s>": 1,
+  "<unk>": 3,
+  "A": 7,
+  "B": 24,
+  "C": 19,
+  "D": 14,
+  "E": 5,
+  "F": 20,
+  "G": 21,
+  "H": 11,
+  "I": 10,
+  "J": 29,
+  "K": 26,
+  "L": 15,
+  "M": 17,
+  "N": 9,
+  "O": 8,
+  "P": 23,
+  "Q": 30,
+  "R": 13,
+  "S": 12,
+  "T": 6,
+  "U": 16,
+  "V": 25,
+  "W": 18,
+  "X": 28,
+  "Y": 22,
+  "Z": 31,
+  "|": 4
+}