Training in progress, epoch 1, checkpoint

Browse files

Files changed (8) hide show

last-checkpoint/config.json +125 -0
last-checkpoint/model.safetensors +3 -0
last-checkpoint/optimizer.pt +3 -0
last-checkpoint/preprocessor_config.json +9 -0
last-checkpoint/rng_state.pth +3 -0
last-checkpoint/scheduler.pt +3 -0
last-checkpoint/trainer_state.json +386 -0
last-checkpoint/training_args.bin +3 -0

last-checkpoint/config.json ADDED Viewed

	@@ -0,0 +1,125 @@

+{
+  "activation_dropout": 0.0,
+  "adapter_attn_dim": null,
+  "adapter_kernel_size": 3,
+  "adapter_stride": 2,
+  "add_adapter": false,
+  "apply_spec_augment": true,
+  "architectures": [
+    "Wav2Vec2ForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "codevector_dim": 256,
+  "contrastive_logits_temperature": 0.1,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "diversity_loss_weight": 0.1,
+  "do_stable_layer_norm": false,
+  "dtype": "float32",
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.1,
+  "feat_quantizer_dropout": 0.0,
+  "final_dropout": 0.0,
+  "freeze_feat_extract_train": true,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "fake",
+    "1": "real"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "fake": "0",
+    "real": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_channel_length": 10,
+  "mask_channel_min_space": 1,
+  "mask_channel_other": 0.0,
+  "mask_channel_prob": 0.0,
+  "mask_channel_selection": "static",
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_min_space": 1,
+  "mask_time_other": 0.0,
+  "mask_time_prob": 0.05,
+  "mask_time_selection": "static",
+  "model_type": "wav2vec2",
+  "no_mask_channel_overlap": false,
+  "no_mask_time_overlap": false,
+  "num_adapter_layers": 3,
+  "num_attention_heads": 12,
+  "num_codevector_groups": 2,
+  "num_codevectors_per_group": 320,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 12,
+  "num_negatives": 100,
+  "output_hidden_size": 768,
+  "pad_token_id": 0,
+  "proj_codevector_dim": 256,
+  "tdnn_dilation": [
+    1,
+    2,
+    3,
+    1,
+    1
+  ],
+  "tdnn_dim": [
+    512,
+    512,
+    512,
+    512,
+    1500
+  ],
+  "tdnn_kernel": [
+    5,
+    3,
+    3,
+    1,
+    1
+  ],
+  "transformers_version": "4.57.3",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32,
+  "xvector_output_dim": 512
+}

last-checkpoint/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:61f046095e067203694eb7ac3b56101f802c222508ff36c0e8a4fbc1f72d4125
+size 378302360

last-checkpoint/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3789a0f05d3e97624e349985237e00b70832481cd75b893e1d50304972007da2
+size 756732602

last-checkpoint/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": true,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0.0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

last-checkpoint/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca69c562ea24f9a8a4e249ce778e6aa3dd1db2c84993f5499e5f9500d2edad8e
+size 14308

last-checkpoint/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5699a0932df3dd97f15fcfcceb2d361d521d7117e842cbdb8f8aaaa5ca19c383
+size 1064

last-checkpoint/trainer_state.json ADDED Viewed

	@@ -0,0 +1,386 @@

+{
+  "best_global_step": 496,
+  "best_metric": 0.5052976791120081,
+  "best_model_checkpoint": "Deeepfake-audio-Recognition/checkpoint-496",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 496,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.020181634712411706,
+      "grad_norm": 0.6100882291793823,
+      "learning_rate": 5.399999999999999e-05,
+      "loss": 0.6925,
+      "step": 10
+    },
+    {
+      "epoch": 0.04036326942482341,
+      "grad_norm": 4.445184230804443,
+      "learning_rate": 0.00011399999999999999,
+      "loss": 0.6948,
+      "step": 20
+    },
+    {
+      "epoch": 0.060544904137235116,
+      "grad_norm": 2.134990692138672,
+      "learning_rate": 0.00017399999999999997,
+      "loss": 0.6859,
+      "step": 30
+    },
+    {
+      "epoch": 0.08072653884964683,
+      "grad_norm": 0.7902814149856567,
+      "learning_rate": 0.000234,
+      "loss": 0.7172,
+      "step": 40
+    },
+    {
+      "epoch": 0.10090817356205853,
+      "grad_norm": 0.5187829732894897,
+      "learning_rate": 0.000294,
+      "loss": 0.698,
+      "step": 50
+    },
+    {
+      "epoch": 0.12108980827447023,
+      "grad_norm": 0.06201840192079544,
+      "learning_rate": 0.00029394618834080715,
+      "loss": 0.6939,
+      "step": 60
+    },
+    {
+      "epoch": 0.14127144298688193,
+      "grad_norm": 0.3845376968383789,
+      "learning_rate": 0.000287219730941704,
+      "loss": 0.6893,
+      "step": 70
+    },
+    {
+      "epoch": 0.16145307769929365,
+      "grad_norm": 0.10666169226169586,
+      "learning_rate": 0.0002804932735426009,
+      "loss": 0.6989,
+      "step": 80
+    },
+    {
+      "epoch": 0.18163471241170534,
+      "grad_norm": 0.0453961119055748,
+      "learning_rate": 0.0002737668161434977,
+      "loss": 0.6962,
+      "step": 90
+    },
+    {
+      "epoch": 0.20181634712411706,
+      "grad_norm": 0.3139711320400238,
+      "learning_rate": 0.0002670403587443946,
+      "loss": 0.6969,
+      "step": 100
+    },
+    {
+      "epoch": 0.22199798183652875,
+      "grad_norm": 0.08844541013240814,
+      "learning_rate": 0.00026031390134529145,
+      "loss": 0.6895,
+      "step": 110
+    },
+    {
+      "epoch": 0.24217961654894046,
+      "grad_norm": 0.21342194080352783,
+      "learning_rate": 0.0002535874439461883,
+      "loss": 0.6964,
+      "step": 120
+    },
+    {
+      "epoch": 0.2623612512613522,
+      "grad_norm": 0.21850763261318207,
+      "learning_rate": 0.0002468609865470852,
+      "loss": 0.6946,
+      "step": 130
+    },
+    {
+      "epoch": 0.28254288597376387,
+      "grad_norm": 0.3530184328556061,
+      "learning_rate": 0.00024013452914798202,
+      "loss": 0.6928,
+      "step": 140
+    },
+    {
+      "epoch": 0.30272452068617556,
+      "grad_norm": 0.11930827051401138,
+      "learning_rate": 0.00023340807174887892,
+      "loss": 0.6951,
+      "step": 150
+    },
+    {
+      "epoch": 0.3229061553985873,
+      "grad_norm": 0.25173401832580566,
+      "learning_rate": 0.00022668161434977576,
+      "loss": 0.6934,
+      "step": 160
+    },
+    {
+      "epoch": 0.343087790110999,
+      "grad_norm": 0.25978365540504456,
+      "learning_rate": 0.00021995515695067262,
+      "loss": 0.6947,
+      "step": 170
+    },
+    {
+      "epoch": 0.3632694248234107,
+      "grad_norm": 0.07770789414644241,
+      "learning_rate": 0.00021322869955156952,
+      "loss": 0.6936,
+      "step": 180
+    },
+    {
+      "epoch": 0.3834510595358224,
+      "grad_norm": 0.01727680303156376,
+      "learning_rate": 0.00020650224215246636,
+      "loss": 0.6939,
+      "step": 190
+    },
+    {
+      "epoch": 0.4036326942482341,
+      "grad_norm": 0.11968690156936646,
+      "learning_rate": 0.00019977578475336322,
+      "loss": 0.6938,
+      "step": 200
+    },
+    {
+      "epoch": 0.4238143289606458,
+      "grad_norm": 0.21573954820632935,
+      "learning_rate": 0.00019304932735426006,
+      "loss": 0.6891,
+      "step": 210
+    },
+    {
+      "epoch": 0.4439959636730575,
+      "grad_norm": 0.2965114414691925,
+      "learning_rate": 0.00018632286995515693,
+      "loss": 0.7002,
+      "step": 220
+    },
+    {
+      "epoch": 0.46417759838546924,
+      "grad_norm": 0.21291188895702362,
+      "learning_rate": 0.0001795964125560538,
+      "loss": 0.6933,
+      "step": 230
+    },
+    {
+      "epoch": 0.4843592330978809,
+      "grad_norm": 0.19937728345394135,
+      "learning_rate": 0.00017286995515695066,
+      "loss": 0.693,
+      "step": 240
+    },
+    {
+      "epoch": 0.5045408678102926,
+      "grad_norm": 0.13156402111053467,
+      "learning_rate": 0.00016614349775784752,
+      "loss": 0.6934,
+      "step": 250
+    },
+    {
+      "epoch": 0.5247225025227044,
+      "grad_norm": 0.521071195602417,
+      "learning_rate": 0.00015941704035874436,
+      "loss": 0.6951,
+      "step": 260
+    },
+    {
+      "epoch": 0.544904137235116,
+      "grad_norm": 0.09291291236877441,
+      "learning_rate": 0.00015269058295964126,
+      "loss": 0.6924,
+      "step": 270
+    },
+    {
+      "epoch": 0.5650857719475277,
+      "grad_norm": 0.023215485736727715,
+      "learning_rate": 0.0001459641255605381,
+      "loss": 0.6983,
+      "step": 280
+    },
+    {
+      "epoch": 0.5852674066599395,
+      "grad_norm": 0.3948315978050232,
+      "learning_rate": 0.00013923766816143496,
+      "loss": 0.6927,
+      "step": 290
+    },
+    {
+      "epoch": 0.6054490413723511,
+      "grad_norm": 0.20814433693885803,
+      "learning_rate": 0.00013251121076233183,
+      "loss": 0.6944,
+      "step": 300
+    },
+    {
+      "epoch": 0.6256306760847629,
+      "grad_norm": 0.47286856174468994,
+      "learning_rate": 0.0001257847533632287,
+      "loss": 0.6932,
+      "step": 310
+    },
+    {
+      "epoch": 0.6458123107971746,
+      "grad_norm": 0.19758112728595734,
+      "learning_rate": 0.00011905829596412555,
+      "loss": 0.6933,
+      "step": 320
+    },
+    {
+      "epoch": 0.6659939455095862,
+      "grad_norm": 0.20121727883815765,
+      "learning_rate": 0.00011233183856502243,
+      "loss": 0.6933,
+      "step": 330
+    },
+    {
+      "epoch": 0.686175580221998,
+      "grad_norm": 0.02322172187268734,
+      "learning_rate": 0.00010560538116591928,
+      "loss": 0.6929,
+      "step": 340
+    },
+    {
+      "epoch": 0.7063572149344097,
+      "grad_norm": 0.10014554113149643,
+      "learning_rate": 9.887892376681613e-05,
+      "loss": 0.6923,
+      "step": 350
+    },
+    {
+      "epoch": 0.7265388496468214,
+      "grad_norm": 0.09777415543794632,
+      "learning_rate": 9.2152466367713e-05,
+      "loss": 0.6925,
+      "step": 360
+    },
+    {
+      "epoch": 0.7467204843592331,
+      "grad_norm": 0.1630220115184784,
+      "learning_rate": 8.542600896860985e-05,
+      "loss": 0.6947,
+      "step": 370
+    },
+    {
+      "epoch": 0.7669021190716448,
+      "grad_norm": 0.10113658010959625,
+      "learning_rate": 7.869955156950672e-05,
+      "loss": 0.6911,
+      "step": 380
+    },
+    {
+      "epoch": 0.7870837537840565,
+      "grad_norm": 0.23644621670246124,
+      "learning_rate": 7.197309417040358e-05,
+      "loss": 0.6949,
+      "step": 390
+    },
+    {
+      "epoch": 0.8072653884964682,
+      "grad_norm": 0.0247635617852211,
+      "learning_rate": 6.524663677130043e-05,
+      "loss": 0.6928,
+      "step": 400
+    },
+    {
+      "epoch": 0.82744702320888,
+      "grad_norm": 0.04597044363617897,
+      "learning_rate": 5.852017937219731e-05,
+      "loss": 0.6931,
+      "step": 410
+    },
+    {
+      "epoch": 0.8476286579212916,
+      "grad_norm": 0.10972382128238678,
+      "learning_rate": 5.1793721973094166e-05,
+      "loss": 0.6922,
+      "step": 420
+    },
+    {
+      "epoch": 0.8678102926337034,
+      "grad_norm": 0.026838891208171844,
+      "learning_rate": 4.5067264573991026e-05,
+      "loss": 0.6933,
+      "step": 430
+    },
+    {
+      "epoch": 0.887991927346115,
+      "grad_norm": 0.04809186980128288,
+      "learning_rate": 3.834080717488789e-05,
+      "loss": 0.6934,
+      "step": 440
+    },
+    {
+      "epoch": 0.9081735620585267,
+      "grad_norm": 0.05220267176628113,
+      "learning_rate": 3.161434977578475e-05,
+      "loss": 0.6942,
+      "step": 450
+    },
+    {
+      "epoch": 0.9283551967709385,
+      "grad_norm": 0.0148994205519557,
+      "learning_rate": 2.4887892376681614e-05,
+      "loss": 0.6936,
+      "step": 460
+    },
+    {
+      "epoch": 0.9485368314833501,
+      "grad_norm": 0.07287449389696121,
+      "learning_rate": 1.8161434977578473e-05,
+      "loss": 0.6932,
+      "step": 470
+    },
+    {
+      "epoch": 0.9687184661957619,
+      "grad_norm": 0.21053215861320496,
+      "learning_rate": 1.1434977578475336e-05,
+      "loss": 0.6926,
+      "step": 480
+    },
+    {
+      "epoch": 0.9889001009081736,
+      "grad_norm": 0.1443960815668106,
+      "learning_rate": 4.708520179372197e-06,
+      "loss": 0.694,
+      "step": 490
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.5052976791120081,
+      "eval_loss": 0.693091094493866,
+      "eval_runtime": 89.1283,
+      "eval_samples_per_second": 44.475,
+      "eval_steps_per_second": 5.565,
+      "step": 496
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 496,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.4392356324192e+17,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

last-checkpoint/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0317a4be8305d7c63b70fad14cde7804b597568fd2181ea062cb92553a0917d9
+size 5496