kbwaaablya committed on May 26, 2025

Commit

4fcae93

verified ·

1 Parent(s): 60d052b

Upload folder using huggingface_hub

Browse files

Files changed (38) hide show

.gitattributes +6 -0
checkpoint-500/config.json +40 -0
checkpoint-500/generation_config.json +16 -0
checkpoint-500/model.safetensors +3 -0
checkpoint-500/optimizer.pt +3 -0
checkpoint-500/rng_state.pth +3 -0
checkpoint-500/scaler.pt +3 -0
checkpoint-500/scheduler.pt +3 -0
checkpoint-500/source.spm +3 -0
checkpoint-500/special_tokens_map.json +5 -0
checkpoint-500/target.spm +3 -0
checkpoint-500/tokenizer_config.json +39 -0
checkpoint-500/trainer_state.json +57 -0
checkpoint-500/training_args.bin +3 -0
checkpoint-500/vocab.json +0 -0
checkpoint-729/config.json +40 -0
checkpoint-729/generation_config.json +16 -0
checkpoint-729/model.safetensors +3 -0
checkpoint-729/optimizer.pt +3 -0
checkpoint-729/rng_state.pth +3 -0
checkpoint-729/scaler.pt +3 -0
checkpoint-729/scheduler.pt +3 -0
checkpoint-729/source.spm +3 -0
checkpoint-729/special_tokens_map.json +5 -0
checkpoint-729/target.spm +3 -0
checkpoint-729/tokenizer_config.json +39 -0
checkpoint-729/trainer_state.json +57 -0
checkpoint-729/training_args.bin +3 -0
checkpoint-729/vocab.json +0 -0
config.json +40 -0
generation_config.json +16 -0
model.safetensors +3 -0
source.spm +3 -0
special_tokens_map.json +5 -0
target.spm +3 -0
tokenizer_config.json +39 -0
training_args.bin +3 -0
vocab.json +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+checkpoint-500/source.spm filter=lfs diff=lfs merge=lfs -text
+checkpoint-500/target.spm filter=lfs diff=lfs merge=lfs -text
+checkpoint-729/source.spm filter=lfs diff=lfs merge=lfs -text
+checkpoint-729/target.spm filter=lfs diff=lfs merge=lfs -text
+source.spm filter=lfs diff=lfs merge=lfs -text
+target.spm filter=lfs diff=lfs merge=lfs -text

checkpoint-500/config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "relu",
+  "architectures": [
+    "MarianMTModel"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 0,
+  "classifier_dropout": 0.0,
+  "d_model": 1024,
+  "decoder_attention_heads": 16,
+  "decoder_ffn_dim": 4096,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 58297,
+  "decoder_vocab_size": 58298,
+  "dropout": 0.1,
+  "encoder_attention_heads": 16,
+  "encoder_ffn_dim": 4096,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 6,
+  "eos_token_id": 45603,
+  "forced_eos_token_id": null,
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "max_length": null,
+  "max_position_embeddings": 1024,
+  "model_type": "marian",
+  "normalize_embedding": false,
+  "num_beams": null,
+  "num_hidden_layers": 6,
+  "pad_token_id": 58297,
+  "scale_embedding": true,
+  "share_encoder_decoder_embeddings": true,
+  "static_position_embeddings": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.3",
+  "use_cache": true,
+  "vocab_size": 58298
+}

checkpoint-500/generation_config.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "bad_words_ids": [
+    [
+      58297
+    ]
+  ],
+  "bos_token_id": 0,
+  "decoder_start_token_id": 58297,
+  "eos_token_id": 45603,
+  "forced_eos_token_id": 45603,
+  "max_length": 512,
+  "num_beams": 4,
+  "pad_token_id": 58297,
+  "renormalize_logits": true,
+  "transformers_version": "4.50.3"
+}

checkpoint-500/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee650e4b0511d0e6c833c1c2b6dfa787f249add60f9af2dd63f3f0eb8e29f761
+size 944480920

checkpoint-500/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c02b58fa79aa9053d7b24bafb759a333657c4a927bd3e1146d0f7922345ecd57
+size 1888647802

checkpoint-500/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f8bd4f887a4dfc2ec04e88b27e2f24434961434651e5b601db63a08fa64cd06a
+size 14244

checkpoint-500/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bfa51e071ccffcbabecfa11f208d56e0863809bdd9bf20f7e79e215c2919b42
+size 988

checkpoint-500/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0531c4728970fe3718b0e2aea4a9f23f7f7069a53976bf37f68f21417c50bce
+size 1064

checkpoint-500/source.spm ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94634cc0b00a2a1e0e2e4317cc0a49d0154d835f7951425e45be15c72ba21417
+size 798014

checkpoint-500/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

checkpoint-500/target.spm ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25446f415fe316afbf692acf7ef5131a74940dc820e2cbe31300f09ac3c492dc
+size 838711

checkpoint-500/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "added_tokens_decoder": {
+    "45603": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "54359": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "58297": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "separate_vocabs": false,
+  "source_lang": "en",
+  "sp_model_kwargs": {},
+  "target_lang": "lv",
+  "tokenizer_class": "MarianTokenizer",
+  "unk_token": "<unk>"
+}

checkpoint-500/trainer_state.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.05761316872428,
+  "eval_steps": 500,
+  "global_step": 500,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 1.3566852807998657,
+      "eval_runtime": 0.7082,
+      "eval_samples_per_second": 611.395,
+      "eval_steps_per_second": 77.66,
+      "step": 243
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 1.2682921886444092,
+      "eval_runtime": 0.6768,
+      "eval_samples_per_second": 639.761,
+      "eval_steps_per_second": 81.263,
+      "step": 486
+    },
+    {
+      "epoch": 2.05761316872428,
+      "grad_norm": 9.423436164855957,
+      "learning_rate": 6.3374485596707825e-06,
+      "loss": 1.3704,
+      "step": 500
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 729,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 109302069067776.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-500/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1c563b600c69d2804728e9cfb80935191961a93c9761c2af118e10f951e12ea
+size 5496

checkpoint-500/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-729/config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "relu",
+  "architectures": [
+    "MarianMTModel"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 0,
+  "classifier_dropout": 0.0,
+  "d_model": 1024,
+  "decoder_attention_heads": 16,
+  "decoder_ffn_dim": 4096,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 58297,
+  "decoder_vocab_size": 58298,
+  "dropout": 0.1,
+  "encoder_attention_heads": 16,
+  "encoder_ffn_dim": 4096,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 6,
+  "eos_token_id": 45603,
+  "forced_eos_token_id": null,
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "max_length": null,
+  "max_position_embeddings": 1024,
+  "model_type": "marian",
+  "normalize_embedding": false,
+  "num_beams": null,
+  "num_hidden_layers": 6,
+  "pad_token_id": 58297,
+  "scale_embedding": true,
+  "share_encoder_decoder_embeddings": true,
+  "static_position_embeddings": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.3",
+  "use_cache": true,
+  "vocab_size": 58298
+}

checkpoint-729/generation_config.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "bad_words_ids": [
+    [
+      58297
+    ]
+  ],
+  "bos_token_id": 0,
+  "decoder_start_token_id": 58297,
+  "eos_token_id": 45603,
+  "forced_eos_token_id": 45603,
+  "max_length": 512,
+  "num_beams": 4,
+  "pad_token_id": 58297,
+  "renormalize_logits": true,
+  "transformers_version": "4.50.3"
+}

checkpoint-729/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91c70b56aa595b23fba00656eb7563993fe0e2ce84c6ef412ac70c27b876fb44
+size 944480920

checkpoint-729/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bbe389f2ec3a56a06e3783bb4c0a3e45b8a4e3d6feaac7caaf406bd9b65de030
+size 1888647802

checkpoint-729/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c646261de0de4d9659cfc4dc149e116806085fd03be89858296eef087a55b532
+size 14244

checkpoint-729/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c16a360deedb9188983d768b70e906d28bbb3555fd7a93647015ad5f43f2ccdb
+size 988

checkpoint-729/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:65ca8c525c485e92210800dd551db2d064ae323799a3c9dd02921f2b56752fe7
+size 1064

checkpoint-729/source.spm ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94634cc0b00a2a1e0e2e4317cc0a49d0154d835f7951425e45be15c72ba21417
+size 798014

checkpoint-729/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

checkpoint-729/target.spm ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25446f415fe316afbf692acf7ef5131a74940dc820e2cbe31300f09ac3c492dc
+size 838711

checkpoint-729/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "added_tokens_decoder": {
+    "45603": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "54359": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "58297": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "separate_vocabs": false,
+  "source_lang": "en",
+  "sp_model_kwargs": {},
+  "target_lang": "lv",
+  "tokenizer_class": "MarianTokenizer",
+  "unk_token": "<unk>"
+}

checkpoint-729/trainer_state.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 729,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 1.3566852807998657,
+      "eval_runtime": 0.7082,
+      "eval_samples_per_second": 611.395,
+      "eval_steps_per_second": 77.66,
+      "step": 243
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 1.2682921886444092,
+      "eval_runtime": 0.6768,
+      "eval_samples_per_second": 639.761,
+      "eval_steps_per_second": 81.263,
+      "step": 486
+    },
+    {
+      "epoch": 2.05761316872428,
+      "grad_norm": 9.423436164855957,
+      "learning_rate": 6.3374485596707825e-06,
+      "loss": 1.3704,
+      "step": 500
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 729,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 159331129491456.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-729/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1c563b600c69d2804728e9cfb80935191961a93c9761c2af118e10f951e12ea
+size 5496

checkpoint-729/vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff

config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "relu",
+  "architectures": [
+    "MarianMTModel"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 0,
+  "classifier_dropout": 0.0,
+  "d_model": 1024,
+  "decoder_attention_heads": 16,
+  "decoder_ffn_dim": 4096,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 58297,
+  "decoder_vocab_size": 58298,
+  "dropout": 0.1,
+  "encoder_attention_heads": 16,
+  "encoder_ffn_dim": 4096,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 6,
+  "eos_token_id": 45603,
+  "forced_eos_token_id": null,
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "max_length": null,
+  "max_position_embeddings": 1024,
+  "model_type": "marian",
+  "normalize_embedding": false,
+  "num_beams": null,
+  "num_hidden_layers": 6,
+  "pad_token_id": 58297,
+  "scale_embedding": true,
+  "share_encoder_decoder_embeddings": true,
+  "static_position_embeddings": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.3",
+  "use_cache": true,
+  "vocab_size": 58298
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "bad_words_ids": [
+    [
+      58297
+    ]
+  ],
+  "bos_token_id": 0,
+  "decoder_start_token_id": 58297,
+  "eos_token_id": 45603,
+  "forced_eos_token_id": 45603,
+  "max_length": 512,
+  "num_beams": 4,
+  "pad_token_id": 58297,
+  "renormalize_logits": true,
+  "transformers_version": "4.50.3"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91c70b56aa595b23fba00656eb7563993fe0e2ce84c6ef412ac70c27b876fb44
+size 944480920

source.spm ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94634cc0b00a2a1e0e2e4317cc0a49d0154d835f7951425e45be15c72ba21417
+size 798014

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

target.spm ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25446f415fe316afbf692acf7ef5131a74940dc820e2cbe31300f09ac3c492dc
+size 838711

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,39 @@

+{
+  "added_tokens_decoder": {
+    "45603": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "54359": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "58297": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "model_max_length": 512,
+  "pad_token": "<pad>",
+  "separate_vocabs": false,
+  "source_lang": "en",
+  "sp_model_kwargs": {},
+  "target_lang": "lv",
+  "tokenizer_class": "MarianTokenizer",
+  "unk_token": "<unk>"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1c563b600c69d2804728e9cfb80935191961a93c9761c2af118e10f951e12ea
+size 5496

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff