Floressek committed on Nov 14, 2025

Commit

b2bc225

verified ·

1 Parent(s): 193c905

Upload folder using huggingface_hub

Browse files

Files changed (36) hide show

.gitattributes +1 -0
.hfignore +13 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/config.json +24 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/model.safetensors +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/optimizer.pt +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/rng_state.pth +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/scaler.pt +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/scheduler.pt +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/special_tokens_map.json +7 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/tokenizer.json +0 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/tokenizer_config.json +56 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/trainer_state.json +324 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/training_args.bin +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-4092/vocab.txt +0 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/config.json +24 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/model.safetensors +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/optimizer.pt +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/rng_state.pth +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/scaler.pt +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/scheduler.pt +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/special_tokens_map.json +7 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/tokenizer.json +0 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/tokenizer_config.json +56 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/trainer_state.json +621 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/training_args.bin +3 -0
Floressek/sentiment_classification_from_distillbert/checkpoint-8184/vocab.txt +0 -0
Floressek/sentiment_classification_from_distillbert/config.json +24 -0
Floressek/sentiment_classification_from_distillbert/model.safetensors +3 -0
Floressek/sentiment_classification_from_distillbert/special_tokens_map.json +7 -0
Floressek/sentiment_classification_from_distillbert/tokenizer.json +0 -0
Floressek/sentiment_classification_from_distillbert/tokenizer_config.json +56 -0
Floressek/sentiment_classification_from_distillbert/training_args.bin +3 -0
Floressek/sentiment_classification_from_distillbert/vocab.txt +0 -0
Szymon_Florek_Model_fine_tuning.ipynb +1145 -0
data/Amazon_Unlocked_Mobile.csv +3 -0
data/Amazon_Unlocked_Mobile.csv.zip +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+data/Amazon_Unlocked_Mobile.csv filter=lfs diff=lfs merge=lfs -text

.hfignore ADDED Viewed

	@@ -0,0 +1,13 @@

+.venv/
+.git/
+**/__pycache__/
+**/*.pyc
+**/*.pyd
+**/*.so
+**/*.parquet
+**/*.zip
+**/*.whl
+data/
+datasets/
+notebooks/
+tests/

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/config.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "dtype": "float32",
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "transformers_version": "4.57.1",
+  "vocab_size": 30522
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48f53c9337700718dfe05b128baaf117bd0426c55a2997dcb5eba2a6ece8b78a
+size 267832560

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d60dd26e70b6b195af77ec24609240dc615fa06373e1041dbb7d954caac63ab9
+size 535727755

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:33b3fc4dc6e72c19b95ccc6bf2103e72921fd75896fc4bef7c6d974ba74630e9
+size 14645

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:484e81aa45a06ff82acc987feb7e25bd65f6d761d4b270f18fa3fdb66af71f57
+size 1383

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad6350ab52d6a97e61162b0ff6ee33357b33b4a128de1a32409ac383b24e0b81
+size 1465

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/trainer_state.json ADDED Viewed

	@@ -0,0 +1,324 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 4092,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.024437927663734114,
+      "grad_norm": 4.433139801025391,
+      "learning_rate": 1.9760508308895406e-05,
+      "loss": 0.2466,
+      "step": 100
+    },
+    {
+      "epoch": 0.04887585532746823,
+      "grad_norm": 2.9566471576690674,
+      "learning_rate": 1.9516129032258068e-05,
+      "loss": 0.0958,
+      "step": 200
+    },
+    {
+      "epoch": 0.07331378299120235,
+      "grad_norm": 3.056684732437134,
+      "learning_rate": 1.9271749755620726e-05,
+      "loss": 0.0854,
+      "step": 300
+    },
+    {
+      "epoch": 0.09775171065493646,
+      "grad_norm": 0.7034033536911011,
+      "learning_rate": 1.9027370478983384e-05,
+      "loss": 0.0854,
+      "step": 400
+    },
+    {
+      "epoch": 0.12218963831867058,
+      "grad_norm": 2.2177963256835938,
+      "learning_rate": 1.8782991202346042e-05,
+      "loss": 0.0851,
+      "step": 500
+    },
+    {
+      "epoch": 0.1466275659824047,
+      "grad_norm": 0.9197642803192139,
+      "learning_rate": 1.85386119257087e-05,
+      "loss": 0.0802,
+      "step": 600
+    },
+    {
+      "epoch": 0.1710654936461388,
+      "grad_norm": 2.132237672805786,
+      "learning_rate": 1.829423264907136e-05,
+      "loss": 0.068,
+      "step": 700
+    },
+    {
+      "epoch": 0.19550342130987292,
+      "grad_norm": 1.3075214624404907,
+      "learning_rate": 1.804985337243402e-05,
+      "loss": 0.0679,
+      "step": 800
+    },
+    {
+      "epoch": 0.21994134897360704,
+      "grad_norm": 2.7458581924438477,
+      "learning_rate": 1.7805474095796678e-05,
+      "loss": 0.0698,
+      "step": 900
+    },
+    {
+      "epoch": 0.24437927663734116,
+      "grad_norm": 1.7474775314331055,
+      "learning_rate": 1.7561094819159336e-05,
+      "loss": 0.0647,
+      "step": 1000
+    },
+    {
+      "epoch": 0.26881720430107525,
+      "grad_norm": 3.5915794372558594,
+      "learning_rate": 1.7316715542521995e-05,
+      "loss": 0.0598,
+      "step": 1100
+    },
+    {
+      "epoch": 0.2932551319648094,
+      "grad_norm": 0.5882957577705383,
+      "learning_rate": 1.7072336265884656e-05,
+      "loss": 0.0635,
+      "step": 1200
+    },
+    {
+      "epoch": 0.3176930596285435,
+      "grad_norm": 3.578653335571289,
+      "learning_rate": 1.6827956989247314e-05,
+      "loss": 0.0666,
+      "step": 1300
+    },
+    {
+      "epoch": 0.3421309872922776,
+      "grad_norm": 0.5485109090805054,
+      "learning_rate": 1.6583577712609973e-05,
+      "loss": 0.0583,
+      "step": 1400
+    },
+    {
+      "epoch": 0.36656891495601174,
+      "grad_norm": 0.6193661689758301,
+      "learning_rate": 1.633919843597263e-05,
+      "loss": 0.0637,
+      "step": 1500
+    },
+    {
+      "epoch": 0.39100684261974583,
+      "grad_norm": 0.11104666441679001,
+      "learning_rate": 1.609481915933529e-05,
+      "loss": 0.0505,
+      "step": 1600
+    },
+    {
+      "epoch": 0.41544477028348,
+      "grad_norm": 0.13834528625011444,
+      "learning_rate": 1.5850439882697947e-05,
+      "loss": 0.0535,
+      "step": 1700
+    },
+    {
+      "epoch": 0.4398826979472141,
+      "grad_norm": 0.19737549126148224,
+      "learning_rate": 1.5606060606060605e-05,
+      "loss": 0.0503,
+      "step": 1800
+    },
+    {
+      "epoch": 0.46432062561094817,
+      "grad_norm": 5.043758392333984,
+      "learning_rate": 1.5361681329423267e-05,
+      "loss": 0.0512,
+      "step": 1900
+    },
+    {
+      "epoch": 0.4887585532746823,
+      "grad_norm": 0.07497064024209976,
+      "learning_rate": 1.5117302052785925e-05,
+      "loss": 0.0526,
+      "step": 2000
+    },
+    {
+      "epoch": 0.5131964809384164,
+      "grad_norm": 1.9213156700134277,
+      "learning_rate": 1.4872922776148583e-05,
+      "loss": 0.051,
+      "step": 2100
+    },
+    {
+      "epoch": 0.5376344086021505,
+      "grad_norm": 1.2963168621063232,
+      "learning_rate": 1.4628543499511243e-05,
+      "loss": 0.0429,
+      "step": 2200
+    },
+    {
+      "epoch": 0.5620723362658846,
+      "grad_norm": 1.5551583766937256,
+      "learning_rate": 1.4384164222873903e-05,
+      "loss": 0.0602,
+      "step": 2300
+    },
+    {
+      "epoch": 0.5865102639296188,
+      "grad_norm": 2.956341028213501,
+      "learning_rate": 1.4139784946236561e-05,
+      "loss": 0.0564,
+      "step": 2400
+    },
+    {
+      "epoch": 0.6109481915933529,
+      "grad_norm": 0.2880280911922455,
+      "learning_rate": 1.3895405669599221e-05,
+      "loss": 0.0425,
+      "step": 2500
+    },
+    {
+      "epoch": 0.635386119257087,
+      "grad_norm": 0.6562920808792114,
+      "learning_rate": 1.3651026392961877e-05,
+      "loss": 0.0456,
+      "step": 2600
+    },
+    {
+      "epoch": 0.6598240469208211,
+      "grad_norm": 0.09532313793897629,
+      "learning_rate": 1.3406647116324536e-05,
+      "loss": 0.051,
+      "step": 2700
+    },
+    {
+      "epoch": 0.6842619745845552,
+      "grad_norm": 2.781747817993164,
+      "learning_rate": 1.3162267839687195e-05,
+      "loss": 0.0512,
+      "step": 2800
+    },
+    {
+      "epoch": 0.7086999022482894,
+      "grad_norm": 2.1303281784057617,
+      "learning_rate": 1.2917888563049854e-05,
+      "loss": 0.0519,
+      "step": 2900
+    },
+    {
+      "epoch": 0.7331378299120235,
+      "grad_norm": 0.10773918032646179,
+      "learning_rate": 1.2673509286412513e-05,
+      "loss": 0.042,
+      "step": 3000
+    },
+    {
+      "epoch": 0.7575757575757576,
+      "grad_norm": 0.533173143863678,
+      "learning_rate": 1.2429130009775172e-05,
+      "loss": 0.0569,
+      "step": 3100
+    },
+    {
+      "epoch": 0.7820136852394917,
+      "grad_norm": 2.882176637649536,
+      "learning_rate": 1.2184750733137831e-05,
+      "loss": 0.0421,
+      "step": 3200
+    },
+    {
+      "epoch": 0.8064516129032258,
+      "grad_norm": 5.4323530197143555,
+      "learning_rate": 1.194037145650049e-05,
+      "loss": 0.0458,
+      "step": 3300
+    },
+    {
+      "epoch": 0.83088954056696,
+      "grad_norm": 0.08420676738023758,
+      "learning_rate": 1.169599217986315e-05,
+      "loss": 0.0432,
+      "step": 3400
+    },
+    {
+      "epoch": 0.855327468230694,
+      "grad_norm": 3.6947717666625977,
+      "learning_rate": 1.1451612903225808e-05,
+      "loss": 0.0387,
+      "step": 3500
+    },
+    {
+      "epoch": 0.8797653958944281,
+      "grad_norm": 4.411167621612549,
+      "learning_rate": 1.1209677419354839e-05,
+      "loss": 0.0515,
+      "step": 3600
+    },
+    {
+      "epoch": 0.9042033235581622,
+      "grad_norm": 3.9330861568450928,
+      "learning_rate": 1.0965298142717497e-05,
+      "loss": 0.0368,
+      "step": 3700
+    },
+    {
+      "epoch": 0.9286412512218963,
+      "grad_norm": 0.9437419772148132,
+      "learning_rate": 1.0720918866080157e-05,
+      "loss": 0.0479,
+      "step": 3800
+    },
+    {
+      "epoch": 0.9530791788856305,
+      "grad_norm": 1.0870046615600586,
+      "learning_rate": 1.0476539589442815e-05,
+      "loss": 0.0426,
+      "step": 3900
+    },
+    {
+      "epoch": 0.9775171065493646,
+      "grad_norm": 3.1951255798339844,
+      "learning_rate": 1.0232160312805475e-05,
+      "loss": 0.0432,
+      "step": 4000
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9891518737672583,
+      "eval_f1": 0.9928387101834639,
+      "eval_loss": 0.04053397476673126,
+      "eval_runtime": 158.0778,
+      "eval_samples_per_second": 532.409,
+      "eval_steps_per_second": 11.096,
+      "step": 4092
+    }
+  ],
+  "logging_steps": 100,
+  "max_steps": 8184,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.6013285411072e+16,
+  "train_batch_size": 48,
+  "trial_name": null,
+  "trial_params": null
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c534883427a071f1d9f3ba8e1a112e5e016307e4c8c2c116719a636f815013c
+size 5841

Floressek/sentiment_classification_from_distillbert/checkpoint-4092/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/config.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "dtype": "float32",
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "transformers_version": "4.57.1",
+  "vocab_size": 30522
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5ef48f63397444fab7fe77a7c3e8113768986ff1c8e5e9126a66727aa030ec64
+size 267832560

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:223c1ad8c221cdb8480bd0fbf758bce16ab32234cf8f118612402b10534a701a
+size 535727755

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1344599c19119661a23b30409dd058766623df54c92c90cfbddc059d4d9b8506
+size 14645

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c83094e856654a01b4be2edab3b20eb796b993d8a6bc80224e3383365e815ba
+size 1383

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd6f8ed4f35d1035d3220bdfe3aa23843396e8ea037faf54ec8c9dc5fe556d41
+size 1465

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/trainer_state.json ADDED Viewed

	@@ -0,0 +1,621 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 8184,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.024437927663734114,
+      "grad_norm": 4.433139801025391,
+      "learning_rate": 1.9760508308895406e-05,
+      "loss": 0.2466,
+      "step": 100
+    },
+    {
+      "epoch": 0.04887585532746823,
+      "grad_norm": 2.9566471576690674,
+      "learning_rate": 1.9516129032258068e-05,
+      "loss": 0.0958,
+      "step": 200
+    },
+    {
+      "epoch": 0.07331378299120235,
+      "grad_norm": 3.056684732437134,
+      "learning_rate": 1.9271749755620726e-05,
+      "loss": 0.0854,
+      "step": 300
+    },
+    {
+      "epoch": 0.09775171065493646,
+      "grad_norm": 0.7034033536911011,
+      "learning_rate": 1.9027370478983384e-05,
+      "loss": 0.0854,
+      "step": 400
+    },
+    {
+      "epoch": 0.12218963831867058,
+      "grad_norm": 2.2177963256835938,
+      "learning_rate": 1.8782991202346042e-05,
+      "loss": 0.0851,
+      "step": 500
+    },
+    {
+      "epoch": 0.1466275659824047,
+      "grad_norm": 0.9197642803192139,
+      "learning_rate": 1.85386119257087e-05,
+      "loss": 0.0802,
+      "step": 600
+    },
+    {
+      "epoch": 0.1710654936461388,
+      "grad_norm": 2.132237672805786,
+      "learning_rate": 1.829423264907136e-05,
+      "loss": 0.068,
+      "step": 700
+    },
+    {
+      "epoch": 0.19550342130987292,
+      "grad_norm": 1.3075214624404907,
+      "learning_rate": 1.804985337243402e-05,
+      "loss": 0.0679,
+      "step": 800
+    },
+    {
+      "epoch": 0.21994134897360704,
+      "grad_norm": 2.7458581924438477,
+      "learning_rate": 1.7805474095796678e-05,
+      "loss": 0.0698,
+      "step": 900
+    },
+    {
+      "epoch": 0.24437927663734116,
+      "grad_norm": 1.7474775314331055,
+      "learning_rate": 1.7561094819159336e-05,
+      "loss": 0.0647,
+      "step": 1000
+    },
+    {
+      "epoch": 0.26881720430107525,
+      "grad_norm": 3.5915794372558594,
+      "learning_rate": 1.7316715542521995e-05,
+      "loss": 0.0598,
+      "step": 1100
+    },
+    {
+      "epoch": 0.2932551319648094,
+      "grad_norm": 0.5882957577705383,
+      "learning_rate": 1.7072336265884656e-05,
+      "loss": 0.0635,
+      "step": 1200
+    },
+    {
+      "epoch": 0.3176930596285435,
+      "grad_norm": 3.578653335571289,
+      "learning_rate": 1.6827956989247314e-05,
+      "loss": 0.0666,
+      "step": 1300
+    },
+    {
+      "epoch": 0.3421309872922776,
+      "grad_norm": 0.5485109090805054,
+      "learning_rate": 1.6583577712609973e-05,
+      "loss": 0.0583,
+      "step": 1400
+    },
+    {
+      "epoch": 0.36656891495601174,
+      "grad_norm": 0.6193661689758301,
+      "learning_rate": 1.633919843597263e-05,
+      "loss": 0.0637,
+      "step": 1500
+    },
+    {
+      "epoch": 0.39100684261974583,
+      "grad_norm": 0.11104666441679001,
+      "learning_rate": 1.609481915933529e-05,
+      "loss": 0.0505,
+      "step": 1600
+    },
+    {
+      "epoch": 0.41544477028348,
+      "grad_norm": 0.13834528625011444,
+      "learning_rate": 1.5850439882697947e-05,
+      "loss": 0.0535,
+      "step": 1700
+    },
+    {
+      "epoch": 0.4398826979472141,
+      "grad_norm": 0.19737549126148224,
+      "learning_rate": 1.5606060606060605e-05,
+      "loss": 0.0503,
+      "step": 1800
+    },
+    {
+      "epoch": 0.46432062561094817,
+      "grad_norm": 5.043758392333984,
+      "learning_rate": 1.5361681329423267e-05,
+      "loss": 0.0512,
+      "step": 1900
+    },
+    {
+      "epoch": 0.4887585532746823,
+      "grad_norm": 0.07497064024209976,
+      "learning_rate": 1.5117302052785925e-05,
+      "loss": 0.0526,
+      "step": 2000
+    },
+    {
+      "epoch": 0.5131964809384164,
+      "grad_norm": 1.9213156700134277,
+      "learning_rate": 1.4872922776148583e-05,
+      "loss": 0.051,
+      "step": 2100
+    },
+    {
+      "epoch": 0.5376344086021505,
+      "grad_norm": 1.2963168621063232,
+      "learning_rate": 1.4628543499511243e-05,
+      "loss": 0.0429,
+      "step": 2200
+    },
+    {
+      "epoch": 0.5620723362658846,
+      "grad_norm": 1.5551583766937256,
+      "learning_rate": 1.4384164222873903e-05,
+      "loss": 0.0602,
+      "step": 2300
+    },
+    {
+      "epoch": 0.5865102639296188,
+      "grad_norm": 2.956341028213501,
+      "learning_rate": 1.4139784946236561e-05,
+      "loss": 0.0564,
+      "step": 2400
+    },
+    {
+      "epoch": 0.6109481915933529,
+      "grad_norm": 0.2880280911922455,
+      "learning_rate": 1.3895405669599221e-05,
+      "loss": 0.0425,
+      "step": 2500
+    },
+    {
+      "epoch": 0.635386119257087,
+      "grad_norm": 0.6562920808792114,
+      "learning_rate": 1.3651026392961877e-05,
+      "loss": 0.0456,
+      "step": 2600
+    },
+    {
+      "epoch": 0.6598240469208211,
+      "grad_norm": 0.09532313793897629,
+      "learning_rate": 1.3406647116324536e-05,
+      "loss": 0.051,
+      "step": 2700
+    },
+    {
+      "epoch": 0.6842619745845552,
+      "grad_norm": 2.781747817993164,
+      "learning_rate": 1.3162267839687195e-05,
+      "loss": 0.0512,
+      "step": 2800
+    },
+    {
+      "epoch": 0.7086999022482894,
+      "grad_norm": 2.1303281784057617,
+      "learning_rate": 1.2917888563049854e-05,
+      "loss": 0.0519,
+      "step": 2900
+    },
+    {
+      "epoch": 0.7331378299120235,
+      "grad_norm": 0.10773918032646179,
+      "learning_rate": 1.2673509286412513e-05,
+      "loss": 0.042,
+      "step": 3000
+    },
+    {
+      "epoch": 0.7575757575757576,
+      "grad_norm": 0.533173143863678,
+      "learning_rate": 1.2429130009775172e-05,
+      "loss": 0.0569,
+      "step": 3100
+    },
+    {
+      "epoch": 0.7820136852394917,
+      "grad_norm": 2.882176637649536,
+      "learning_rate": 1.2184750733137831e-05,
+      "loss": 0.0421,
+      "step": 3200
+    },
+    {
+      "epoch": 0.8064516129032258,
+      "grad_norm": 5.4323530197143555,
+      "learning_rate": 1.194037145650049e-05,
+      "loss": 0.0458,
+      "step": 3300
+    },
+    {
+      "epoch": 0.83088954056696,
+      "grad_norm": 0.08420676738023758,
+      "learning_rate": 1.169599217986315e-05,
+      "loss": 0.0432,
+      "step": 3400
+    },
+    {
+      "epoch": 0.855327468230694,
+      "grad_norm": 3.6947717666625977,
+      "learning_rate": 1.1451612903225808e-05,
+      "loss": 0.0387,
+      "step": 3500
+    },
+    {
+      "epoch": 0.8797653958944281,
+      "grad_norm": 4.411167621612549,
+      "learning_rate": 1.1209677419354839e-05,
+      "loss": 0.0515,
+      "step": 3600
+    },
+    {
+      "epoch": 0.9042033235581622,
+      "grad_norm": 3.9330861568450928,
+      "learning_rate": 1.0965298142717497e-05,
+      "loss": 0.0368,
+      "step": 3700
+    },
+    {
+      "epoch": 0.9286412512218963,
+      "grad_norm": 0.9437419772148132,
+      "learning_rate": 1.0720918866080157e-05,
+      "loss": 0.0479,
+      "step": 3800
+    },
+    {
+      "epoch": 0.9530791788856305,
+      "grad_norm": 1.0870046615600586,
+      "learning_rate": 1.0476539589442815e-05,
+      "loss": 0.0426,
+      "step": 3900
+    },
+    {
+      "epoch": 0.9775171065493646,
+      "grad_norm": 3.1951255798339844,
+      "learning_rate": 1.0232160312805475e-05,
+      "loss": 0.0432,
+      "step": 4000
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9891518737672583,
+      "eval_f1": 0.9928387101834639,
+      "eval_loss": 0.04053397476673126,
+      "eval_runtime": 158.0778,
+      "eval_samples_per_second": 532.409,
+      "eval_steps_per_second": 11.096,
+      "step": 4092
+    },
+    {
+      "epoch": 1.0019550342130987,
+      "grad_norm": 0.5268033146858215,
+      "learning_rate": 9.987781036168133e-06,
+      "loss": 0.0386,
+      "step": 4100
+    },
+    {
+      "epoch": 1.0263929618768328,
+      "grad_norm": 0.3988477289676666,
+      "learning_rate": 9.743401759530793e-06,
+      "loss": 0.0224,
+      "step": 4200
+    },
+    {
+      "epoch": 1.050830889540567,
+      "grad_norm": 0.031836945563554764,
+      "learning_rate": 9.499022482893451e-06,
+      "loss": 0.0344,
+      "step": 4300
+    },
+    {
+      "epoch": 1.075268817204301,
+      "grad_norm": 1.4545081853866577,
+      "learning_rate": 9.25464320625611e-06,
+      "loss": 0.0285,
+      "step": 4400
+    },
+    {
+      "epoch": 1.099706744868035,
+      "grad_norm": 0.054912444204092026,
+      "learning_rate": 9.01026392961877e-06,
+      "loss": 0.0176,
+      "step": 4500
+    },
+    {
+      "epoch": 1.1241446725317692,
+      "grad_norm": 1.042144775390625,
+      "learning_rate": 8.765884652981427e-06,
+      "loss": 0.0235,
+      "step": 4600
+    },
+    {
+      "epoch": 1.1485826001955035,
+      "grad_norm": 0.12319644540548325,
+      "learning_rate": 8.521505376344087e-06,
+      "loss": 0.0274,
+      "step": 4700
+    },
+    {
+      "epoch": 1.1730205278592376,
+      "grad_norm": 0.08448143303394318,
+      "learning_rate": 8.277126099706745e-06,
+      "loss": 0.0261,
+      "step": 4800
+    },
+    {
+      "epoch": 1.1974584555229717,
+      "grad_norm": 0.06239945441484451,
+      "learning_rate": 8.032746823069404e-06,
+      "loss": 0.022,
+      "step": 4900
+    },
+    {
+      "epoch": 1.2218963831867058,
+      "grad_norm": 0.0412888340651989,
+      "learning_rate": 7.788367546432064e-06,
+      "loss": 0.0239,
+      "step": 5000
+    },
+    {
+      "epoch": 1.2463343108504399,
+      "grad_norm": 0.10470504313707352,
+      "learning_rate": 7.543988269794722e-06,
+      "loss": 0.0256,
+      "step": 5100
+    },
+    {
+      "epoch": 1.270772238514174,
+      "grad_norm": 0.3927100896835327,
+      "learning_rate": 7.299608993157381e-06,
+      "loss": 0.0299,
+      "step": 5200
+    },
+    {
+      "epoch": 1.295210166177908,
+      "grad_norm": 0.2635032534599304,
+      "learning_rate": 7.05522971652004e-06,
+      "loss": 0.0223,
+      "step": 5300
+    },
+    {
+      "epoch": 1.3196480938416422,
+      "grad_norm": 0.05280297249555588,
+      "learning_rate": 6.810850439882698e-06,
+      "loss": 0.0319,
+      "step": 5400
+    },
+    {
+      "epoch": 1.3440860215053765,
+      "grad_norm": 0.02359873428940773,
+      "learning_rate": 6.566471163245357e-06,
+      "loss": 0.02,
+      "step": 5500
+    },
+    {
+      "epoch": 1.3685239491691106,
+      "grad_norm": 0.42642369866371155,
+      "learning_rate": 6.324535679374389e-06,
+      "loss": 0.0241,
+      "step": 5600
+    },
+    {
+      "epoch": 1.3929618768328447,
+      "grad_norm": 0.7084789872169495,
+      "learning_rate": 6.080156402737049e-06,
+      "loss": 0.0195,
+      "step": 5700
+    },
+    {
+      "epoch": 1.4173998044965788,
+      "grad_norm": 0.14894872903823853,
+      "learning_rate": 5.835777126099708e-06,
+      "loss": 0.0233,
+      "step": 5800
+    },
+    {
+      "epoch": 1.4418377321603129,
+      "grad_norm": 6.313684463500977,
+      "learning_rate": 5.591397849462365e-06,
+      "loss": 0.0181,
+      "step": 5900
+    },
+    {
+      "epoch": 1.466275659824047,
+      "grad_norm": 0.9010400772094727,
+      "learning_rate": 5.347018572825024e-06,
+      "loss": 0.0243,
+      "step": 6000
+    },
+    {
+      "epoch": 1.490713587487781,
+      "grad_norm": 0.15028172731399536,
+      "learning_rate": 5.102639296187683e-06,
+      "loss": 0.0227,
+      "step": 6100
+    },
+    {
+      "epoch": 1.5151515151515151,
+      "grad_norm": 1.0572513341903687,
+      "learning_rate": 4.858260019550342e-06,
+      "loss": 0.019,
+      "step": 6200
+    },
+    {
+      "epoch": 1.5395894428152492,
+      "grad_norm": 0.056791041046381,
+      "learning_rate": 4.613880742913001e-06,
+      "loss": 0.0204,
+      "step": 6300
+    },
+    {
+      "epoch": 1.5640273704789833,
+      "grad_norm": 0.3077963590621948,
+      "learning_rate": 4.36950146627566e-06,
+      "loss": 0.0253,
+      "step": 6400
+    },
+    {
+      "epoch": 1.5884652981427174,
+      "grad_norm": 0.03899073228240013,
+      "learning_rate": 4.125122189638319e-06,
+      "loss": 0.0216,
+      "step": 6500
+    },
+    {
+      "epoch": 1.6129032258064515,
+      "grad_norm": 1.412708044052124,
+      "learning_rate": 3.8807429130009776e-06,
+      "loss": 0.0224,
+      "step": 6600
+    },
+    {
+      "epoch": 1.6373411534701856,
+      "grad_norm": 0.08187337219715118,
+      "learning_rate": 3.6363636363636366e-06,
+      "loss": 0.0178,
+      "step": 6700
+    },
+    {
+      "epoch": 1.6617790811339197,
+      "grad_norm": 0.04208606481552124,
+      "learning_rate": 3.391984359726295e-06,
+      "loss": 0.0247,
+      "step": 6800
+    },
+    {
+      "epoch": 1.6862170087976538,
+      "grad_norm": 0.0923227071762085,
+      "learning_rate": 3.147605083088954e-06,
+      "loss": 0.0207,
+      "step": 6900
+    },
+    {
+      "epoch": 1.710654936461388,
+      "grad_norm": 1.2065573930740356,
+      "learning_rate": 2.903225806451613e-06,
+      "loss": 0.0362,
+      "step": 7000
+    },
+    {
+      "epoch": 1.7350928641251222,
+      "grad_norm": 5.345006942749023,
+      "learning_rate": 2.658846529814272e-06,
+      "loss": 0.0274,
+      "step": 7100
+    },
+    {
+      "epoch": 1.7595307917888563,
+      "grad_norm": 0.1414783000946045,
+      "learning_rate": 2.414467253176931e-06,
+      "loss": 0.0204,
+      "step": 7200
+    },
+    {
+      "epoch": 1.7839687194525904,
+      "grad_norm": 1.9135044813156128,
+      "learning_rate": 2.17008797653959e-06,
+      "loss": 0.0279,
+      "step": 7300
+    },
+    {
+      "epoch": 1.8084066471163245,
+      "grad_norm": 1.5857988595962524,
+      "learning_rate": 1.9257086999022484e-06,
+      "loss": 0.0251,
+      "step": 7400
+    },
+    {
+      "epoch": 1.8328445747800588,
+      "grad_norm": 0.38852691650390625,
+      "learning_rate": 1.6813294232649072e-06,
+      "loss": 0.0199,
+      "step": 7500
+    },
+    {
+      "epoch": 1.857282502443793,
+      "grad_norm": 0.09283141791820526,
+      "learning_rate": 1.4369501466275662e-06,
+      "loss": 0.0178,
+      "step": 7600
+    },
+    {
+      "epoch": 1.881720430107527,
+      "grad_norm": 0.04146512970328331,
+      "learning_rate": 1.192570869990225e-06,
+      "loss": 0.017,
+      "step": 7700
+    },
+    {
+      "epoch": 1.906158357771261,
+      "grad_norm": 0.029652154073119164,
+      "learning_rate": 9.481915933528838e-07,
+      "loss": 0.0193,
+      "step": 7800
+    },
+    {
+      "epoch": 1.9305962854349952,
+      "grad_norm": 0.04845303297042847,
+      "learning_rate": 7.038123167155427e-07,
+      "loss": 0.0287,
+      "step": 7900
+    },
+    {
+      "epoch": 1.9550342130987293,
+      "grad_norm": 0.05037612095475197,
+      "learning_rate": 4.618768328445748e-07,
+      "loss": 0.0257,
+      "step": 8000
+    },
+    {
+      "epoch": 1.9794721407624634,
+      "grad_norm": 0.9069479703903198,
+      "learning_rate": 2.1749755620723366e-07,
+      "loss": 0.0299,
+      "step": 8100
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9917183527007438,
+      "eval_f1": 0.994545440316787,
+      "eval_loss": 0.03528362512588501,
+      "eval_runtime": 158.882,
+      "eval_samples_per_second": 529.714,
+      "eval_steps_per_second": 11.04,
+      "step": 8184
+    }
+  ],
+  "logging_steps": 100,
+  "max_steps": 8184,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 2,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5.2026570822144e+16,
+  "train_batch_size": 48,
+  "trial_name": null,
+  "trial_params": null
+}

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c534883427a071f1d9f3ba8e1a112e5e016307e4c8c2c116719a636f815013c
+size 5841

Floressek/sentiment_classification_from_distillbert/checkpoint-8184/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

Floressek/sentiment_classification_from_distillbert/config.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "dtype": "float32",
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "transformers_version": "4.57.1",
+  "vocab_size": 30522
+}

Floressek/sentiment_classification_from_distillbert/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5ef48f63397444fab7fe77a7c3e8113768986ff1c8e5e9126a66727aa030ec64
+size 267832560

Floressek/sentiment_classification_from_distillbert/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

Floressek/sentiment_classification_from_distillbert/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

Floressek/sentiment_classification_from_distillbert/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

Floressek/sentiment_classification_from_distillbert/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0c534883427a071f1d9f3ba8e1a112e5e016307e4c8c2c116719a636f815013c
+size 5841

Floressek/sentiment_classification_from_distillbert/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

Szymon_Florek_Model_fine_tuning.ipynb ADDED Viewed

	@@ -0,0 +1,1145 @@

+{
+ "cells": [
+  {
+   "metadata": {
+    "collapsed": true
+   },
+   "cell_type": "markdown",
+   "source": "# Fine-tuning a Pretrained Model for sentiment analysis",
+   "id": "d26037aadad0840b"
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Importing necessary libraries and data\n",
+   "id": "15d09dfe44d655d4"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T17:17:28.523157Z",
+     "start_time": "2025-11-14T17:17:23.902525Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "!pip install datasets evaluate transformers[sentencepiece]\n",
+    "!pip install ipywidgets\n",
+    "!pip install torch\n",
+    "!pip install transformers[torch]\n",
+    "!pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118\n",
+    "!pip install scikit-learn"
+   ],
+   "id": "efdad8b2b5ab54d",
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Requirement already satisfied: datasets in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (4.4.1)\n",
+      "Requirement already satisfied: evaluate in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (0.4.6)\n",
+      "Requirement already satisfied: transformers[sentencepiece] in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (4.57.1)\n",
+      "Requirement already satisfied: filelock in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (3.20.0)\n",
+      "Requirement already satisfied: numpy>=1.17 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (2.3.4)\n",
+      "Requirement already satisfied: pyarrow>=21.0.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (22.0.0)\n",
+      "Requirement already satisfied: dill<0.4.1,>=0.3.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (0.4.0)\n",
+      "Requirement already satisfied: pandas in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (2.3.3)\n",
+      "Requirement already satisfied: requests>=2.32.2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (2.32.5)\n",
+      "Requirement already satisfied: httpx<1.0.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (0.28.1)\n",
+      "Requirement already satisfied: tqdm>=4.66.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (4.67.1)\n",
+      "Requirement already satisfied: xxhash in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (3.6.0)\n",
+      "Requirement already satisfied: multiprocess<0.70.19 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (0.70.18)\n",
+      "Requirement already satisfied: fsspec<=2025.10.0,>=2023.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (2025.10.0)\n",
+      "Requirement already satisfied: huggingface-hub<2.0,>=0.25.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (0.36.0)\n",
+      "Requirement already satisfied: packaging in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (25.0)\n",
+      "Requirement already satisfied: pyyaml>=5.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from datasets) (6.0.3)\n",
+      "Requirement already satisfied: aiohttp!=4.0.0a0,!=4.0.0a1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (3.13.2)\n",
+      "Requirement already satisfied: anyio in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from httpx<1.0.0->datasets) (4.11.0)\n",
+      "Requirement already satisfied: certifi in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from httpx<1.0.0->datasets) (2025.11.12)\n",
+      "Requirement already satisfied: httpcore==1.* in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from httpx<1.0.0->datasets) (1.0.9)\n",
+      "Requirement already satisfied: idna in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from httpx<1.0.0->datasets) (3.11)\n",
+      "Requirement already satisfied: h11>=0.16 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from httpcore==1.*->httpx<1.0.0->datasets) (0.16.0)\n",
+      "Requirement already satisfied: typing-extensions>=3.7.4.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from huggingface-hub<2.0,>=0.25.0->datasets) (4.15.0)\n",
+      "Requirement already satisfied: regex!=2019.12.17 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[sentencepiece]) (2025.11.3)\n",
+      "Requirement already satisfied: tokenizers<=0.23.0,>=0.22.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[sentencepiece]) (0.22.1)\n",
+      "Requirement already satisfied: safetensors>=0.4.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[sentencepiece]) (0.6.2)\n",
+      "Requirement already satisfied: sentencepiece!=0.1.92,>=0.1.91 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[sentencepiece]) (0.2.1)\n",
+      "Requirement already satisfied: protobuf in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[sentencepiece]) (6.33.1)\n",
+      "Requirement already satisfied: aiohappyeyeballs>=2.5.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (2.6.1)\n",
+      "Requirement already satisfied: aiosignal>=1.4.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (1.4.0)\n",
+      "Requirement already satisfied: attrs>=17.3.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (25.4.0)\n",
+      "Requirement already satisfied: frozenlist>=1.1.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (1.8.0)\n",
+      "Requirement already satisfied: multidict<7.0,>=4.5 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (6.7.0)\n",
+      "Requirement already satisfied: propcache>=0.2.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (0.4.1)\n",
+      "Requirement already satisfied: yarl<2.0,>=1.17.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.10.0,>=2023.1.0->datasets) (1.22.0)\n",
+      "Requirement already satisfied: charset_normalizer<4,>=2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from requests>=2.32.2->datasets) (3.4.4)\n",
+      "Requirement already satisfied: urllib3<3,>=1.21.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from requests>=2.32.2->datasets) (2.5.0)\n",
+      "Requirement already satisfied: colorama in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from tqdm>=4.66.3->datasets) (0.4.6)\n",
+      "Requirement already satisfied: sniffio>=1.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from anyio->httpx<1.0.0->datasets) (1.3.1)\n",
+      "Requirement already satisfied: python-dateutil>=2.8.2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from pandas->datasets) (2.9.0.post0)\n",
+      "Requirement already satisfied: pytz>=2020.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from pandas->datasets) (2025.2)\n",
+      "Requirement already satisfied: tzdata>=2022.7 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from pandas->datasets) (2025.2)\n",
+      "Requirement already satisfied: six>=1.5 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from python-dateutil>=2.8.2->pandas->datasets) (1.17.0)\n",
+      "Requirement already satisfied: ipywidgets in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (8.1.8)\n",
+      "Requirement already satisfied: comm>=0.1.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipywidgets) (0.2.3)\n",
+      "Requirement already satisfied: ipython>=6.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipywidgets) (9.7.0)\n",
+      "Requirement already satisfied: traitlets>=4.3.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipywidgets) (5.14.3)\n",
+      "Requirement already satisfied: widgetsnbextension~=4.0.14 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipywidgets) (4.0.15)\n",
+      "Requirement already satisfied: jupyterlab_widgets~=3.0.15 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipywidgets) (3.0.16)\n",
+      "Requirement already satisfied: colorama>=0.4.4 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (0.4.6)\n",
+      "Requirement already satisfied: decorator>=4.3.2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (5.2.1)\n",
+      "Requirement already satisfied: ipython-pygments-lexers>=1.0.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (1.1.1)\n",
+      "Requirement already satisfied: jedi>=0.18.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (0.19.2)\n",
+      "Requirement already satisfied: matplotlib-inline>=0.1.5 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (0.2.1)\n",
+      "Requirement already satisfied: prompt_toolkit<3.1.0,>=3.0.41 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (3.0.52)\n",
+      "Requirement already satisfied: pygments>=2.11.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (2.19.2)\n",
+      "Requirement already satisfied: stack_data>=0.6.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from ipython>=6.1.0->ipywidgets) (0.6.3)\n",
+      "Requirement already satisfied: wcwidth in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from prompt_toolkit<3.1.0,>=3.0.41->ipython>=6.1.0->ipywidgets) (0.2.14)\n",
+      "Requirement already satisfied: parso<0.9.0,>=0.8.4 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from jedi>=0.18.1->ipython>=6.1.0->ipywidgets) (0.8.5)\n",
+      "Requirement already satisfied: executing>=1.2.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from stack_data>=0.6.0->ipython>=6.1.0->ipywidgets) (2.2.1)\n",
+      "Requirement already satisfied: asttokens>=2.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from stack_data>=0.6.0->ipython>=6.1.0->ipywidgets) (3.0.0)\n",
+      "Requirement already satisfied: pure-eval in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from stack_data>=0.6.0->ipython>=6.1.0->ipywidgets) (0.2.3)\n",
+      "Requirement already satisfied: torch in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (2.7.1+cu118)\n",
+      "Requirement already satisfied: filelock in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (3.20.0)\n",
+      "Requirement already satisfied: typing-extensions>=4.10.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (4.15.0)\n",
+      "Requirement already satisfied: sympy>=1.13.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (1.14.0)\n",
+      "Requirement already satisfied: networkx in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (3.5)\n",
+      "Requirement already satisfied: jinja2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (3.1.6)\n",
+      "Requirement already satisfied: fsspec in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (2025.10.0)\n",
+      "Requirement already satisfied: setuptools in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (80.9.0)\n",
+      "Requirement already satisfied: mpmath<1.4,>=1.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from sympy>=1.13.3->torch) (1.3.0)\n",
+      "Requirement already satisfied: MarkupSafe>=2.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from jinja2->torch) (3.0.3)\n",
+      "Requirement already satisfied: transformers[torch] in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (4.57.1)\n",
+      "Requirement already satisfied: filelock in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (3.20.0)\n",
+      "Requirement already satisfied: huggingface-hub<1.0,>=0.34.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (0.36.0)\n",
+      "Requirement already satisfied: numpy>=1.17 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (2.3.4)\n",
+      "Requirement already satisfied: packaging>=20.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (25.0)\n",
+      "Requirement already satisfied: pyyaml>=5.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (6.0.3)\n",
+      "Requirement already satisfied: regex!=2019.12.17 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (2025.11.3)\n",
+      "Requirement already satisfied: requests in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (2.32.5)\n",
+      "Requirement already satisfied: tokenizers<=0.23.0,>=0.22.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (0.22.1)\n",
+      "Requirement already satisfied: safetensors>=0.4.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (0.6.2)\n",
+      "Requirement already satisfied: tqdm>=4.27 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (4.67.1)\n",
+      "Requirement already satisfied: torch>=2.2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (2.7.1+cu118)\n",
+      "Requirement already satisfied: accelerate>=0.26.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from transformers[torch]) (1.11.0)\n",
+      "Requirement already satisfied: fsspec>=2023.5.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from huggingface-hub<1.0,>=0.34.0->transformers[torch]) (2025.10.0)\n",
+      "Requirement already satisfied: typing-extensions>=3.7.4.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from huggingface-hub<1.0,>=0.34.0->transformers[torch]) (4.15.0)\n",
+      "Requirement already satisfied: psutil in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from accelerate>=0.26.0->transformers[torch]) (7.1.3)\n",
+      "Requirement already satisfied: sympy>=1.13.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch>=2.2->transformers[torch]) (1.14.0)\n",
+      "Requirement already satisfied: networkx in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch>=2.2->transformers[torch]) (3.5)\n",
+      "Requirement already satisfied: jinja2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch>=2.2->transformers[torch]) (3.1.6)\n",
+      "Requirement already satisfied: setuptools in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch>=2.2->transformers[torch]) (80.9.0)\n",
+      "Requirement already satisfied: mpmath<1.4,>=1.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from sympy>=1.13.3->torch>=2.2->transformers[torch]) (1.3.0)\n",
+      "Requirement already satisfied: colorama in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from tqdm>=4.27->transformers[torch]) (0.4.6)\n",
+      "Requirement already satisfied: MarkupSafe>=2.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from jinja2->torch>=2.2->transformers[torch]) (3.0.3)\n",
+      "Requirement already satisfied: charset_normalizer<4,>=2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from requests->transformers[torch]) (3.4.4)\n",
+      "Requirement already satisfied: idna<4,>=2.5 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from requests->transformers[torch]) (3.11)\n",
+      "Requirement already satisfied: urllib3<3,>=1.21.1 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from requests->transformers[torch]) (2.5.0)\n",
+      "Requirement already satisfied: certifi>=2017.4.17 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from requests->transformers[torch]) (2025.11.12)\n",
+      "Looking in indexes: https://download.pytorch.org/whl/cu118\n",
+      "Requirement already satisfied: torch in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (2.7.1+cu118)\n",
+      "Requirement already satisfied: torchvision in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (0.22.1+cu118)\n",
+      "Requirement already satisfied: torchaudio in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (2.7.1+cu118)\n",
+      "Requirement already satisfied: filelock in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (3.20.0)\n",
+      "Requirement already satisfied: typing-extensions>=4.10.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (4.15.0)\n",
+      "Requirement already satisfied: sympy>=1.13.3 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (1.14.0)\n",
+      "Requirement already satisfied: networkx in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (3.5)\n",
+      "Requirement already satisfied: jinja2 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (3.1.6)\n",
+      "Requirement already satisfied: fsspec in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (2025.10.0)\n",
+      "Requirement already satisfied: setuptools in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torch) (80.9.0)\n",
+      "Requirement already satisfied: numpy in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torchvision) (2.3.4)\n",
+      "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from torchvision) (11.3.0)\n",
+      "Requirement already satisfied: mpmath<1.4,>=1.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from sympy>=1.13.3->torch) (1.3.0)\n",
+      "Requirement already satisfied: MarkupSafe>=2.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from jinja2->torch) (3.0.3)\n",
+      "Requirement already satisfied: scikit-learn in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (1.7.2)\n",
+      "Requirement already satisfied: numpy>=1.22.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from scikit-learn) (2.3.4)\n",
+      "Requirement already satisfied: scipy>=1.8.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from scikit-learn) (1.16.3)\n",
+      "Requirement already satisfied: joblib>=1.2.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from scikit-learn) (1.5.2)\n",
+      "Requirement already satisfied: threadpoolctl>=3.1.0 in c:\\users\\szyme\\pycharmprojects\\languageprocessinglab\\.venv\\lib\\site-packages (from scikit-learn) (3.6.0)\n"
+     ]
+    }
+   ],
+   "execution_count": 4
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:39:53.784036Z",
+     "start_time": "2025-11-14T18:39:53.693711Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "!nvidia-smi\n",
+    "import torch\n",
+    "\n",
+    "print(f\"CUDA available: {torch.cuda.is_available()}\")\n",
+    "if torch.cuda.is_available():\n",
+    "    print(f\"Device: {torch.cuda.get_device_name(0)}\")\n",
+    "else:\n",
+    "    print(\"WARNING: Training on CPU will be very slow!\")"
+   ],
+   "id": "f6d0e86c409e9a9d",
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Fri Nov 14 19:39:53 2025       \n",
+      "+-----------------------------------------------------------------------------------------+\n",
+      "| NVIDIA-SMI 581.42                 Driver Version: 581.42         CUDA Version: 13.0     |\n",
+      "+-----------------------------------------+------------------------+----------------------+\n",
+      "| GPU  Name                  Driver-Model | Bus-Id          Disp.A | Volatile Uncorr. ECC |\n",
+      "| Fan  Temp   Perf          Pwr:Usage/Cap |           Memory-Usage | GPU-Util  Compute M. |\n",
+      "|                                         |                        |               MIG M. |\n",
+      "|=========================================+========================+======================|\n",
+      "|   0  NVIDIA GeForce RTX 4070      WDDM  |   00000000:01:00.0  On |                  N/A |\n",
+      "|  0%   43C    P5             25W /  215W |    4740MiB /  12282MiB |     21%      Default |\n",
+      "|                                         |                        |                  N/A |\n",
+      "+-----------------------------------------+------------------------+----------------------+\n",
+      "\n",
+      "+-----------------------------------------------------------------------------------------+\n",
+      "| Processes:                                                                              |\n",
+      "|  GPU   GI   CI              PID   Type   Process name                        GPU Memory |\n",
+      "|        ID   ID                                                               Usage      |\n",
+      "|=========================================================================================|\n",
+      "|    0   N/A  N/A            1416    C+G   C:\\Windows\\System32\\dwm.exe           N/A      |\n",
+      "|    0   N/A  N/A            2332    C+G   ....0.3595.53\\msedgewebview2.exe      N/A      |\n",
+      "|    0   N/A  N/A            2736    C+G   ...xyewy\\ShellExperienceHost.exe      N/A      |\n",
+      "|    0   N/A  N/A            5108    C+G   ...5n1h2txyewy\\TextInputHost.exe      N/A      |\n",
+      "|    0   N/A  N/A            7252    C+G   ...8bbwe\\PhoneExperienceHost.exe      N/A      |\n",
+      "|    0   N/A  N/A           11540    C+G   ...4__8wekyb3d8bbwe\\ms-teams.exe      N/A      |\n",
+      "|    0   N/A  N/A           12376    C+G   ...l\\Programs\\Opera GX\\opera.exe      N/A      |\n",
+      "|    0   N/A  N/A           12668    C+G   ...GABYTE\\Control Center\\GCC.exe      N/A      |\n",
+      "|    0   N/A  N/A           14740    C+G   ...lus\\logioptionsplus_agent.exe      N/A      |\n",
+      "|    0   N/A  N/A           14780    C+G   ...D\\CNext\\CNext\\AMDRSSrcExt.exe      N/A      |\n",
+      "|    0   N/A  N/A           15060    C+G   C:\\Windows\\explorer.exe               N/A      |\n",
+      "|    0   N/A  N/A           15140    C+G   ...indows\\System32\\ShellHost.exe      N/A      |\n",
+      "|    0   N/A  N/A           16828    C+G   ..._cw5n1h2txyewy\\SearchHost.exe      N/A      |\n",
+      "|    0   N/A  N/A           16836    C+G   ...y\\StartMenuExperienceHost.exe      N/A      |\n",
+      "|    0   N/A  N/A           19100    C+G   ....0.3595.53\\msedgewebview2.exe      N/A      |\n",
+      "|    0   N/A  N/A           19252    C+G   ...64__zpdnekdrzrea0\\Spotify.exe      N/A      |\n",
+      "|    0   N/A  N/A           20520    C+G   ...Next\\CNext\\RadeonSoftware.exe      N/A      |\n",
+      "|    0   N/A  N/A           20576    C+G   ...roadcast\\NVIDIA Broadcast.exe      N/A      |\n",
+      "|    0   N/A  N/A           21188    C+G   ...cord\\app-1.0.9214\\Discord.exe      N/A      |\n",
+      "|    0   N/A  N/A           22276    C+G   ...lpaper_engine\\wallpaper64.exe      N/A      |\n",
+      "|    0   N/A  N/A           23288    C+G   ...l\\Programs\\Opera GX\\opera.exe      N/A      |\n",
+      "|    0   N/A  N/A           23576    C+G   ...__8yrtsj140pw4g\\app\\Slack.exe      N/A      |\n",
+      "|    0   N/A  N/A           23656    C+G   ...zcv7bpp5a\\Raycast\\Raycast.exe      N/A      |\n",
+      "|    0   N/A  N/A           24616    C+G   ...__8yrtsj140pw4g\\app\\Slack.exe      N/A      |\n",
+      "|    0   N/A  N/A           24772    C+G   ....0.3595.53\\msedgewebview2.exe      N/A      |\n",
+      "|    0   N/A  N/A           28520    C+G   ...4__8wekyb3d8bbwe\\ms-teams.exe      N/A      |\n",
+      "|    0   N/A  N/A           29960    C+G   ....0.3595.53\\msedgewebview2.exe      N/A      |\n",
+      "|    0   N/A  N/A           31076    C+G   ...0_x64__8wekyb3d8bbwe\\Todo.exe      N/A      |\n",
+      "|    0   N/A  N/A           31724      C   ...gLab\\.venv\\Scripts\\python.exe      N/A      |\n",
+      "|    0   N/A  N/A           33752    C+G   ...harm 2\\jbr\\bin\\cef_server.exe      N/A      |\n",
+      "|    0   N/A  N/A           35756    C+G   ...Claude\\app-1.0.332\\claude.exe      N/A      |\n",
+      "|    0   N/A  N/A           36000    C+G   ...em32\\ApplicationFrameHost.exe      N/A      |\n",
+      "|    0   N/A  N/A           36392    C+G   C:\\Windows\\System32\\Taskmgr.exe       N/A      |\n",
+      "+-----------------------------------------------------------------------------------------+\n",
+      "CUDA available: True\n",
+      "Device: NVIDIA GeForce RTX 4070\n"
+     ]
+    }
+   ],
+   "execution_count": 28
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T20:21:55.196741Z",
+     "start_time": "2025-11-14T20:21:52.456375Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from pathlib import Path\n",
+    "from urllib.request import urlretrieve\n",
+    "import zipfile\n",
+    "import pandas as pd\n",
+    "\n",
+    "base_dir = Path().resolve()\n",
+    "\n",
+    "amazon_mobile_reviews_url = \"https://eduds.blob.core.windows.net/nlp/Amazon_Unlocked_Mobile.csv.zip\"\n",
+    "filename = \"data/Amazon_Unlocked_Mobile.csv.zip\"\n",
+    "data_dir = base_dir / \"data\"\n",
+    "\n",
+    "zip_path = data_dir / \"Amazon_Unlocked_Mobile.csv.zip\"\n",
+    "csv_path = data_dir / \"Amazon_Unlocked_Mobile.csv\"\n",
+    "\n",
+    "urlretrieve(amazon_mobile_reviews_url, filename)\n",
+    "\n",
+    "with zipfile.ZipFile(zip_path) as zfile:\n",
+    "    zfile.extractall(data_dir)\n",
+    "\n",
+    "df = pd.read_csv(csv_path)"
+   ],
+   "id": "af23e8e3d03e3bfb",
+   "outputs": [],
+   "execution_count": 63
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T20:21:56.503693Z",
+     "start_time": "2025-11-14T20:21:56.440111Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "df.info()\n",
+    "df.describe()\n",
+    "df.head()"
+   ],
+   "id": "27b0bab46de0d18d",
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "<class 'pandas.core.frame.DataFrame'>\n",
+      "RangeIndex: 413840 entries, 0 to 413839\n",
+      "Data columns (total 6 columns):\n",
+      " #   Column        Non-Null Count   Dtype  \n",
+      "---  ------        --------------   -----  \n",
+      " 0   Product Name  413840 non-null  object \n",
+      " 1   Brand Name    348669 non-null  object \n",
+      " 2   Price         407907 non-null  float64\n",
+      " 3   Rating        413840 non-null  int64  \n",
+      " 4   Reviews       413770 non-null  object \n",
+      " 5   Review Votes  401544 non-null  float64\n",
+      "dtypes: float64(2), int64(1), object(3)\n",
+      "memory usage: 18.9+ MB\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "                                        Product Name Brand Name   Price  \\\n",
+       "0  \"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...    Samsung  199.99   \n",
+       "1  \"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...    Samsung  199.99   \n",
+       "2  \"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...    Samsung  199.99   \n",
+       "3  \"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...    Samsung  199.99   \n",
+       "4  \"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...    Samsung  199.99   \n",
+       "\n",
+       "   Rating                                            Reviews  Review Votes  \n",
+       "0       5  I feel so LUCKY to have found this used (phone...           1.0  \n",
+       "1       4  nice phone, nice up grade from my pantach revu...           0.0  \n",
+       "2       5                                       Very pleased           0.0  \n",
+       "3       4  It works good but it goes slow sometimes but i...           0.0  \n",
+       "4       4  Great phone to replace my lost phone. The only...           0.0  "
+      ],
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>Product Name</th>\n",
+       "      <th>Brand Name</th>\n",
+       "      <th>Price</th>\n",
+       "      <th>Rating</th>\n",
+       "      <th>Reviews</th>\n",
+       "      <th>Review Votes</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>\"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...</td>\n",
+       "      <td>Samsung</td>\n",
+       "      <td>199.99</td>\n",
+       "      <td>5</td>\n",
+       "      <td>I feel so LUCKY to have found this used (phone...</td>\n",
+       "      <td>1.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>\"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...</td>\n",
+       "      <td>Samsung</td>\n",
+       "      <td>199.99</td>\n",
+       "      <td>4</td>\n",
+       "      <td>nice phone, nice up grade from my pantach revu...</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>\"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...</td>\n",
+       "      <td>Samsung</td>\n",
+       "      <td>199.99</td>\n",
+       "      <td>5</td>\n",
+       "      <td>Very pleased</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>\"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...</td>\n",
+       "      <td>Samsung</td>\n",
+       "      <td>199.99</td>\n",
+       "      <td>4</td>\n",
+       "      <td>It works good but it goes slow sometimes but i...</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>\"CLEAR CLEAN ESN\" Sprint EPIC 4G Galaxy SPH-D7...</td>\n",
+       "      <td>Samsung</td>\n",
+       "      <td>199.99</td>\n",
+       "      <td>4</td>\n",
+       "      <td>Great phone to replace my lost phone. The only...</td>\n",
+       "      <td>0.0</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ]
+     },
+     "execution_count": 64,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "execution_count": 64
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Configuration\n",
+   "id": "a44e589066e2e256"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:46:29.881682Z",
+     "start_time": "2025-11-14T18:46:29.879491Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "DATA_URL = \"https://eduds.blob.core.windows.net/nlp/Amazon_Unlocked_Mobile.csv.zip\"\n",
+    "DATA_FILE = \"data/Amazon_Unlocked_Mobile.csv\"\n",
+    "MODEL_CHECKPOINT = \"distilbert-base-uncased\"\n",
+    "REPO_NAME = \"Floressek/sentiment_classification_from_distillbert\"\n",
+    "HUGGING_FACE_TOKEN = \"here input your token\"\n",
+    "\n",
+    "MAX_REVIEW_LENGTH = 128\n",
+    "TEST_SIZE = 0.3\n",
+    "BATCH_SIZE = 48\n",
+    "BATCH_SIZE_TOKEN = 1000\n",
+    "LEARNING_RATE = 2e-5\n",
+    "NUM_EPOCHS = 2\n",
+    "WEIGHT_DECAY = 0.01\n",
+    "SEED = 100"
+   ],
+   "id": "2cf90b8ba07d0a63",
+   "outputs": [],
+   "execution_count": 45
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Data cleaning\n",
+   "id": "fbce9d6f95c91c27"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:46:31.582547Z",
+     "start_time": "2025-11-14T18:46:31.574356Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "df = df.drop(columns=[\"Brand Name\", \"Price\", \"Review Votes\", \"Product Name\"])\n",
+    "df.head()"
+   ],
+   "id": "d6daa3969babb120",
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "   Rating                                            Reviews\n",
+       "0       5  I feel so LUCKY to have found this used (phone...\n",
+       "1       4  nice phone, nice up grade from my pantach revu...\n",
+       "2       5                                       Very pleased\n",
+       "3       4  It works good but it goes slow sometimes but i...\n",
+       "4       4  Great phone to replace my lost phone. The only..."
+      ],
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>Rating</th>\n",
+       "      <th>Reviews</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>5</td>\n",
+       "      <td>I feel so LUCKY to have found this used (phone...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>4</td>\n",
+       "      <td>nice phone, nice up grade from my pantach revu...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>5</td>\n",
+       "      <td>Very pleased</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>4</td>\n",
+       "      <td>It works good but it goes slow sometimes but i...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>4</td>\n",
+       "      <td>Great phone to replace my lost phone. The only...</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ]
+     },
+     "execution_count": 46,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "execution_count": 46
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:46:34.926211Z",
+     "start_time": "2025-11-14T18:46:33.614096Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from datasets import Dataset\n",
+    "\n",
+    "dataset = Dataset.from_pandas(df)\n",
+    "\n",
+    "dataset = dataset.filter(\n",
+    "    lambda x: (\n",
+    "            x[\"Reviews\"] is not None\n",
+    "            and len(x[\"Reviews\"].split()) < MAX_REVIEW_LENGTH\n",
+    "            and x[\"Rating\"] in [1, 5]  # keep only the extreme ratings, for binary classification\n",
+    "    )\n",
+    ")\n",
+    "\n",
+    "dataset_split = dataset.train_test_split(test_size=TEST_SIZE, seed=SEED)"
+   ],
+   "id": "40a44a79b98aa996",
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "Filter:   0%|          | 0/413840 [00:00<?, ? examples/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "5023c01162324b84afb19ec45a970c56"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    }
+   ],
+   "execution_count": 47
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "### Tokenization",
+   "id": "f1cb6bd3ccecc50d"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:46:37.851802Z",
+     "start_time": "2025-11-14T18:46:37.100084Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from datasets import DatasetDict\n",
+    "from typing import Any\n",
+    "from transformers import AutoTokenizer\n",
+    "\n",
+    "tokenizer = AutoTokenizer.from_pretrained(MODEL_CHECKPOINT)\n",
+    "\n",
+    "\n",
+    "# keep only the input ids from tokenization, the attention mask (padding vs. content) and the labels\n",
+    "def tokenize_and_label(dataset: DatasetDict, tokenizer: Any):\n",
+    "    def tokenize_function(example):\n",
+    "        return tokenizer(example[\"Reviews\"], padding=\"max_length\", truncation=True)\n",
+    "\n",
+    "    def convert_to_binary_label(example):\n",
+    "        return {'label': [0 if r == 1 else 1 for r in example['Rating']]}\n",
+    "\n",
+    "    tokenized = dataset.map(tokenize_function, batched=True, batch_size=BATCH_SIZE_TOKEN)\n",
+    "    tokenized = tokenized.map(convert_to_binary_label, batched=True, batch_size=BATCH_SIZE_TOKEN)\n",
+    "    tokenized = tokenized.remove_columns([\"Reviews\", \"Rating\"])\n",
+    "\n",
+    "    return tokenized"
+   ],
+   "id": "18c877bae841c93e",
+   "outputs": [],
+   "execution_count": 48
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:46:41.756880Z",
+     "start_time": "2025-11-14T18:46:41.754675Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "import numpy as np\n",
+    "from evaluate import load\n",
+    "\n",
+    "\n",
+    "def compute_metrics(eval_pred) -> dict:\n",
+    "    accuracy_metric = load(\"accuracy\")\n",
+    "    f1_metric = load(\"f1\")\n",
+    "\n",
+    "    logits, labels = eval_pred\n",
+    "    predictions = np.argmax(logits, axis=-1)\n",
+    "\n",
+    "    accuracy = accuracy_metric.compute(predictions=predictions, references=labels)[\"accuracy\"]\n",
+    "    f1 = f1_metric.compute(predictions=predictions, references=labels)[\"f1\"]\n",
+    "\n",
+    "    return {\"accuracy\": accuracy, \"f1\": f1}"
+   ],
+   "id": "763efe8d9ac72643",
+   "outputs": [],
+   "execution_count": 50
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Hugging Face - logging in and model loading\n",
+   "id": "b73061c3bcedc4a2"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T18:46:44.096470Z",
+     "start_time": "2025-11-14T18:46:43.924416Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from huggingface_hub import login\n",
+    "\n",
+    "token = HUGGING_FACE_TOKEN\n",
+    "\n",
+    "if token:\n",
+    "    login(token=HUGGING_FACE_TOKEN)\n",
+    "else:\n",
+    "    login()"
+   ],
+   "id": "b439612b50fed578",
+   "outputs": [],
+   "execution_count": 51
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Training and fine-tuning the model\n",
+   "id": "9560b042d0525b99"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T19:29:10.301060Z",
+     "start_time": "2025-11-14T18:46:45.568724Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from transformers import AutoModelForSequenceClassification, TrainingArguments, Trainer\n",
+    "\n",
+    "\n",
+    "def train_model(tokenized_datasets: DatasetDict, tokenizer) -> Trainer:\n",
+    "    model = AutoModelForSequenceClassification.from_pretrained(\n",
+    "        MODEL_CHECKPOINT,\n",
+    "        num_labels=2,\n",
+    "    )\n",
+    "\n",
+    "    training_args = TrainingArguments(\n",
+    "        output_dir=REPO_NAME,\n",
+    "        learning_rate=LEARNING_RATE,\n",
+    "        per_device_train_batch_size=BATCH_SIZE,\n",
+    "        per_device_eval_batch_size=BATCH_SIZE,\n",
+    "        num_train_epochs=NUM_EPOCHS,\n",
+    "        weight_decay=WEIGHT_DECAY,\n",
+    "        save_strategy=\"epoch\",\n",
+    "        eval_strategy=\"epoch\",\n",
+    "        push_to_hub=True,\n",
+    "        remove_unused_columns=False,\n",
+    "        logging_steps=100,\n",
+    "        fp16=True,\n",
+    "    )\n",
+    "\n",
+    "    trainer = Trainer(\n",
+    "        model=model,\n",
+    "        args=training_args,\n",
+    "        train_dataset=tokenized_datasets['train'],\n",
+    "        eval_dataset=tokenized_datasets['test'],\n",
+    "        processing_class=tokenizer,\n",
+    "        compute_metrics=compute_metrics\n",
+    "    )\n",
+    "\n",
+    "    trainer.train()\n",
+    "\n",
+    "    return trainer\n",
+    "\n",
+    "\n",
+    "print(f\"Train size: {len(dataset_split['train'])}\")\n",
+    "print(f\"Test size: {len(dataset_split['test'])}\")\n",
+    "\n",
+    "tokenized_datasets = tokenize_and_label(dataset_split, tokenizer)\n",
+    "\n",
+    "trainer = train_model(tokenized_datasets, tokenizer)"
+   ],
+   "id": "f2baddc39582ea90",
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Train size: 196375\n",
+      "Test size: 84162\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Map:   0%|          | 0/196375 [00:00<?, ? examples/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "9eca0885f7e941e9ba0225ecab5226b5"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Map:   0%|          | 0/84162 [00:00<?, ? examples/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "46e17d5252ff4edba4613665ce78610f"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Map:   0%|          | 0/196375 [00:00<?, ? examples/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "b0899afc630842dd9c6de08b7d186a3b"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Map:   0%|          | 0/84162 [00:00<?, ? examples/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "669f11f90f5d4ac19919c0ae3772bf7b"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Some weights of DistilBertForSequenceClassification were not initialized from the model checkpoint at distilbert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight', 'pre_classifier.bias', 'pre_classifier.weight']\n",
+      "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "<IPython.core.display.HTML object>"
+      ],
+      "text/html": [
+       "\n",
+       "    <div>\n",
+       "      \n",
+       "      <progress value='8184' max='8184' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
+       "      [8184/8184 41:33, Epoch 2/2]\n",
+       "    </div>\n",
+       "    <table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       " <tr style=\"text-align: left;\">\n",
+       "      <th>Epoch</th>\n",
+       "      <th>Training Loss</th>\n",
+       "      <th>Validation Loss</th>\n",
+       "      <th>Accuracy</th>\n",
+       "      <th>F1</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <td>1</td>\n",
+       "      <td>0.043200</td>\n",
+       "      <td>0.040534</td>\n",
+       "      <td>0.989152</td>\n",
+       "      <td>0.992839</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <td>2</td>\n",
+       "      <td>0.029900</td>\n",
+       "      <td>0.035284</td>\n",
+       "      <td>0.991718</td>\n",
+       "      <td>0.994545</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table><p>"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": "5232456d49be4c01fb108dc77e31f262"
+     }
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Downloading builder script: 0.00B [00:00, ?B/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "6ea920f26713434d9390bbe9cfa3a896"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Downloading builder script: 0.00B [00:00, ?B/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "b661d468c9394cf7a2f3e161a223adf1"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    },
+    {
+     "data": {
+      "text/plain": [
+       "Downloading builder script: 0.00B [00:00, ?B/s]"
+      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "version_major": 2,
+       "version_minor": 0,
+       "model_id": "e755ba88b1e4457b8bab9944d4b1412f"
+      }
+     },
+     "metadata": {},
+     "output_type": "display_data",
+     "jetTransient": {
+      "display_id": null
+     }
+    }
+   ],
+   "execution_count": 52
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "## Testing the newly fine-tuned model\n",
+   "id": "195c0e81bf298c1c"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T19:56:16.772843Z",
+     "start_time": "2025-11-14T19:56:16.769490Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from transformers import pipeline\n",
+    "\n",
+    "\n",
+    "def create_classifier(model_path=f\"./{REPO_NAME}\"):\n",
+    "    tokenizer = AutoTokenizer.from_pretrained(model_path)\n",
+    "    model = AutoModelForSequenceClassification.from_pretrained(model_path)\n",
+    "\n",
+    "    return pipeline(\"text-classification\", model=model, tokenizer=tokenizer)\n",
+    "\n",
+    "\n",
+    "def test_classifier(classifier) -> None:\n",
+    "    examples = [\n",
+    "        \"Shame. I wish I hadn't buy it.\",\n",
+    "        \"Great handset!\",\n",
+    "        \"Terrible product, waste of money\",\n",
+    "        \"Best phone ever, highly recommend!\"\n",
+    "    ]\n",
+    "\n",
+    "    for text in examples:\n",
+    "        result = classifier(text)\n",
+    "        print(f\"Text: {text}\")\n",
+    "        print(f\"Result: {result}\\n\")\n"
+   ],
+   "id": "c1ce352b5ebe328c",
+   "outputs": [],
+   "execution_count": 53
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "### Eval metrics",
+   "id": "d4c5787afb9e6ae7"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T20:06:29.136185Z",
+     "start_time": "2025-11-14T20:03:59.964777Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "from transformers import AutoModelForSequenceClassification\n",
+    "from sklearn.metrics import confusion_matrix, classification_report, roc_auc_score, precision_recall_curve, auc\n",
+    "import numpy as np\n",
+    "import torch\n",
+    "\n",
+    "model_path = f\"./{REPO_NAME}\"\n",
+    "model = AutoModelForSequenceClassification.from_pretrained(model_path)\n",
+    "print(model)\n",
+    "\n",
+    "preds = trainer.predict(tokenized_datasets[\"test\"])\n",
+    "logits = preds.predictions\n",
+    "y_true = preds.label_ids\n",
+    "y_pred = np.argmax(logits, axis=-1)\n",
+    "probs = torch.softmax(torch.from_numpy(logits), dim=-1).numpy()[:, 1]\n",
+    "\n",
+    "cm = confusion_matrix(y_true, y_pred)\n",
+    "tn, fp, fn, tp = cm.ravel()\n",
+    "roc_auc = roc_auc_score(y_true, probs)\n",
+    "prec_curve, rec_curve, _ = precision_recall_curve(y_true, probs)\n",
+    "pr_auc = auc(rec_curve, prec_curve)\n",
+    "report = classification_report(y_true, y_pred, digits=4)\n",
+    "\n",
+    "print(\"Confusion matrix:\")\n",
+    "print(cm)\n",
+    "print(f\"TP={tp} FP={fp} TN={tn} FN={fn}\")\n",
+    "print(f\"ROC-AUC={roc_auc:.4f} PR-AUC={pr_auc:.4f}\")\n",
+    "print(report)\n"
+   ],
+   "id": "e3308ae685c70928",
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Architecture: DistilBertForSequenceClassification\n",
+      "DistilBertConfig {\n",
+      "  \"activation\": \"gelu\",\n",
+      "  \"architectures\": [\n",
+      "    \"DistilBertForSequenceClassification\"\n",
+      "  ],\n",
+      "  \"attention_dropout\": 0.1,\n",
+      "  \"dim\": 768,\n",
+      "  \"dropout\": 0.1,\n",
+      "  \"dtype\": \"float32\",\n",
+      "  \"hidden_dim\": 3072,\n",
+      "  \"initializer_range\": 0.02,\n",
+      "  \"max_position_embeddings\": 512,\n",
+      "  \"model_type\": \"distilbert\",\n",
+      "  \"n_heads\": 12,\n",
+      "  \"n_layers\": 6,\n",
+      "  \"pad_token_id\": 0,\n",
+      "  \"problem_type\": \"single_label_classification\",\n",
+      "  \"qa_dropout\": 0.1,\n",
+      "  \"seq_classif_dropout\": 0.2,\n",
+      "  \"sinusoidal_pos_embds\": false,\n",
+      "  \"tie_weights_\": true,\n",
+      "  \"transformers_version\": \"4.57.1\",\n",
+      "  \"vocab_size\": 30522\n",
+      "}\n",
+      "\n",
+      "Total params: 66,955,010\n",
+      "Trainable params: 66,955,010\n",
+      "Confusion matrix:\n",
+      "[[19922   352]\n",
+      " [  345 63543]]\n",
+      "TP=63543 FP=352 TN=19922 FN=345\n",
+      "ROC-AUC=0.9983 PR-AUC=0.9994\n",
+      "              precision    recall  f1-score   support\n",
+      "\n",
+      "           0     0.9830    0.9826    0.9828     20274\n",
+      "           1     0.9945    0.9946    0.9945     63888\n",
+      "\n",
+      "    accuracy                         0.9917     84162\n",
+      "   macro avg     0.9887    0.9886    0.9887     84162\n",
+      "weighted avg     0.9917    0.9917    0.9917     84162\n",
+      "\n"
+     ]
+    }
+   ],
+   "execution_count": 62
+  },
+  {
+   "metadata": {},
+   "cell_type": "markdown",
+   "source": "### Testing the model with text samples",
+   "id": "6fcdad5dc49bc568"
+  },
+  {
+   "metadata": {
+    "ExecuteTime": {
+     "end_time": "2025-11-14T19:59:26.564660Z",
+     "start_time": "2025-11-14T19:59:26.258924Z"
+    }
+   },
+   "cell_type": "code",
+   "source": [
+    "# Skipped because evaluation was already enabled during training\n",
+    "# eval_results = trainer.evaluate()\n",
+    "# print(f\"Evaluation results: {eval_results}\")\n",
+    "\n",
+    "print(\"Testing the fine-tuned model:\")\n",
+    "classifier = create_classifier()\n",
+    "test_classifier(classifier)"
+   ],
+   "id": "993ea8f31d059b8d",
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Device set to use cuda:0\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Testing the fine-tuned model:\n",
+      "Text: Shame. I wish I hadn't buy it.\n",
+      "Result: [{'label': 'LABEL_0', 'score': 0.9975292086601257}]\n",
+      "\n",
+      "Text: Great handset!\n",
+      "Result: [{'label': 'LABEL_1', 'score': 0.9996094107627869}]\n",
+      "\n",
+      "Text: Terrible product, waste of money\n",
+      "Result: [{'label': 'LABEL_0', 'score': 0.998723566532135}]\n",
+      "\n",
+      "Text: Best phone ever, highly recommend!\n",
+      "Result: [{'label': 'LABEL_1', 'score': 0.9996873140335083}]\n",
+      "\n"
+     ]
+    }
+   ],
+   "execution_count": 58
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 2
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython2",
+   "version": "2.7.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

data/Amazon_Unlocked_Mobile.csv ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:097abeefe303816e0f5e9c9ff380adb25910cf46307d2c104911eae8d0304e76
+size 131879567

data/Amazon_Unlocked_Mobile.csv.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:801af84059ea0c660aa082b0f07363fcefe224827ba7231248ecc69d95a739f3
+size 34182461