mr-kush committed on
Commit
ac52c9d
·
verified ·
1 Parent(s): 6dfdb7c

mr-kush/sambodhan-department-classification-model

Browse files
README.md ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: transformers
3
+ license: mit
4
+ base_model: FacebookAI/xlm-roberta-base
5
+ tags:
6
+ - generated_from_trainer
7
+ metrics:
8
+ - accuracy
9
+ - f1
10
+ - precision
11
+ - recall
12
+ model-index:
13
+ - name: trainer_output
14
+ results: []
15
+ ---
16
+
17
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
18
+ should probably proofread and complete it, then remove this comment. -->
19
+
20
+ # sambodhan-department-classification-model
21
+
22
+ This model is a fine-tuned version of [FacebookAI/xlm-roberta-base](https://huggingface.co/FacebookAI/xlm-roberta-base) on an unknown dataset.
23
+ It achieves the following results on the evaluation set:
24
+ - Loss: 2.0023
25
+ - Accuracy: 0.8598
26
+ - F1: 0.8668
27
+ - Precision: 0.8770
28
+ - Recall: 0.8598
29
+
30
+ ## Model description
31
+
32
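+ An XLM-RoBERTa base encoder (12 hidden layers, hidden size 768, 12 attention heads) with a single-label sequence-classification head (`XLMRobertaForSequenceClassification`). It assigns input text to one of four department labels: "Municipal Governance & Community Services", "Education, Health & Social Welfare", "Infrastructure, Utilities & Natural Resources", and "Security & Law Enforcement". More information needed on the training data and intended deployment.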
33
+
34
+ ## Intended uses & limitations
35
+
36
+ More information needed
37
+
38
+ ## Training and evaluation data
39
+
40
+ More information needed
41
+
42
+ ## Training procedure
43
+
44
+ ### Training hyperparameters
45
+
46
+ The following hyperparameters were used during training:
47
+ - learning_rate: 2e-05
48
+ - train_batch_size: 16
49
+ - eval_batch_size: 32
50
+ - seed: 42
51
+ - optimizer: OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
52
+ - lr_scheduler_type: linear
53
+ - num_epochs: 3
54
+ - mixed_precision_training: Native AMP
55
+
56
+ ### Training results
57
+
58
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall |
59
+ |:-------------:|:------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
60
+ | No log | 0.2439 | 20 | 1.6724 | 0.8537 | 0.8597 | 0.8721 | 0.8537 |
61
+ | No log | 0.4878 | 40 | 2.1847 | 0.8598 | 0.8618 | 0.8640 | 0.8598 |
62
+ | 0.3126 | 0.7317 | 60 | 2.0168 | 0.8598 | 0.8630 | 0.8673 | 0.8598 |
63
+ | 0.3126 | 0.9756 | 80 | 2.4119 | 0.8780 | 0.8804 | 0.8904 | 0.8780 |
64
+ | 0.2521 | 1.2195 | 100 | 2.2020 | 0.8902 | 0.8884 | 0.8899 | 0.8902 |
65
+ | 0.2521 | 1.4634 | 120 | 2.2252 | 0.8902 | 0.8893 | 0.8908 | 0.8902 |
66
+ | 0.2521 | 1.7073 | 140 | 1.9534 | 0.8476 | 0.8579 | 0.8738 | 0.8476 |
67
+ | 0.2102 | 1.9512 | 160 | 2.0566 | 0.8963 | 0.8952 | 0.8948 | 0.8963 |
68
+ | 0.2102 | 2.1951 | 180 | 2.1647 | 0.8659 | 0.8714 | 0.8799 | 0.8659 |
69
+ | 0.0475 | 2.4390 | 200 | 2.2178 | 0.8659 | 0.8713 | 0.8795 | 0.8659 |
70
+ | 0.0475 | 2.6829 | 220 | 2.2616 | 0.8659 | 0.8713 | 0.8795 | 0.8659 |
71
+ | 0.0475 | 2.9268 | 240 | 2.2667 | 0.8659 | 0.8713 | 0.8795 | 0.8659 |
72
+
73
+
74
+ ### Framework versions
75
+
76
+ - Transformers 4.56.2
77
+ - Pytorch 2.8.0+cu126
78
+ - Datasets 4.0.0
79
+ - Tokenizers 0.22.1
config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "XLMRobertaForSequenceClassification"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 0,
7
+ "classifier_dropout": null,
8
+ "dtype": "float32",
9
+ "eos_token_id": 2,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.1,
12
+ "hidden_size": 768,
13
+ "id2label": {
14
+ "0": "Municipal Governance & Community Services",
15
+ "1": "Education, Health & Social Welfare",
16
+ "2": "Infrastructure, Utilities & Natural Resources",
17
+ "3": "Security & Law Enforcement"
18
+ },
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 3072,
21
+ "label2id": {
22
+ "Education, Health & Social Welfare": 1,
23
+ "Infrastructure, Utilities & Natural Resources": 2,
24
+ "Municipal Governance & Community Services": 0,
25
+ "Security & Law Enforcement": 3
26
+ },
27
+ "layer_norm_eps": 1e-05,
28
+ "max_position_embeddings": 514,
29
+ "model_type": "xlm-roberta",
30
+ "num_attention_heads": 12,
31
+ "num_hidden_layers": 12,
32
+ "output_past": true,
33
+ "pad_token_id": 1,
34
+ "position_embedding_type": "absolute",
35
+ "problem_type": "single_label_classification",
36
+ "transformers_version": "4.56.2",
37
+ "type_vocab_size": 1,
38
+ "use_cache": true,
39
+ "vocab_size": 250002
40
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f23191f371d6e832144db6ce0c1ce92c30a6000355dc7bbba87312ae84b6848a
3
+ size 1112211160
runs/Oct09_03-37-32_36bf646bbd29/events.out.tfevents.1759981063.36bf646bbd29.429.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27f02e654830c658d498692d0ac8f3a4cf0e5888952b2b703ea5d0d85c1d7d33
3
+ size 5447
runs/Oct09_03-40-22_36bf646bbd29/events.out.tfevents.1759981225.36bf646bbd29.429.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9aa8746164ab80ec2e82a3e2185af2f263df59761be8a283d89299a955b4981c
3
+ size 7671
runs/Oct09_04-15-55_36bf646bbd29/events.out.tfevents.1759983358.36bf646bbd29.429.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:402542aeb5b016d32679beea05dcedfd23af2df8562b5f49d63017cb33509dd3
3
+ size 8568
runs/Oct09_04-19-58_36bf646bbd29/events.out.tfevents.1759983599.36bf646bbd29.429.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:862635d89fa413168f36ccb6518699fc1ea7ce219bcfb2dd0c8fdef503ec5e48
3
+ size 5508
runs/Oct09_04-21-42_36bf646bbd29/events.out.tfevents.1759983706.36bf646bbd29.429.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bd3a863f0fe265437e1c1c5e66f8672b70a3162c8b63b98c93c7d8fff777269
3
+ size 12308
runs/Oct09_04-21-42_36bf646bbd29/events.out.tfevents.1759983972.36bf646bbd29.429.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65051518ed264eb1d31249e36ee6ea3348321861610bc6171dea78f14e315d8b
3
+ size 560
runs/Oct09_04-21-42_36bf646bbd29/events.out.tfevents.1759984981.36bf646bbd29.429.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:950be66e7f7b55bfceada0fd9b50068ec1096bb10349acc767950bc10d612087
3
+ size 5508
runs/Oct09_04-21-42_36bf646bbd29/events.out.tfevents.1759985057.36bf646bbd29.429.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4595f6b7c20befda1830869937ffebc42399ad7a64c65f7240fa730f0f35bc2b
3
+ size 5774
runs/Oct09_04-21-42_36bf646bbd29/events.out.tfevents.1759985125.36bf646bbd29.429.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1953ec6602397ea8db0f0e157cd9ef3abb2b1a555a740f7571e07336db184c1
3
+ size 12308
runs/Oct09_04-21-42_36bf646bbd29/events.out.tfevents.1759985368.36bf646bbd29.429.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd5663754a2998f365babd7d0f8eed9abf736ec9acad1e026c2b313e59e927c3
3
+ size 560
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d008b51eda27ee0e3bfc1b7de3791d7398bdac675c3538373706c07582d967af
3
+ size 5777