CIRCL/cwe-parent-vulnerability-classification-roberta-base
Browse files- README.md +48 -48
- config.json +52 -52
- emissions.csv +2 -2
- metrics.json +6 -6
- model.safetensors +1 -1
README.md
CHANGED
|
@@ -18,9 +18,9 @@ should probably proofread and complete it, then remove this comment. -->
|
|
| 18 |
|
| 19 |
This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
|
| 20 |
It achieves the following results on the evaluation set:
|
| 21 |
-
- Loss: 1.
|
| 22 |
-
- Accuracy: 0.
|
| 23 |
-
- F1 Macro: 0.
|
| 24 |
|
| 25 |
## Model description
|
| 26 |
|
|
@@ -40,8 +40,8 @@ More information needed
|
|
| 40 |
|
| 41 |
The following hyperparameters were used during training:
|
| 42 |
- learning_rate: 1e-05
|
| 43 |
-
- train_batch_size:
|
| 44 |
-
- eval_batch_size:
|
| 45 |
- seed: 42
|
| 46 |
- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
| 47 |
- lr_scheduler_type: linear
|
|
@@ -51,51 +51,51 @@ The following hyperparameters were used during training:
|
|
| 51 |
|
| 52 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 Macro |
|
| 53 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|
|
| 54 |
-
| 3.
|
| 55 |
-
|
|
| 56 |
-
| 2.
|
| 57 |
-
|
|
| 58 |
-
| 1.
|
| 59 |
-
| 1.
|
| 60 |
-
| 1.
|
| 61 |
-
|
|
| 62 |
-
|
|
| 63 |
-
| 0.
|
| 64 |
-
| 0.
|
| 65 |
-
| 0.
|
| 66 |
-
| 0.
|
| 67 |
-
| 0.
|
| 68 |
-
| 0.
|
| 69 |
-
| 0.
|
| 70 |
-
| 0.
|
| 71 |
-
| 0.
|
| 72 |
-
| 0.
|
| 73 |
-
| 0.
|
| 74 |
-
| 0.
|
| 75 |
-
| 0.
|
| 76 |
-
| 0.
|
| 77 |
-
| 0.
|
| 78 |
-
| 0.
|
| 79 |
-
| 0.
|
| 80 |
-
| 0.
|
| 81 |
-
| 0.
|
| 82 |
-
| 0.
|
| 83 |
-
| 0.
|
| 84 |
-
| 0.
|
| 85 |
-
| 0.
|
| 86 |
-
| 0.
|
| 87 |
-
| 0.
|
| 88 |
-
| 0.
|
| 89 |
-
| 0.
|
| 90 |
-
| 0.
|
| 91 |
-
| 0.
|
| 92 |
-
| 0.
|
| 93 |
-
| 0.
|
| 94 |
|
| 95 |
|
| 96 |
### Framework versions
|
| 97 |
|
| 98 |
-
- Transformers 4.57.
|
| 99 |
- Pytorch 2.9.1+cu128
|
| 100 |
-
- Datasets 4.4.
|
| 101 |
-
- Tokenizers 0.22.
|
|
|
|
| 18 |
|
| 19 |
This model is a fine-tuned version of [roberta-base](https://huggingface.co/roberta-base) on an unknown dataset.
|
| 20 |
It achieves the following results on the evaluation set:
|
| 21 |
+
- Loss: 1.7510
|
| 22 |
+
- Accuracy: 0.5455
|
| 23 |
+
- F1 Macro: 0.3776
|
| 24 |
|
| 25 |
## Model description
|
| 26 |
|
|
|
|
| 40 |
|
| 41 |
The following hyperparameters were used during training:
|
| 42 |
- learning_rate: 1e-05
|
| 43 |
+
- train_batch_size: 64
|
| 44 |
+
- eval_batch_size: 64
|
| 45 |
- seed: 42
|
| 46 |
- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
|
| 47 |
- lr_scheduler_type: linear
|
|
|
|
| 51 |
|
| 52 |
| Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 Macro |
|
| 53 |
|:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|
|
| 54 |
+
| 3.226 | 1.0 | 125 | 3.1362 | 0.0382 | 0.0035 |
|
| 55 |
+
| 3.0244 | 2.0 | 250 | 2.9390 | 0.2155 | 0.1215 |
|
| 56 |
+
| 2.589 | 3.0 | 375 | 2.3469 | 0.4141 | 0.2521 |
|
| 57 |
+
| 2.1614 | 4.0 | 500 | 2.0701 | 0.4355 | 0.2551 |
|
| 58 |
+
| 1.8396 | 5.0 | 625 | 1.9336 | 0.4467 | 0.2748 |
|
| 59 |
+
| 1.5698 | 6.0 | 750 | 1.9086 | 0.4905 | 0.2938 |
|
| 60 |
+
| 1.4142 | 7.0 | 875 | 1.7933 | 0.5174 | 0.3416 |
|
| 61 |
+
| 1.2292 | 8.0 | 1000 | 1.7510 | 0.5455 | 0.3776 |
|
| 62 |
+
| 1.1182 | 9.0 | 1125 | 1.7681 | 0.5713 | 0.3803 |
|
| 63 |
+
| 0.9924 | 10.0 | 1250 | 1.8151 | 0.6083 | 0.4059 |
|
| 64 |
+
| 0.9307 | 11.0 | 1375 | 1.8391 | 0.6218 | 0.4379 |
|
| 65 |
+
| 0.7875 | 12.0 | 1500 | 1.8065 | 0.6038 | 0.4048 |
|
| 66 |
+
| 0.6308 | 13.0 | 1625 | 1.9221 | 0.6409 | 0.4210 |
|
| 67 |
+
| 0.7327 | 14.0 | 1750 | 1.9986 | 0.6465 | 0.4775 |
|
| 68 |
+
| 0.5175 | 15.0 | 1875 | 2.0520 | 0.6644 | 0.4316 |
|
| 69 |
+
| 0.5302 | 16.0 | 2000 | 2.0989 | 0.6712 | 0.4528 |
|
| 70 |
+
| 0.38 | 17.0 | 2125 | 2.0826 | 0.6734 | 0.4669 |
|
| 71 |
+
| 0.3768 | 18.0 | 2250 | 2.1953 | 0.6611 | 0.4544 |
|
| 72 |
+
| 0.3653 | 19.0 | 2375 | 2.2217 | 0.6880 | 0.5000 |
|
| 73 |
+
| 0.3349 | 20.0 | 2500 | 2.1911 | 0.6880 | 0.4951 |
|
| 74 |
+
| 0.2563 | 21.0 | 2625 | 2.2999 | 0.6813 | 0.4771 |
|
| 75 |
+
| 0.2513 | 22.0 | 2750 | 2.4158 | 0.7037 | 0.4640 |
|
| 76 |
+
| 0.2154 | 23.0 | 2875 | 2.4323 | 0.7138 | 0.4689 |
|
| 77 |
+
| 0.1889 | 24.0 | 3000 | 2.4296 | 0.7037 | 0.4733 |
|
| 78 |
+
| 0.2042 | 25.0 | 3125 | 2.5223 | 0.7071 | 0.4411 |
|
| 79 |
+
| 0.1774 | 26.0 | 3250 | 2.5476 | 0.7037 | 0.5083 |
|
| 80 |
+
| 0.156 | 27.0 | 3375 | 2.5737 | 0.7205 | 0.5236 |
|
| 81 |
+
| 0.1406 | 28.0 | 3500 | 2.6518 | 0.7048 | 0.5220 |
|
| 82 |
+
| 0.144 | 29.0 | 3625 | 2.6388 | 0.7015 | 0.4789 |
|
| 83 |
+
| 0.1119 | 30.0 | 3750 | 2.7159 | 0.7228 | 0.5003 |
|
| 84 |
+
| 0.1187 | 31.0 | 3875 | 2.7170 | 0.7071 | 0.4973 |
|
| 85 |
+
| 0.1095 | 32.0 | 4000 | 2.7796 | 0.7160 | 0.4707 |
|
| 86 |
+
| 0.1082 | 33.0 | 4125 | 2.7926 | 0.7239 | 0.5038 |
|
| 87 |
+
| 0.0976 | 34.0 | 4250 | 2.8240 | 0.7149 | 0.4515 |
|
| 88 |
+
| 0.0885 | 35.0 | 4375 | 2.8532 | 0.7149 | 0.4466 |
|
| 89 |
+
| 0.0872 | 36.0 | 4500 | 2.8697 | 0.7183 | 0.4700 |
|
| 90 |
+
| 0.0795 | 37.0 | 4625 | 2.8467 | 0.7138 | 0.4994 |
|
| 91 |
+
| 0.0878 | 38.0 | 4750 | 2.8566 | 0.7104 | 0.4673 |
|
| 92 |
+
| 0.0886 | 39.0 | 4875 | 2.8951 | 0.7127 | 0.4667 |
|
| 93 |
+
| 0.086 | 40.0 | 5000 | 2.8841 | 0.7127 | 0.4683 |
|
| 94 |
|
| 95 |
|
| 96 |
### Framework versions
|
| 97 |
|
| 98 |
+
- Transformers 4.57.3
|
| 99 |
- Pytorch 2.9.1+cu128
|
| 100 |
+
- Datasets 4.4.2
|
| 101 |
+
- Tokenizers 0.22.2
|
config.json
CHANGED
|
@@ -11,62 +11,62 @@
|
|
| 11 |
"hidden_dropout_prob": 0.1,
|
| 12 |
"hidden_size": 768,
|
| 13 |
"id2label": {
|
| 14 |
-
"0": "
|
| 15 |
-
"1": "
|
| 16 |
-
"2": "
|
| 17 |
-
"3": "
|
| 18 |
-
"4": "
|
| 19 |
-
"5": "
|
| 20 |
-
"6": "
|
| 21 |
-
"7": "
|
| 22 |
-
"8": "
|
| 23 |
-
"9": "
|
| 24 |
-
"10": "
|
| 25 |
-
"11": "
|
| 26 |
-
"12": "
|
| 27 |
-
"13": "
|
| 28 |
-
"14": "
|
| 29 |
-
"15": "
|
| 30 |
-
"16": "
|
| 31 |
-
"17": "
|
| 32 |
-
"18": "
|
| 33 |
-
"19": "
|
| 34 |
-
"20": "
|
| 35 |
-
"21": "
|
| 36 |
-
"22": "
|
| 37 |
-
"23": "
|
| 38 |
-
"24": "
|
| 39 |
-
"25": "
|
| 40 |
},
|
| 41 |
"initializer_range": 0.02,
|
| 42 |
"intermediate_size": 3072,
|
| 43 |
"label2id": {
|
| 44 |
-
"
|
| 45 |
-
"
|
| 46 |
-
"
|
| 47 |
-
"
|
| 48 |
-
"
|
| 49 |
-
"
|
| 50 |
-
"
|
| 51 |
-
"
|
| 52 |
-
"
|
| 53 |
-
"
|
| 54 |
-
"
|
| 55 |
-
"
|
| 56 |
-
"
|
| 57 |
-
"
|
| 58 |
-
"
|
| 59 |
-
"
|
| 60 |
-
"
|
| 61 |
-
"
|
| 62 |
-
"
|
| 63 |
-
"
|
| 64 |
-
"
|
| 65 |
-
"
|
| 66 |
-
"
|
| 67 |
-
"
|
| 68 |
-
"
|
| 69 |
-
"
|
| 70 |
},
|
| 71 |
"layer_norm_eps": 1e-05,
|
| 72 |
"max_position_embeddings": 514,
|
|
|
|
| 11 |
"hidden_dropout_prob": 0.1,
|
| 12 |
"hidden_size": 768,
|
| 13 |
"id2label": {
|
| 14 |
+
"0": "1025",
|
| 15 |
+
"1": "1071",
|
| 16 |
+
"2": "131",
|
| 17 |
+
"3": "138",
|
| 18 |
+
"4": "284",
|
| 19 |
+
"5": "285",
|
| 20 |
+
"6": "435",
|
| 21 |
+
"7": "436",
|
| 22 |
+
"8": "595",
|
| 23 |
+
"9": "657",
|
| 24 |
+
"10": "664",
|
| 25 |
+
"11": "682",
|
| 26 |
+
"12": "684",
|
| 27 |
+
"13": "691",
|
| 28 |
+
"14": "693",
|
| 29 |
+
"15": "697",
|
| 30 |
+
"16": "703",
|
| 31 |
+
"17": "706",
|
| 32 |
+
"18": "707",
|
| 33 |
+
"19": "710",
|
| 34 |
+
"20": "74",
|
| 35 |
+
"21": "754",
|
| 36 |
+
"22": "829",
|
| 37 |
+
"23": "862",
|
| 38 |
+
"24": "913",
|
| 39 |
+
"25": "94"
|
| 40 |
},
|
| 41 |
"initializer_range": 0.02,
|
| 42 |
"intermediate_size": 3072,
|
| 43 |
"label2id": {
|
| 44 |
+
"1025": 0,
|
| 45 |
+
"1071": 1,
|
| 46 |
+
"131": 2,
|
| 47 |
+
"138": 3,
|
| 48 |
+
"284": 4,
|
| 49 |
+
"285": 5,
|
| 50 |
+
"435": 6,
|
| 51 |
+
"436": 7,
|
| 52 |
+
"595": 8,
|
| 53 |
+
"657": 9,
|
| 54 |
+
"664": 10,
|
| 55 |
+
"682": 11,
|
| 56 |
+
"684": 12,
|
| 57 |
+
"691": 13,
|
| 58 |
+
"693": 14,
|
| 59 |
+
"697": 15,
|
| 60 |
+
"703": 16,
|
| 61 |
+
"706": 17,
|
| 62 |
+
"707": 18,
|
| 63 |
+
"710": 19,
|
| 64 |
+
"74": 20,
|
| 65 |
+
"754": 21,
|
| 66 |
+
"829": 22,
|
| 67 |
+
"862": 23,
|
| 68 |
+
"913": 24,
|
| 69 |
+
"94": 25
|
| 70 |
},
|
| 71 |
"layer_norm_eps": 1e-05,
|
| 72 |
"max_position_embeddings": 514,
|
emissions.csv
CHANGED
|
@@ -1,2 +1,2 @@
|
|
| 1 |
-
timestamp,project_name,run_id,experiment_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
|
| 2 |
-
|
|
|
|
| 1 |
+
timestamp,project_name,run_id,experiment_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,water_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,cpu_utilization_percent,gpu_utilization_percent,ram_utilization_percent,ram_used_gb,on_cloud,pue,wue
|
| 2 |
+
2026-01-13T21:56:14,codecarbon,393db334-33a7-40a5-8744-5c0c0b8e9695,5b0fa12a-3dd7-45bb-9766-cc326314d9f1,1567.7256346759968,0.06313669868117386,4.02727985590555e-05,368.66620928434594,938.1824499334339,70.0,0.1616492382015093,0.407745279251518,0.030405019717430055,0.5997995371704574,0.0,Luxembourg,LUX,,,,Linux-6.8.0-90-generic-x86_64-with-glibc2.39,3.12.3,3.2.1,224,Intel(R) Xeon(R) Platinum 8480+,4,4 x NVIDIA L40S,6.1661,49.7498,2015.3354835510254,machine,0.6375481386392811,72.2033055198973,4.556418485237484,91.88500246187536,N,1.0,0.0
|
metrics.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
-
"eval_loss": 1.
|
| 3 |
-
"eval_accuracy": 0.
|
| 4 |
-
"eval_f1_macro": 0.
|
| 5 |
-
"eval_runtime": 1.
|
| 6 |
-
"eval_samples_per_second":
|
| 7 |
-
"eval_steps_per_second":
|
| 8 |
"epoch": 40.0
|
| 9 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"eval_loss": 1.7509655952453613,
|
| 3 |
+
"eval_accuracy": 0.5454545454545454,
|
| 4 |
+
"eval_f1_macro": 0.37756565971323075,
|
| 5 |
+
"eval_runtime": 1.6377,
|
| 6 |
+
"eval_samples_per_second": 544.058,
|
| 7 |
+
"eval_steps_per_second": 8.549,
|
| 8 |
"epoch": 40.0
|
| 9 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 498686648
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c2fe7e35982d93c50286a9784e87bbf66572abaff64e2bd958814eddd688e89
|
| 3 |
size 498686648
|