Upload folder using huggingface_hub
Browse files- README.md +4 -4
- history.csv +3 -3
- metrics.json +27 -27
- model.pt +1 -1
- multitask_training.png +2 -2
- tokenizer/tokenizer_config.json +2 -0
README.md
CHANGED
|
@@ -16,12 +16,12 @@ Multi-task transformer with shared MoE layers for:
|
|
| 16 |
## Performance
|
| 17 |
|
| 18 |
### Classification
|
| 19 |
-
- Validation Accuracy: 0.
|
| 20 |
|
| 21 |
### Summarization
|
| 22 |
-
- ROUGE-1: 0.
|
| 23 |
-
- ROUGE-2: 0.
|
| 24 |
-
- ROUGE-L: 0.
|
| 25 |
|
| 26 |
## Benefits
|
| 27 |
|
|
|
|
| 16 |
## Performance
|
| 17 |
|
| 18 |
### Classification
|
| 19 |
+
- Validation Accuracy: 0.3420
|
| 20 |
|
| 21 |
### Summarization
|
| 22 |
+
- ROUGE-1: 0.2250
|
| 23 |
+
- ROUGE-2: 0.0333
|
| 24 |
+
- ROUGE-L: 0.2078
|
| 25 |
|
| 26 |
## Benefits
|
| 27 |
|
history.csv
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
epoch,train_sum_loss,train_class_loss,train_class_acc,val_sum_loss,val_class_loss,val_class_acc,val_rouge1,val_rouge2,val_rougeL
|
| 2 |
-
1,6.
|
| 3 |
-
2,5.
|
| 4 |
-
3,4.
|
|
|
|
| 1 |
epoch,train_sum_loss,train_class_loss,train_class_acc,val_sum_loss,val_class_loss,val_class_acc,val_rouge1,val_rouge2,val_rougeL
|
| 2 |
+
1,6.272962152862549,1.0185239918708802,0.4368,5.8008860549926755,1.1023406219482421,0.304,0.17660690248954364,0.018371370658335634,0.15689190075772386
|
| 3 |
+
2,5.219159950256348,1.099994719696045,0.3462,5.416218318939209,1.0967657680511476,0.386,0.21779871449217764,0.028536134623968267,0.19329056631523484
|
| 4 |
+
3,4.404316672515869,1.0899620735168456,0.361,5.30168932723999,1.7727555074691772,0.342,0.22501668712961082,0.03326989668183761,0.20778061653444058
|
metrics.json
CHANGED
|
@@ -2,39 +2,39 @@
|
|
| 2 |
"history": [
|
| 3 |
{
|
| 4 |
"epoch": 1,
|
| 5 |
-
"train_sum_loss": 6.
|
| 6 |
-
"train_class_loss": 1.
|
| 7 |
-
"train_class_acc": 0.
|
| 8 |
-
"val_sum_loss":
|
| 9 |
-
"val_class_loss": 1.
|
| 10 |
-
"val_class_acc": 0.
|
| 11 |
-
"val_rouge1": 0.
|
| 12 |
-
"val_rouge2": 0.
|
| 13 |
-
"val_rougeL": 0.
|
| 14 |
},
|
| 15 |
{
|
| 16 |
"epoch": 2,
|
| 17 |
-
"train_sum_loss": 5.
|
| 18 |
-
"train_class_loss": 1.
|
| 19 |
-
"train_class_acc": 0.
|
| 20 |
-
"val_sum_loss": 5.
|
| 21 |
-
"val_class_loss":
|
| 22 |
-
"val_class_acc": 0.
|
| 23 |
-
"val_rouge1": 0.
|
| 24 |
-
"val_rouge2": 0.
|
| 25 |
-
"val_rougeL": 0.
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"epoch": 3,
|
| 29 |
-
"train_sum_loss": 4.
|
| 30 |
-
"train_class_loss": 1.
|
| 31 |
-
"train_class_acc": 0.
|
| 32 |
-
"val_sum_loss": 5.
|
| 33 |
-
"val_class_loss": 1.
|
| 34 |
-
"val_class_acc": 0.
|
| 35 |
-
"val_rouge1": 0.
|
| 36 |
-
"val_rouge2": 0.
|
| 37 |
-
"val_rougeL": 0.
|
| 38 |
}
|
| 39 |
],
|
| 40 |
"config": {
|
|
|
|
| 2 |
"history": [
|
| 3 |
{
|
| 4 |
"epoch": 1,
|
| 5 |
+
"train_sum_loss": 6.272962152862549,
|
| 6 |
+
"train_class_loss": 1.0185239918708802,
|
| 7 |
+
"train_class_acc": 0.4368,
|
| 8 |
+
"val_sum_loss": 5.8008860549926755,
|
| 9 |
+
"val_class_loss": 1.1023406219482421,
|
| 10 |
+
"val_class_acc": 0.304,
|
| 11 |
+
"val_rouge1": 0.17660690248954364,
|
| 12 |
+
"val_rouge2": 0.018371370658335634,
|
| 13 |
+
"val_rougeL": 0.15689190075772386
|
| 14 |
},
|
| 15 |
{
|
| 16 |
"epoch": 2,
|
| 17 |
+
"train_sum_loss": 5.219159950256348,
|
| 18 |
+
"train_class_loss": 1.099994719696045,
|
| 19 |
+
"train_class_acc": 0.3462,
|
| 20 |
+
"val_sum_loss": 5.416218318939209,
|
| 21 |
+
"val_class_loss": 1.0967657680511476,
|
| 22 |
+
"val_class_acc": 0.386,
|
| 23 |
+
"val_rouge1": 0.21779871449217764,
|
| 24 |
+
"val_rouge2": 0.028536134623968267,
|
| 25 |
+
"val_rougeL": 0.19329056631523484
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"epoch": 3,
|
| 29 |
+
"train_sum_loss": 4.404316672515869,
|
| 30 |
+
"train_class_loss": 1.0899620735168456,
|
| 31 |
+
"train_class_acc": 0.361,
|
| 32 |
+
"val_sum_loss": 5.30168932723999,
|
| 33 |
+
"val_class_loss": 1.7727555074691772,
|
| 34 |
+
"val_class_acc": 0.342,
|
| 35 |
+
"val_rouge1": 0.22501668712961082,
|
| 36 |
+
"val_rouge2": 0.03326989668183761,
|
| 37 |
+
"val_rougeL": 0.20778061653444058
|
| 38 |
}
|
| 39 |
],
|
| 40 |
"config": {
|
model.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 385512714
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b2545d4f075dd3d1dfeadaa8b83777d84078f8373b4f4ee7c4418f5186bd3b97
|
| 3 |
size 385512714
|
multitask_training.png
CHANGED
|
Git LFS Details
|
|
Git LFS Details
|
tokenizer/tokenizer_config.json
CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
{
|
|
|
|
| 2 |
"added_tokens_decoder": {
|
| 3 |
"0": {
|
| 4 |
"content": "<pad>",
|
|
@@ -930,6 +931,7 @@
|
|
| 930 |
"clean_up_tokenization_spaces": true,
|
| 931 |
"eos_token": "</s>",
|
| 932 |
"extra_ids": 100,
|
|
|
|
| 933 |
"model_max_length": 512,
|
| 934 |
"pad_token": "<pad>",
|
| 935 |
"tokenizer_class": "T5Tokenizer",
|
|
|
|
| 1 |
{
|
| 2 |
+
"add_prefix_space": null,
|
| 3 |
"added_tokens_decoder": {
|
| 4 |
"0": {
|
| 5 |
"content": "<pad>",
|
|
|
|
| 931 |
"clean_up_tokenization_spaces": true,
|
| 932 |
"eos_token": "</s>",
|
| 933 |
"extra_ids": 100,
|
| 934 |
+
"extra_special_tokens": {},
|
| 935 |
"model_max_length": 512,
|
| 936 |
"pad_token": "<pad>",
|
| 937 |
"tokenizer_class": "T5Tokenizer",
|