Deepu1965 committed on
Commit
37abcc2
·
verified ·
1 Parent(s): 81c6299

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -16,12 +16,12 @@ Multi-task transformer with shared MoE layers for:
16
  ## Performance
17
 
18
  ### Classification
19
- - Validation Accuracy: 0.3580
20
 
21
  ### Summarization
22
- - ROUGE-1: 0.2154
23
- - ROUGE-2: 0.0298
24
- - ROUGE-L: 0.1842
25
 
26
  ## Benefits
27
 
 
16
  ## Performance
17
 
18
  ### Classification
19
+ - Validation Accuracy: 0.3420
20
 
21
  ### Summarization
22
+ - ROUGE-1: 0.2250
23
+ - ROUGE-2: 0.0333
24
+ - ROUGE-L: 0.2078
25
 
26
  ## Benefits
27
 
history.csv CHANGED
@@ -1,4 +1,4 @@
1
  epoch,train_sum_loss,train_class_loss,train_class_acc,val_sum_loss,val_class_loss,val_class_acc,val_rouge1,val_rouge2,val_rougeL
2
- 1,6.539164045969645,1.080719949245453,0.407,6.074222045898438,1.0701570644378662,0.344,0.1856974871518223,0.01907572984467157,0.16932123951907738
3
- 2,5.473755016326904,1.0669607858657837,0.3973333333333333,5.697721607208252,0.9951665096282959,0.506,0.2045861270829145,0.024241315885172792,0.17770470477158784
4
- 3,4.5570032602945965,1.0329711267153423,0.4613333333333333,5.637807807922363,1.338168493270874,0.358,0.21535871469554163,0.02978786749856711,0.1842483145510327
 
1
  epoch,train_sum_loss,train_class_loss,train_class_acc,val_sum_loss,val_class_loss,val_class_acc,val_rouge1,val_rouge2,val_rougeL
2
+ 1,6.272962152862549,1.0185239918708802,0.4368,5.8008860549926755,1.1023406219482421,0.304,0.17660690248954364,0.018371370658335634,0.15689190075772386
3
+ 2,5.219159950256348,1.099994719696045,0.3462,5.416218318939209,1.0967657680511476,0.386,0.21779871449217764,0.028536134623968267,0.19329056631523484
4
+ 3,4.404316672515869,1.0899620735168456,0.361,5.30168932723999,1.7727555074691772,0.342,0.22501668712961082,0.03326989668183761,0.20778061653444058
metrics.json CHANGED
@@ -2,39 +2,39 @@
2
  "history": [
3
  {
4
  "epoch": 1,
5
- "train_sum_loss": 6.539164045969645,
6
- "train_class_loss": 1.080719949245453,
7
- "train_class_acc": 0.407,
8
- "val_sum_loss": 6.074222045898438,
9
- "val_class_loss": 1.0701570644378662,
10
- "val_class_acc": 0.344,
11
- "val_rouge1": 0.1856974871518223,
12
- "val_rouge2": 0.01907572984467157,
13
- "val_rougeL": 0.16932123951907738
14
  },
15
  {
16
  "epoch": 2,
17
- "train_sum_loss": 5.473755016326904,
18
- "train_class_loss": 1.0669607858657837,
19
- "train_class_acc": 0.3973333333333333,
20
- "val_sum_loss": 5.697721607208252,
21
- "val_class_loss": 0.9951665096282959,
22
- "val_class_acc": 0.506,
23
- "val_rouge1": 0.2045861270829145,
24
- "val_rouge2": 0.024241315885172792,
25
- "val_rougeL": 0.17770470477158784
26
  },
27
  {
28
  "epoch": 3,
29
- "train_sum_loss": 4.5570032602945965,
30
- "train_class_loss": 1.0329711267153423,
31
- "train_class_acc": 0.4613333333333333,
32
- "val_sum_loss": 5.637807807922363,
33
- "val_class_loss": 1.338168493270874,
34
- "val_class_acc": 0.358,
35
- "val_rouge1": 0.21535871469554163,
36
- "val_rouge2": 0.02978786749856711,
37
- "val_rougeL": 0.1842483145510327
38
  }
39
  ],
40
  "config": {
 
2
  "history": [
3
  {
4
  "epoch": 1,
5
+ "train_sum_loss": 6.272962152862549,
6
+ "train_class_loss": 1.0185239918708802,
7
+ "train_class_acc": 0.4368,
8
+ "val_sum_loss": 5.8008860549926755,
9
+ "val_class_loss": 1.1023406219482421,
10
+ "val_class_acc": 0.304,
11
+ "val_rouge1": 0.17660690248954364,
12
+ "val_rouge2": 0.018371370658335634,
13
+ "val_rougeL": 0.15689190075772386
14
  },
15
  {
16
  "epoch": 2,
17
+ "train_sum_loss": 5.219159950256348,
18
+ "train_class_loss": 1.099994719696045,
19
+ "train_class_acc": 0.3462,
20
+ "val_sum_loss": 5.416218318939209,
21
+ "val_class_loss": 1.0967657680511476,
22
+ "val_class_acc": 0.386,
23
+ "val_rouge1": 0.21779871449217764,
24
+ "val_rouge2": 0.028536134623968267,
25
+ "val_rougeL": 0.19329056631523484
26
  },
27
  {
28
  "epoch": 3,
29
+ "train_sum_loss": 4.404316672515869,
30
+ "train_class_loss": 1.0899620735168456,
31
+ "train_class_acc": 0.361,
32
+ "val_sum_loss": 5.30168932723999,
33
+ "val_class_loss": 1.7727555074691772,
34
+ "val_class_acc": 0.342,
35
+ "val_rouge1": 0.22501668712961082,
36
+ "val_rouge2": 0.03326989668183761,
37
+ "val_rougeL": 0.20778061653444058
38
  }
39
  ],
40
  "config": {
model.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30128df14f8ee585a1c686f17af6e9df803766e5ac6d55d8c59c5c93ba437131
3
  size 385512714
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2545d4f075dd3d1dfeadaa8b83777d84078f8373b4f4ee7c4418f5186bd3b97
3
  size 385512714
multitask_training.png CHANGED

Git LFS Details

  • SHA256: 641dabb0ce4b672eb9d60406f1cf411f627e439ee28d2069fd4d9c97f9e466c0
  • Pointer size: 131 Bytes
  • Size of remote file: 207 kB

Git LFS Details

  • SHA256: a6bd5b65983e400f9d274f230c40b74d600e9b8d0e757e6ffbc505402288b9ee
  • Pointer size: 131 Bytes
  • Size of remote file: 189 kB
tokenizer/tokenizer_config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<pad>",
@@ -930,6 +931,7 @@
930
  "clean_up_tokenization_spaces": true,
931
  "eos_token": "</s>",
932
  "extra_ids": 100,
 
933
  "model_max_length": 512,
934
  "pad_token": "<pad>",
935
  "tokenizer_class": "T5Tokenizer",
 
1
  {
2
+ "add_prefix_space": null,
3
  "added_tokens_decoder": {
4
  "0": {
5
  "content": "<pad>",
 
931
  "clean_up_tokenization_spaces": true,
932
  "eos_token": "</s>",
933
  "extra_ids": 100,
934
+ "extra_special_tokens": {},
935
  "model_max_length": 512,
936
  "pad_token": "<pad>",
937
  "tokenizer_class": "T5Tokenizer",