ldrace committed on
Commit
5e87f63
·
1 Parent(s): 6372cd7

Training in progress, step 500

Browse files
Files changed (25) hide show
  1. .gitignore +1 -0
  2. config.json +70 -0
  3. merges.txt +0 -0
  4. pytorch_model.bin +3 -0
  5. runs/Apr28_19-09-53_67c60f377191/1682709489.6553383/events.out.tfevents.1682709489.67c60f377191.97290.1 +3 -0
  6. runs/Apr28_19-09-53_67c60f377191/1682710073.1903777/events.out.tfevents.1682710073.67c60f377191.97290.3 +3 -0
  7. runs/Apr28_19-09-53_67c60f377191/1682710148.1196187/events.out.tfevents.1682710148.67c60f377191.97290.5 +3 -0
  8. runs/Apr28_19-09-53_67c60f377191/events.out.tfevents.1682709489.67c60f377191.97290.0 +3 -0
  9. runs/Apr28_19-09-53_67c60f377191/events.out.tfevents.1682710073.67c60f377191.97290.2 +3 -0
  10. runs/Apr28_19-09-53_67c60f377191/events.out.tfevents.1682710148.67c60f377191.97290.4 +3 -0
  11. runs/Apr28_19-32-54_67c60f377191/1682710397.1319244/events.out.tfevents.1682710397.67c60f377191.97290.7 +3 -0
  12. runs/Apr28_19-32-54_67c60f377191/events.out.tfevents.1682710397.67c60f377191.97290.6 +3 -0
  13. runs/Apr28_20-02-15_67c60f377191/1682712162.3723226/events.out.tfevents.1682712162.67c60f377191.114718.1 +3 -0
  14. runs/Apr28_20-02-15_67c60f377191/events.out.tfevents.1682712162.67c60f377191.114718.0 +3 -0
  15. runs/Apr28_20-04-31_67c60f377191/1682712296.560953/events.out.tfevents.1682712296.67c60f377191.114718.3 +3 -0
  16. runs/Apr28_20-04-31_67c60f377191/events.out.tfevents.1682712296.67c60f377191.114718.2 +3 -0
  17. runs/Apr28_20-06-50_67c60f377191/1682712414.4738984/events.out.tfevents.1682712414.67c60f377191.120172.1 +3 -0
  18. runs/Apr28_20-06-50_67c60f377191/events.out.tfevents.1682712414.67c60f377191.120172.0 +3 -0
  19. runs/Apr28_20-12-15_67c60f377191/1682712739.5568504/events.out.tfevents.1682712739.67c60f377191.121745.1 +3 -0
  20. runs/Apr28_20-12-15_67c60f377191/events.out.tfevents.1682712739.67c60f377191.121745.0 +3 -0
  21. special_tokens_map.json +15 -0
  22. tokenizer.json +0 -0
  23. tokenizer_config.json +15 -0
  24. training_args.bin +3 -0
  25. vocab.json +0 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/bart-large-cnn",
3
+ "_num_labels": 3,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "gelu",
6
+ "add_final_layer_norm": false,
7
+ "architectures": [
8
+ "BartForConditionalGeneration"
9
+ ],
10
+ "attention_dropout": 0.0,
11
+ "bos_token_id": 0,
12
+ "classif_dropout": 0.0,
13
+ "classifier_dropout": 0.0,
14
+ "d_model": 1024,
15
+ "decoder_attention_heads": 16,
16
+ "decoder_ffn_dim": 4096,
17
+ "decoder_layerdrop": 0.0,
18
+ "decoder_layers": 12,
19
+ "decoder_start_token_id": 2,
20
+ "dropout": 0.1,
21
+ "early_stopping": true,
22
+ "encoder_attention_heads": 16,
23
+ "encoder_ffn_dim": 4096,
24
+ "encoder_layerdrop": 0.0,
25
+ "encoder_layers": 12,
26
+ "eos_token_id": 2,
27
+ "force_bos_token_to_be_generated": true,
28
+ "forced_bos_token_id": 0,
29
+ "forced_eos_token_id": 2,
30
+ "gradient_checkpointing": false,
31
+ "id2label": {
32
+ "0": "LABEL_0",
33
+ "1": "LABEL_1",
34
+ "2": "LABEL_2"
35
+ },
36
+ "init_std": 0.02,
37
+ "is_encoder_decoder": true,
38
+ "label2id": {
39
+ "LABEL_0": 0,
40
+ "LABEL_1": 1,
41
+ "LABEL_2": 2
42
+ },
43
+ "length_penalty": 2.0,
44
+ "max_length": 142,
45
+ "max_position_embeddings": 1024,
46
+ "min_length": 56,
47
+ "model_type": "bart",
48
+ "no_repeat_ngram_size": 3,
49
+ "normalize_before": false,
50
+ "num_beams": 4,
51
+ "num_hidden_layers": 12,
52
+ "output_past": true,
53
+ "pad_token_id": 1,
54
+ "prefix": " ",
55
+ "scale_embedding": false,
56
+ "task_specific_params": {
57
+ "summarization": {
58
+ "early_stopping": true,
59
+ "length_penalty": 2.0,
60
+ "max_length": 142,
61
+ "min_length": 56,
62
+ "no_repeat_ngram_size": 3,
63
+ "num_beams": 4
64
+ }
65
+ },
66
+ "torch_dtype": "float32",
67
+ "transformers_version": "4.28.1",
68
+ "use_cache": true,
69
+ "vocab_size": 50264
70
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10a4ebc05ca6708f2ab962937e63594cf2038ecd65ffab470f83b94418010df6
3
+ size 1625537293
runs/Apr28_19-09-53_67c60f377191/1682709489.6553383/events.out.tfevents.1682709489.67c60f377191.97290.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89bde7b50da7ffa12a94b3e54b3ce3768f089ebd94166c4a3c4bcf041fd3adb6
3
+ size 6199
runs/Apr28_19-09-53_67c60f377191/1682710073.1903777/events.out.tfevents.1682710073.67c60f377191.97290.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd8fd009b22094f1ea3a5c0de72c32e8d0e801ccb172fc6226a2b66398b1a0e0
3
+ size 6199
runs/Apr28_19-09-53_67c60f377191/1682710148.1196187/events.out.tfevents.1682710148.67c60f377191.97290.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:688ea12b8921bd3cb74c2f9c27e3e12eeb7de81d9aaa4aa4ad003d51b3dd5a9f
3
+ size 6199
runs/Apr28_19-09-53_67c60f377191/events.out.tfevents.1682709489.67c60f377191.97290.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d483e880de2874e498013d7b8d2f35f71eb426b2a2198981ee702718efe4275
3
+ size 5174
runs/Apr28_19-09-53_67c60f377191/events.out.tfevents.1682710073.67c60f377191.97290.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73df2b5dfc8c8f25281e18f5d753f22143108b6916301acdb9c1d3e4125fa91b
3
+ size 5174
runs/Apr28_19-09-53_67c60f377191/events.out.tfevents.1682710148.67c60f377191.97290.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b24fb3482915eae5e240d8d5258f1aeff8ec378210726c83d1e53d184485b6
3
+ size 5174
runs/Apr28_19-32-54_67c60f377191/1682710397.1319244/events.out.tfevents.1682710397.67c60f377191.97290.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:078cac593fb2c8bcbcdd521129dc59e47965f24923cc62687f8802853a9c7377
3
+ size 6205
runs/Apr28_19-32-54_67c60f377191/events.out.tfevents.1682710397.67c60f377191.97290.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66ea851502d994ea92c41e65705c9552200c54fde86e5941f469ee62e3a36f21
3
+ size 5168
runs/Apr28_20-02-15_67c60f377191/1682712162.3723226/events.out.tfevents.1682712162.67c60f377191.114718.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34e356a385615b0e683e204be0e0edd91339c27645dde80880e5ec70c02abf6d
3
+ size 6205
runs/Apr28_20-02-15_67c60f377191/events.out.tfevents.1682712162.67c60f377191.114718.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50d8b6ff53e3159ccbb435e69db7ac56dbede643a217b17a9b462431cccd4e82
3
+ size 5166
runs/Apr28_20-04-31_67c60f377191/1682712296.560953/events.out.tfevents.1682712296.67c60f377191.114718.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65b6919ffa92d7428dc14cf6adc8534db596ea12b91f310f0f8fd83658f44aae
3
+ size 6205
runs/Apr28_20-04-31_67c60f377191/events.out.tfevents.1682712296.67c60f377191.114718.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ee35f0e1e8748b84b004abfafb214ad1b85cf527f0b7bf4d11b32ec70e397ce
3
+ size 4184
runs/Apr28_20-06-50_67c60f377191/1682712414.4738984/events.out.tfevents.1682712414.67c60f377191.120172.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2154f72978d96b32c4e9176c8d35d122c1a96ae166bbbf44e72d2e2067bb803
3
+ size 6205
runs/Apr28_20-06-50_67c60f377191/events.out.tfevents.1682712414.67c60f377191.120172.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e34bbb03de416f8ccd527f5061e73e0ba962c4dc314c5ea8314a7c1e25a4dfb
3
+ size 5167
runs/Apr28_20-12-15_67c60f377191/1682712739.5568504/events.out.tfevents.1682712739.67c60f377191.121745.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e422d648cc5950e60ff934737911c48ca538b2239703387b71d3b167dff99aa7
3
+ size 6205
runs/Apr28_20-12-15_67c60f377191/events.out.tfevents.1682712739.67c60f377191.121745.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbe2b247d626679ae35c545dc5a7eb27ebab9a1c551ff1f9a7cfcc196bdb9588
3
+ size 5167
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": "<s>",
4
+ "clean_up_tokenization_spaces": true,
5
+ "cls_token": "<s>",
6
+ "eos_token": "</s>",
7
+ "errors": "replace",
8
+ "mask_token": "<mask>",
9
+ "model_max_length": 1024,
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "tokenizer_class": "BartTokenizer",
13
+ "trim_offsets": true,
14
+ "unk_token": "<unk>"
15
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ec9012c9ac5be42607f759f62ec1197d799432c6692413905b5410e2e0b3b53
3
+ size 3771
vocab.json ADDED
The diff for this file is too large to render. See raw diff