lavokvv committed on
Commit
48223ee
·
1 Parent(s): 7f8da8b

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "flaubert/flaubert_base_cased",
3
  "amp": 1,
4
  "architectures": [
5
  "FlaubertForSequenceClassification"
@@ -12,7 +12,7 @@
12
  "causal": false,
13
  "clip_grad_norm": 5,
14
  "dropout": 0.1,
15
- "emb_dim": 768,
16
  "embed_init_std": 0.02209708691207961,
17
  "encoder_only": true,
18
  "end_n_top": 5,
@@ -48,8 +48,8 @@
48
  "langs": [
49
  "fr"
50
  ],
51
- "layer_norm_eps": 1e-12,
52
- "layerdrop": 0.0,
53
  "lg_sampling_factor": -1,
54
  "lgs": "fr",
55
  "mask_index": 5,
@@ -64,12 +64,12 @@
64
  ]
65
  ],
66
  "model_type": "flaubert",
67
- "n_heads": 12,
68
  "n_langs": 1,
69
- "n_layers": 12,
70
  "pad_index": 2,
71
  "pad_token_id": 2,
72
- "pre_norm": false,
73
  "problem_type": "single_label_classification",
74
  "sample_alpha": 0,
75
  "share_inout_emb": true,
 
1
  {
2
+ "_name_or_path": "flaubert/flaubert_small_cased",
3
  "amp": 1,
4
  "architectures": [
5
  "FlaubertForSequenceClassification"
 
12
  "causal": false,
13
  "clip_grad_norm": 5,
14
  "dropout": 0.1,
15
+ "emb_dim": 512,
16
  "embed_init_std": 0.02209708691207961,
17
  "encoder_only": true,
18
  "end_n_top": 5,
 
48
  "langs": [
49
  "fr"
50
  ],
51
+ "layer_norm_eps": 1e-06,
52
+ "layerdrop": 0.2,
53
  "lg_sampling_factor": -1,
54
  "lgs": "fr",
55
  "mask_index": 5,
 
64
  ]
65
  ],
66
  "model_type": "flaubert",
67
+ "n_heads": 8,
68
  "n_langs": 1,
69
+ "n_layers": 6,
70
  "pad_index": 2,
71
  "pad_token_id": 2,
72
+ "pre_norm": true,
73
  "problem_type": "single_label_classification",
74
  "sample_alpha": 0,
75
  "share_inout_emb": true,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f2d5fa6cc61a3a44534f439e4f30e229baa422072c279ee983f0e20bdbeb39b
3
- size 553012965
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d35855a79c71f7c2afb0f02667fed5bb4c0378f46998b1d0f574fad5d23f28c
3
+ size 217510949
runs/May15_16-33-14_00a28a6b8d46/1684168508.8759987/events.out.tfevents.1684168508.00a28a6b8d46.15988.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed81ee94cd0d1e9a641656d678e7e879786566ed129d41edc3dc59b18e5ed305
3
+ size 5892
runs/May15_16-33-14_00a28a6b8d46/events.out.tfevents.1684168508.00a28a6b8d46.15988.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6877e7a5bdee7f6ad611661d0e17294b43c0cf11880cc2dde715bad7af476e30
3
+ size 5229
runs/May15_16-45-45_00a28a6b8d46/1684169201.8727658/events.out.tfevents.1684169201.00a28a6b8d46.15988.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bac9e7001c1a569f5a5e8018f853713b92b2fd67013d95e6b60e73568ff8d21d
3
+ size 5898
runs/May15_16-45-45_00a28a6b8d46/events.out.tfevents.1684169201.00a28a6b8d46.15988.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44d1ac9572be2742333b78f19b13dcf65fc431236ec95e44f0ffd441f4ca19a3
3
+ size 5213
runs/May15_16-49-34_00a28a6b8d46/1684169406.4611292/events.out.tfevents.1684169406.00a28a6b8d46.15988.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:236fd249d4dd841c48b1ebc75fbd271c50a675800f209497650d373e62368217
3
+ size 5898
runs/May15_16-49-34_00a28a6b8d46/events.out.tfevents.1684169406.00a28a6b8d46.15988.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24132fdcf2191c10b34332be646b8b676eb249e50874d1aa47c0edc21d68c78d
3
+ size 5536
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cfa561034f17a42f3883392bfbd5eb29f288266ae58fc3a8f4b70e2e5eb9fd9
3
  size 3899
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c78aaade2fe753729aa5b791e3a81bb88924b327043cf60e0787548880541005
3
  size 3899