Training in progress, epoch 1

Files changed (9) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "flaubert/flaubert_base_cased",
   "amp": 1,
   "architectures": [
     "FlaubertForSequenceClassification"
@@ -12,7 +12,7 @@
   "causal": false,
   "clip_grad_norm": 5,
   "dropout": 0.1,
-  "emb_dim": 768,
   "embed_init_std": 0.02209708691207961,
   "encoder_only": true,
   "end_n_top": 5,
@@ -48,8 +48,8 @@
   "langs": [
     "fr"
   ],
-  "layer_norm_eps": 1e-12,
-  "layerdrop": 0.0,
   "lg_sampling_factor": -1,
   "lgs": "fr",
   "mask_index": 5,
@@ -64,12 +64,12 @@
     ]
   ],
   "model_type": "flaubert",
-  "n_heads": 12,
   "n_langs": 1,
-  "n_layers": 12,
   "pad_index": 2,
   "pad_token_id": 2,
-  "pre_norm": false,
   "problem_type": "single_label_classification",
   "sample_alpha": 0,
   "share_inout_emb": true,

 {
+  "_name_or_path": "flaubert/flaubert_small_cased",
   "amp": 1,
   "architectures": [
     "FlaubertForSequenceClassification"
   "causal": false,
   "clip_grad_norm": 5,
   "dropout": 0.1,
+  "emb_dim": 512,
   "embed_init_std": 0.02209708691207961,
   "encoder_only": true,
   "end_n_top": 5,
   "langs": [
     "fr"
   ],
+  "layer_norm_eps": 1e-06,
+  "layerdrop": 0.2,
   "lg_sampling_factor": -1,
   "lgs": "fr",
   "mask_index": 5,
     ]
   ],
   "model_type": "flaubert",
+  "n_heads": 8,
   "n_langs": 1,
+  "n_layers": 6,
   "pad_index": 2,
   "pad_token_id": 2,
+  "pre_norm": true,
   "problem_type": "single_label_classification",
   "sample_alpha": 0,
   "share_inout_emb": true,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8f2d5fa6cc61a3a44534f439e4f30e229baa422072c279ee983f0e20bdbeb39b
-size 553012965

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d35855a79c71f7c2afb0f02667fed5bb4c0378f46998b1d0f574fad5d23f28c
+size 217510949

runs/May15_16-33-14_00a28a6b8d46/1684168508.8759987/events.out.tfevents.1684168508.00a28a6b8d46.15988.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ed81ee94cd0d1e9a641656d678e7e879786566ed129d41edc3dc59b18e5ed305
+size 5892

runs/May15_16-33-14_00a28a6b8d46/events.out.tfevents.1684168508.00a28a6b8d46.15988.4 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6877e7a5bdee7f6ad611661d0e17294b43c0cf11880cc2dde715bad7af476e30
+size 5229

runs/May15_16-45-45_00a28a6b8d46/1684169201.8727658/events.out.tfevents.1684169201.00a28a6b8d46.15988.7 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:bac9e7001c1a569f5a5e8018f853713b92b2fd67013d95e6b60e73568ff8d21d
+size 5898

runs/May15_16-45-45_00a28a6b8d46/events.out.tfevents.1684169201.00a28a6b8d46.15988.6 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:44d1ac9572be2742333b78f19b13dcf65fc431236ec95e44f0ffd441f4ca19a3
+size 5213

runs/May15_16-49-34_00a28a6b8d46/1684169406.4611292/events.out.tfevents.1684169406.00a28a6b8d46.15988.9 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:236fd249d4dd841c48b1ebc75fbd271c50a675800f209497650d373e62368217
+size 5898

runs/May15_16-49-34_00a28a6b8d46/events.out.tfevents.1684169406.00a28a6b8d46.15988.8 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:24132fdcf2191c10b34332be646b8b676eb249e50874d1aa47c0edc21d68c78d
+size 5536

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6cfa561034f17a42f3883392bfbd5eb29f288266ae58fc3a8f4b70e2e5eb9fd9
 size 3899

 version https://git-lfs.github.com/spec/v1
+oid sha256:c78aaade2fe753729aa5b791e3a81bb88924b327043cf60e0787548880541005
 size 3899