SadeghK committed on
Commit
1795dc9
·
verified ·
1 Parent(s): d2e52c5

Uploading the model files for PL-BERT for Persian

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ step_305000_loss=1.4_val_loss=0.35_token_loss=1.2.t7 filter=lfs diff=lfs merge=lfs -text
config_fa.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ log_dir: "Checkpoint_fa"
2
+ mixed_precision: "fp16"
3
+ data_folder: "wikipedia_fa.processed"
4
+ batch_size: 48
5
+ save_interval: 5000
6
+ log_interval: 10
7
+ num_process: 1 # number of GPUs
8
+ num_steps: 2000000
9
+
10
+ dataset_params:
11
+ tokenizer: "HooshvareLab/bert-base-parsbert-uncased"
12
+ token_separator: " " # token used for phoneme separator (space)
13
+ token_mask: "M" # token used for phoneme mask (M)
14
+ word_separator: 3039 # token used for word separator (<formula>)
15
+ token_maps: "token_fa_maps.pkl" # token map path
16
+
17
+ max_mel_length: 512 # max phoneme length
18
+
19
+ word_mask_prob: 0.15 # probability to mask the entire word
20
+ phoneme_mask_prob: 0.1 # probability to mask each phoneme
21
+ replace_prob: 0.2 # probability to replace phonemes
22
+
23
+ model_params:
24
+ vocab_size: 178
25
+ hidden_size: 768
26
+ num_attention_heads: 12
27
+ intermediate_size: 2048
28
+ max_position_embeddings: 512
29
+ num_hidden_layers: 12
30
+ dropout: 0.1
step_305000_loss=1.4_val_loss=0.35_token_loss=1.2.t7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57b1af0d1985e967acce8691ae4a04bb1e44f881fc6fc9c30321aacdbf1a32bd
3
+ size 764258718
token_fa_maps.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6751f277ecad951f541adbed21d6d92a38e5307c5a2b935714a59abb214b89c
3
+ size 2228273
wikipedia_fa.processed.tar.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b898fe466fba4c6d4b8511d0aae8aed42d894038a683dae24bed350646afe874
3
+ size 171694383