JonnyBP committed on
Commit
273e995
·
1 Parent(s): 6cef02d

feat: add features.yaml. #3

Browse files
Files changed (1) hide show
  1. configs/features.yaml +22 -0
configs/features.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ preprocessing:
2
+ lowercase: true
3
+ remove_urls: true
4
+ remove_mentions: true
5
+ remove_emojis: true
6
+ remove_special_chars: true
7
+ remove_stopwords: true
8
+ lemmatize: true
9
+ min_token_length: 2
10
+ language: en
11
+
12
+ vectorization:
13
+ method: tfidf # tfidf | bow | both
14
+ tfidf:
15
+ max_features: 10000
16
+ ngram_range: [1, 2]
17
+ sublinear_tf: true
18
+ min_df: 2
19
+ bow:
20
+ max_features: 10000
21
+ ngram_range: [1, 1]
22
+ min_df: 2