File size: 775 Bytes
9e2ba5f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# Filesystem locations.
# Every path here is relative ("../..."), so it resolves against the
# process's current working directory rather than against this file.

# Directories (each ends with a trailing slash so file names can be appended directly).
DATA_DIR = "../inputs/"
MODEL_DIR = "../models/"
IMAGES = "../images/"

# CSV files located directly inside DATA_DIR.
ORIGINAL_TRAIN = f"{DATA_DIR}train.csv"
MODIFIED_TRAIN = f"{DATA_DIR}modified_train.csv"
TEST_DATA = f"{DATA_DIR}test.csv"
MODIFIED_TEST = f"{DATA_DIR}modified_test.csv"
SUBMISSION = f"{DATA_DIR}sample_submission.csv"

# Feature field names.
# NOTE(review): presumably these are column names in the train/test CSVs —
# confirm against the data-loading code.
ID = "id"
TEXT = "text"
KEYWORD = "keyword"
LOCATION = "location"
# NOTE(review): presumably the column holding each row's cross-validation
# fold index — confirm where it is written.
FOLD = "kfold"
# NOTE(review): presumably holds the tokenized form of the text — confirm.
TOKENS = "tokens"

# Created (derived) feature names.
# NOTE(review): presumably produced by preprocessing rather than present in
# the raw input files — confirm.
ALL_TEXT = "all_text"
CLEANED_TEXT = "cleaned_text"

# Target field names.
TARGET = "target"
# NOTE(review): presumably a corrected copy of the target labels — confirm
# where it is created and which of the two the training code reads.
RELABELED_TARGET = "relabeled_target"

# Pretrained Word2Vec
# Identifier of the pretrained embedding model.
# NOTE(review): looks like a gensim-downloader model name — confirm against
# the code that loads it.
PRETRAINED_WORD2VEC = "word2vec-google-news-300"
# Equals the trailing "300" in the model name above.
# NOTE(review): presumably the embedding vector dimensionality; keep the two
# in sync if the model is swapped — confirm.
EMBED_SIZE = 300

# Training hyperparameters
# NOTE(review): presumably the hidden-layer width of the model — confirm.
HIDDEN_DIM = 256
# NOTE(review): presumably the model's output width (a single value per
# example) — confirm against the model definition.
TARGET_DIM = 1
BATCH_SIZE = 32
N_EPOCHS = 8
# NOTE(review): presumably the number of cross-validation folds — confirm.
N_SPLITS = 5
LEARNING_RATE = 1e-3
# NOTE(review): hard-coded magic numbers; presumably the maximum sequence
# length and vocabulary size measured on the current dataset/tokenization.
# They likely need recomputing if the data or preprocessing changes — confirm.
MAXLEN = 202
VOCAB_SIZE = 172901