-
Notifications
You must be signed in to change notification settings - Fork 33
/
constants.py
39 lines (29 loc) · 1.12 KB
/
constants.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# CONSTANTS YOU NEED TO MODIFY
#whether to train on GPU
CUDA=True
# root directory that contains the training/testing data
DATA_HOME="/dfs/scratch0/reddit/conflict/prediction"
LOG_DIR="/dfs/scratch0/reddit/conflict/prediction"
#whether to show results on the test set
PRINT_TEST=False
# CONSTANTS YOU MAY WANT TO MODIFY (BUT DON"T NEED TO)
TRAIN_DATA=DATA_HOME+"/preprocessed_train_data.pkl"
VAL_DATA=DATA_HOME+"/preprocessed_val_data.pkl"
TEST_DATA=DATA_HOME+"/preprocessed_test_data.pkl"
BATCH_SIZE=512
#NOTE: THESE PREPROCESSED FILES HAVE A FIXED BATCH SIZE
WORD_EMBEDS=DATA_HOME+"/embeddings/glove_word_embeds.txt"
USER_EMBEDS=DATA_HOME+"/embeddings/user_vecs.npy"
USER_IDS=DATA_HOME+"/embeddings/user_vecs.vocab"
SUBREDDIT_EMBEDS=DATA_HOME+"/embeddings/sub_vecs.npy"
SUBREDDIT_IDS=DATA_HOME+"/embeddings/sub_vecs.vocab"
POST_INFO=DATA_HOME+"/detailed_data/post_crosslink_info.tsv"
LABEL_INFO=DATA_HOME+"/detailed_data/label_info.tsv"
PREPROCESSED_DATA=DATA_HOME+"/detailed_data/tokenized_posts.tsv"
VOCAB_SIZE = 174558
NUM_USERS = 118381
NUM_SUBREDDITS = 51278
WORD_EMBED_DIM = 300
METAFEAT_LEN = 263
NUM_CLASSES = 1
MAX_LEN=50