-
Notifications
You must be signed in to change notification settings - Fork 0
/
config-qm7drugs.py
60 lines (60 loc) · 1.61 KB
/
config-qm7drugs.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
# Drug names shared by the target list and the averaged-plot list.
# Corresponding names must be in targets/targets.csv.
_DRUG_NAMES = (
    "sildenafil",
    "penicillin",
    "troglitazone",
    "imatinib",
    "pemetrexed",
    "oxycodone",
    "pregabalin",
    "apixaban",
    "salbutamol",
    "oseltamivir",
)

config = {
    # --- locations (absolute paths) ---
    "repository_folder": "/home/haeberle/molekuehl/",
    # --- run identity ---
    "config_name": "qm7drugs",
    "database": "qm7",
    "representation": "FCHL",
    # --- targets ---
    # Each entry gets its own list object so the two stay independent.
    "target_names": list(_DRUG_NAMES),
    "in_database": False,
    "plot_average_target_names": list(_DRUG_NAMES),
    # --- boolean switches (all enabled in this configuration) ---
    "generate_database": True,
    "generate_targets": True,
    "cur_subset": True,
    "fps_subset": True,
    "sml_subset": True,
    "algo_model": True,
    "algo_subset": True,
    # --- methods listed per output kind ---
    # NOTE: "learning_curves" lists "sml" before "fps"; the two plot
    # lists use the opposite order. Both orders are kept as given.
    "learning_curves": ["algo", "sml", "fps", "cur", "random"],
    "plots_individual": ["algo", "fps", "sml", "cur", "random"],
    "plots_average": ["algo", "fps", "sml", "cur", "random"],
    # --- subset-selection settings ---
    "scope": "local_vector",
    "penalty": 0,
    "duplicates": 1,
    "timelimit": 10 * 60 * 60,  # 10 hours, in seconds
    "PoolSearchMode": 2,
    "number_of_fragments": 1 << 10,  # size of subset selected (1024)
    "verbose": True,
    # --- learning-curve settings ---
    # Powers of two from 2**4 (16) up to 2**10 (1024).
    "learning_curve_ticks": [1 << exponent for exponent in range(4, 11)],
    "FPS_timelimit": 10 * 60,  # 10 mins, in seconds
    # --- random baseline ---
    # Left unset on purpose: for multiple random subset selection,
    # don't use a fixed state!
    "random_state": None,
    "CV": 5,  # number of cross-validation for random learning curves
}