forked from stevenshave/SimilarityLab
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconfig.py
More file actions
37 lines (31 loc) · 1.86 KB
/
config.py
File metadata and controls
37 lines (31 loc) · 1.86 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
import os
from pathlib import Path
class Config(object):
SECRET_KEY = os.environ.get('FLASK_SECRET_KEY') or '3Sy63TSRyVBaq6G37Ch7lXYMLQPuYgkUfRAN1Av4ltc'
CELERY_BROKER_URL = 'redis://localhost:6379/0'
#CELERY_RESULT_BACKEND = 'redis://localhost:6379/0'
DATASETS_DIRECTORY=Path("/home/ubuntu/data/")
# Datasets take as arguments: Unique ID, SDF filename prefix, Description
DATASETS=[
[2, "eMolecules202103-qed-0.67", "eMolecules-2021-03 Druglike (QED>=0.67, 12,708,687 unique molecules)"],
[3, "eMolecules202103", "eMolecules-2021-03 (29,368,630 unique molecules)"],
[0, "10ktestset", "Small set of 10k druglike molecules (QED scores > 0.9)"],
[1, "selechem-fdaapproved", "FDA approved drugs from Selleckchem (2,238 unique molecules)"],
[4, "drugbank", "Drugbank 5.1.8 (10,081 unique molecules)"],
]
NUM_TO_KEEP_CHOICES=[100,200,500,1000,2000]
assert len(set([d[0] for d in DATASETS]))==len(DATASETS), "Not all dataset IDs unique"
QUERY_SIMILARS_DIRECTORY=DATASETS_DIRECTORY/"queries/similars/"
QUERY_TARGETS_DIRECTORY=DATASETS_DIRECTORY/"queries/targets/"
CHEMBL_VERSION_NUMBER=28
CHEMBL_USRCATSL_ROOT=DATASETS_DIRECTORY/"chembl28_actives.sdf.usrcatsl"
CHEMBL_USRCATSL_BIN=Path(str(CHEMBL_USRCATSL_ROOT)+".bin")
assert(CHEMBL_USRCATSL_BIN.exists()),"Missing bin file"
CHEMBL_USRCATSL_SMI=Path(str(CHEMBL_USRCATSL_ROOT)+".smi")
assert (CHEMBL_USRCATSL_SMI), "Missing smiles file"
CCHEMBLID_TO_TCHEMBLIDS_PATH=DATASETS_DIRECTORY/"cchemblid_to_tchemblids.json"
assert CCHEMBLID_TO_TCHEMBLIDS_PATH.exists(), "Missing cchemblid_to_tchemblids.json"
TCHEMBLIDS_TO_PREFNAMES_PATH=DATASETS_DIRECTORY/"tchemblids_to_prefnames.json"
assert TCHEMBLIDS_TO_PREFNAMES_PATH.exists(), "Missing tchemblids_to_prefnames.json"
CCHEMBLID_TO_TCHEMBLIDS=None
TCHEMBLIDS_TO_PREFNAMES=None