# pubrunner.yml
# PubRunner project description for the FoodRelations pipeline.
name: FoodRelations
# NOTE(review): unquoted, so YAML loads this as the float 0.1. Quote it if the
# consumer expects a version string — confirm before changing.
version: 0.1
url: https://github.com/jakelever/foodrelations

# Input resources, grouped under the keys `all`, `full` and `test`.
resources:
  # NOTE(review): FOODON is listed here, but no build/run command below
  # references {IN:FOODON}; food.json is copied from the working directory.
  all:
    - PUBCHEM
    - FOODON
  # Corpora for the full run, each with the option `format: bioc`.
  full:
    - PUBMED:
        format: bioc
    - AGRICOLA:
        format: bioc
  # Two-file variants for the test run. Each carries a `rename` option set to
  # the name of its full-run counterpart — presumably so the run commands can
  # refer to {IN:PUBMED} / {IN:AGRICOLA} in both modes; verify against
  # the PubRunner documentation.
  test:
    - PUBMED_TWOFILES:
        rename: PUBMED
        format: bioc
    - AGRICOLA_TWOFILES:
        rename: AGRICOLA
        format: bioc

# Commands that prepare the two word lists (chemical.json, food.json).
# Long commands use a folded scalar (>-): the lines are joined with single
# spaces, so each entry is still one single-line command string.
build:
  - >-
    python generateDrugTerms.py
    --pubChemMeshPharmFile {IN:PUBCHEM}/MeSH-Pharm
    --stopwords stopwords.chemical.plusCommon.txt
    --outFile {OUT:chemical.json}
  - cp food.json {OUT:food.json}

# Co-occurrence extraction over each corpus, then a merge of the per-file
# outputs from tmp/ into results.txt.
# NOTE(review): both extraction commands write to tmp/%.cooccurrences; if the
# two corpora can yield the same value for %, outputs would collide — confirm.
run:
  - >-
    python cooccurrenceExtractor.py
    --biocFile {IN:AGRICOLA/%}
    --wordlist1 {IN:food.json}
    --wordlist2 {IN:chemical.json}
    --outFile {OUT:tmp/%.cooccurrences}
  - >-
    python cooccurrenceExtractor.py
    --biocFile {IN:PUBMED/%}
    --wordlist1 {IN:food.json}
    --wordlist2 {IN:chemical.json}
    --outFile {OUT:tmp/%.cooccurrences}
  - python combineCooccurrences.py --inDir {IN:tmp} --outFile {OUT:results.txt}

output: results.txt