-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpipeline.yaml
57 lines (57 loc) · 1.88 KB
/
pipeline.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
---
# Pipeline definition: an ordered list of container jobs.
#
# Keys used by the entries below:
#   name          unique identifier; other entries refer to it in `dependencies`
#   image_repo    container image repository to run
#   tag           image tag (only set on some entries)
#   info_link     URL with background information on the job
#   desc          human-readable description of the job
#   env_vars      mapping of environment variable name -> value
#   volumes       mapping of host path -> {bind, mode}
#   dependencies  names of other entries in this list
#
# NOTE(review): presumably the runner starts an entry only after every entry
# listed under its `dependencies` has finished - confirm against the consumer.
CovidGraphPipeline:
  - name: CREATE_FULL_TEXT_INDEXES
    image_repo: covidgraph/graph-processing-fulltext-indexes

  - name: JHU
    image_repo: covidgraph/data_jhu_population
    dependencies:
      - CREATE_FULL_TEXT_INDEXES

  - name: BIOBASE
    info_link: https://git.connect.dzd-ev.de/dzdconnectpipeline/dataloading_biobase
    desc: Load different bio science repos into neo4j
    image_repo: registry-gl.connect.dzd-ev.de:443/dzdconnectpipeline/dataloading_biobase
    tag: prod
    env_vars:
      RUN_MODE: NotTest

  - name: ONTOLOGIES
    info_link: https://git.connect.dzd-ev.de/dzdconnectpipeline/dataloading_ontologies
    desc: Load biomedical ontologies and mappings from biomedical entities to ontologies.
    image_repo: registry-gl.connect.dzd-ev.de:443/dzdconnectpipeline/dataloading_ontologies
    tag: prod
    env_vars:
      # Comma-separated list kept as a single string value.
      OBO_ONTOLOGIES: go,doid,mp,pato,hp
    dependencies:
      - BIOBASE

  - name: LENS_PATENT_DATA
    image_repo: covidgraph/data-lens-org-covid19-patents

  - name: CORD19
    image_repo: covidgraph/data-cord19
    env_vars:
      # NOTE(review): these parse as YAML integers, not strings - confirm the
      # consumer stringifies them before handing them to the container.
      CONFIGS_PAPER_BATCH_SIZE: 300
      CONFIGS_NO_OF_PROCESSES: 12
    # Host path -> bind target and access mode.
    volumes:
      /tmp/data/cord19:
        bind: /app/dataset
        mode: rw

  - name: TEXT_FRAGGER
    image_repo: covidgraph/graph-processing_fragmentize_text
    dependencies:
      - CORD19
      - LENS_PATENT_DATA

  - name: TEXT_GENE_MATCH
    image_repo: covidgraph/graph-processing_text_gene_match
    dependencies:
      - CORD19
      - LENS_PATENT_DATA
      - BIOBASE
      - TEXT_FRAGGER

  - name: CLINICAL_TRIALS_GOV
    image_repo: covidgraph/data-clinical_trials_gov

  - name: HELOMICS_HETIONET
    image_repo: helomics/data_hetionet

  - name: BIOBERT
    image_repo: covidgraph/data-biobert
    dependencies:
      - CORD19

  - name: MASYMOS
    image_repo: covidgraph/data_masymos
    env_vars:
      # Placeholder left as a plain (unquoted) scalar on purpose; how and when
      # it is expanded is not visible in this file - verify against the consumer.
      SOURCE: ${MASYMOS_SOURCE_FILE}
    dependencies:
      - CORD19