forked from VEuPathDB/stable_identifier_authority
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrun_new_organism_allocation.py
63 lines (53 loc) · 3.16 KB
/
run_new_organism_allocation.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
"""
Copyright [2017-2021] EMBL-European Bioinformatics Institute
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
"""
import configparser
import sys
from allocation_service.event_input import GffFilePasser
from allocation_service.annotation_events import EventCollection
from allocation_service.osid_service import OSIDService
from allocation_service.event_output import GFFAnnotations, AnnotationEventFile, SessionService
from session_service.rest_api import DataBaseConnection, AssigningApplication, ProductionDatabase
def load_allocation_config(config_path):
    """Parse the allocation pipeline INI file at ``config_path``.

    ``ConfigParser.read`` silently skips files it cannot open and returns the
    list of files it actually parsed. Without a check, a missing file only
    shows up later as an unrelated ``KeyError`` on the first section lookup,
    so exit here with an explicit message instead.

    :param config_path: path to the allocation pipeline configuration file.
    :return: the populated ``configparser.ConfigParser`` instance.
    :raises SystemExit: if the configuration file could not be read.
    """
    parser = configparser.ConfigParser()
    if not parser.read(config_path):
        sys.exit('Cannot read allocation configuration file: {}'.format(config_path))
    return parser


if __name__ == '__main__':
    # Both paths are relative, so the script must be run from the repository root.
    allocation_config_file = './allocation_service/allocation_pipeline.conf'
    session_config_file = './session_service/session_service.conf'

    allocation_config = load_allocation_config(allocation_config_file)

    # [PIPELINE]: identifies this pipeline and supplies the commit message.
    pipeline_name = allocation_config['PIPELINE']['name']
    pipeline_version = allocation_config['PIPELINE']['version']
    commit_message = allocation_config['PIPELINE']['message']

    # [FILE]: input/output locations and the filters passed to the GFF reader.
    input_gff_path = allocation_config['FILE']['input_gff']
    output_gff_path = allocation_config['FILE']['output_gff']
    event_file_path = allocation_config['FILE']['event']
    allowed_gene_models = allocation_config['FILE']['allowed_gene_models']
    allowed_bio_types = allocation_config['FILE']['allowed_bio_types']

    # [ProductionOrganism]: organism and production database names.
    organism_production_name = allocation_config['ProductionOrganism']['name']
    production_database_name = allocation_config['ProductionOrganism']['database']

    # Build the event collection from the input GFF and the OSID service.
    event_input = GffFilePasser(input_gff_path, allowed_gene_models, allowed_bio_types)
    osid_service = OSIDService(allocation_config)
    event_collection = EventCollection(organism_production_name, event_input, osid_service)
    event_collection.create()

    # The pipeline (name + version) must already be known to the session database.
    session_database = DataBaseConnection(session_config_file)
    assigning_application = AssigningApplication(session_database)
    application_id = assigning_application.get(name=pipeline_name, version=pipeline_version)
    if not application_id:
        sys.exit('Please add the assigning pipeline to the assigning_application table in the session database')

    # Look up the production database by name, creating the record if the lookup is falsy.
    production_database = ProductionDatabase(session_database)
    production_database_id = production_database.get(name=production_database_name)
    if not production_database_id:
        production_database_id = production_database.post(name=production_database_name)

    # NOTE(review): the instance is never used again in this script; presumably
    # constructing it is what records the session - confirm against SessionService.
    session_service = SessionService(session_database, application_id, production_database_id,
                                     commit_message, event_collection)

    # Write the annotated GFF and the annotation event file.
    gff_annotation = GFFAnnotations(input_gff_path, output_gff_path, event_collection)
    gff_annotation.annotate_gff()
    event_file = AnnotationEventFile(event_collection, event_file_path)
    event_file.write_event_file()