From fc5b18dd9ef931592bb4bba73a023aab4b6491ad Mon Sep 17 00:00:00 2001 From: Helena Rasche Date: Tue, 19 Dec 2023 12:46:27 +0100 Subject: [PATCH] cleanups --- _plugins/jekyll-topic-filter.rb | 14 +- .../tutorials/minerva-pathways/tutorial.md | 17 +- ...A-Seq_BY-COVID_Pipeline__Analysis-test.yml | 212 +++++ ...ow-mRNA-Seq_BY-COVID_Pipeline__Analysis.ga | 809 ++++++++++++++++++ ...flow-mRNA-Seq_BY-COVID_Pipeline__Counts.ga | 560 ++++++++++++ 5 files changed, 1603 insertions(+), 9 deletions(-) create mode 100644 topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis-test.yml create mode 100644 topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis.ga create mode 100644 topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Counts.ga diff --git a/_plugins/jekyll-topic-filter.rb b/_plugins/jekyll-topic-filter.rb index b06bd330bc1dde..ee1603db493ce8 100644 --- a/_plugins/jekyll-topic-filter.rb +++ b/_plugins/jekyll-topic-filter.rb @@ -1,5 +1,4 @@ # frozen_string_literal: true - require 'json' require 'yaml' require './_plugins/gtn' @@ -963,6 +962,19 @@ def identify_contributors(materials, site) def identify_funders(materials, site) TopicFilter.identify_funders(materials, site) end + + def to_material(site, page) + topic = page['path'].split('/')[1] + material = page['path'].split('/')[3] + ret = TopicFilter.fetch_tutorial_material(site, topic, material) + Jekyll.logger.warning "Could not find material #{topic} #{material}" if ret.nil? 
+ ret + end + + def get_workflow(site, page, workflow) + mat = self.to_material(site, page) + mat['workflows'].select{|w| w['workflow'] == workflow }[0] + end end end diff --git a/topics/transcriptomics/tutorials/minerva-pathways/tutorial.md b/topics/transcriptomics/tutorials/minerva-pathways/tutorial.md index 0383dd41b0cc68..b3bfda5e03e1f9 100644 --- a/topics/transcriptomics/tutorials/minerva-pathways/tutorial.md +++ b/topics/transcriptomics/tutorials/minerva-pathways/tutorial.md @@ -142,8 +142,6 @@ work. > {: .hands_on} -## Data Download - ## Analysis We have split this workflow into two parts, based only on how long the first portion of the workflow takes to execute. The rough runtime of the workflow portions when this was being developed can be broken down as follows: @@ -161,7 +159,7 @@ As such we recommend you skip to [Limma](#limma) to progress to the efficient portion. The data provided in the Zenodo record is from the entire analysis, analysed with the Counts step that can be skipped: -### Counts +### Data Download We'll start by downloading our fastq files from the [GEO Dataset GSE182152](https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE182152) @@ -182,13 +180,16 @@ We'll start by downloading our fastq files from the [GEO Dataset GSE182152](http > {: .hands_on} +### Counts + + With that done, we can start to analyse the data using HISAT2 and featureCounts > Run the Workflow > > 1. **Import the workflow** into Galaxy > -> {% snippet faqs/galaxy/workflows_run_wfh.md title="mRNA-Seq BY-COVID Pipeline" wfhub_id="688" %} +> {% snippet faqs/galaxy/workflows_run_wfh.md title="mRNA-Seq BY-COVID Pipeline" wfhub_id="688" box_type="none" %} > {: .hands_on} @@ -273,9 +274,9 @@ MultiQC report. Looking at the report we see generally reasonable quality data. > - Click `Build` > > 1. 
From **Rules** menu, select `Add / Modify Column Definitions` -> - `Add Definition`, `Collection Name`, Select Column `C` -> - `Add Definition`, `List Identifier(s)`, Select Column `B` -> - `Add Definition`, `URL`, Column `A` +> - `Add Definition` → `Collection Name` → Select Column `C` +> - `Add Definition` → `List Identifier(s)` → Select Column `B` +> - `Add Definition` → `URL` → Column `A` > {: .hands_on} @@ -284,7 +285,7 @@ MultiQC report. Looking at the report we see generally reasonable quality data. > > 1. Run the workflow with the Factor Data from the first Hands on, and the datasets from the workflow or Zenodo download, depending on your path: > -> {% snippet faqs/galaxy/workflows_run_wfh.md title="mRNA-Seq BY-COVID Pipeline" wfhub_id="689" %} +> {% snippet faqs/galaxy/workflows_run_wfh.md title="mRNA-Seq BY-COVID Pipeline" wfhub_id="689" box_type="none" %} > {: .hands_on} diff --git a/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis-test.yml b/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis-test.yml new file mode 100644 index 00000000000000..4fab0ff351e770 --- /dev/null +++ b/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis-test.yml @@ -0,0 +1,212 @@ +- doc: Test outline for mRNA-Seq-BY-COVID-Pipeline-Analysis + job: + factordata: + class: File + location: https://zenodo.org/records/10405036/files/factordata.tabular + filetype: tabular + 'featureCounts: Counts': + class: Collection + collection_type: list + elements: + - class: File + identifier: SRR15462516 + location: https://zenodo.org/records/10405036/files/SRR15462516.featureCounts.tabular + - class: File + identifier: SRR15462517 + location: https://zenodo.org/records/10405036/files/SRR15462517.featureCounts.tabular + - class: File + identifier: SRR15462518 + location: 
https://zenodo.org/records/10405036/files/SRR15462518.featureCounts.tabular + - class: File + identifier: SRR15462519 + location: https://zenodo.org/records/10405036/files/SRR15462519.featureCounts.tabular + - class: File + identifier: SRR15462520 + location: https://zenodo.org/records/10405036/files/SRR15462520.featureCounts.tabular + - class: File + identifier: SRR15462521 + location: https://zenodo.org/records/10405036/files/SRR15462521.featureCounts.tabular + - class: File + identifier: SRR15462522 + location: https://zenodo.org/records/10405036/files/SRR15462522.featureCounts.tabular + - class: File + identifier: SRR15462523 + location: https://zenodo.org/records/10405036/files/SRR15462523.featureCounts.tabular + - class: File + identifier: SRR15462524 + location: https://zenodo.org/records/10405036/files/SRR15462524.featureCounts.tabular + - class: File + identifier: SRR15462525 + location: https://zenodo.org/records/10405036/files/SRR15462525.featureCounts.tabular + - class: File + identifier: SRR15462526 + location: https://zenodo.org/records/10405036/files/SRR15462526.featureCounts.tabular + - class: File + identifier: SRR15462527 + location: https://zenodo.org/records/10405036/files/SRR15462527.featureCounts.tabular + - class: File + identifier: SRR15462528 + location: https://zenodo.org/records/10405036/files/SRR15462528.featureCounts.tabular + - class: File + identifier: SRR15462529 + location: https://zenodo.org/records/10405036/files/SRR15462529.featureCounts.tabular + - class: File + identifier: SRR15462530 + location: https://zenodo.org/records/10405036/files/SRR15462530.featureCounts.tabular + - class: File + identifier: SRR16681520 + location: https://zenodo.org/records/10405036/files/SRR16681520.featureCounts.tabular + - class: File + identifier: SRR16681521 + location: https://zenodo.org/records/10405036/files/SRR16681521.featureCounts.tabular + - class: File + identifier: SRR16681522 + location: 
https://zenodo.org/records/10405036/files/SRR16681522.featureCounts.tabular + - class: File + identifier: SRR16681523 + location: https://zenodo.org/records/10405036/files/SRR16681523.featureCounts.tabular + - class: File + identifier: SRR16681524 + location: https://zenodo.org/records/10405036/files/SRR16681524.featureCounts.tabular + - class: File + identifier: SRR16681525 + location: https://zenodo.org/records/10405036/files/SRR16681525.featureCounts.tabular + - class: File + identifier: SRR16681526 + location: https://zenodo.org/records/10405036/files/SRR16681526.featureCounts.tabular + - class: File + identifier: SRR16681527 + location: https://zenodo.org/records/10405036/files/SRR16681527.featureCounts.tabular + - class: File + identifier: SRR16681528 + location: https://zenodo.org/records/10405036/files/SRR16681528.featureCounts.tabular + - class: File + identifier: SRR16681529 + location: https://zenodo.org/records/10405036/files/SRR16681529.featureCounts.tabular + - class: File + identifier: SRR16681530 + location: https://zenodo.org/records/10405036/files/SRR16681530.featureCounts.tabular + - class: File + identifier: SRR16681531 + location: https://zenodo.org/records/10405036/files/SRR16681531.featureCounts.tabular + - class: File + identifier: SRR16681532 + location: https://zenodo.org/records/10405036/files/SRR16681532.featureCounts.tabular + - class: File + identifier: SRR16681533 + location: https://zenodo.org/records/10405036/files/SRR16681533.featureCounts.tabular + - class: File + identifier: SRR16681534 + location: https://zenodo.org/records/10405036/files/SRR16681534.featureCounts.tabular + - class: File + identifier: SRR16681535 + location: https://zenodo.org/records/10405036/files/SRR16681535.featureCounts.tabular + - class: File + identifier: SRR16681536 + location: https://zenodo.org/records/10405036/files/SRR16681536.featureCounts.tabular + - class: File + identifier: SRR16681537 + location: 
https://zenodo.org/records/10405036/files/SRR16681537.featureCounts.tabular + - class: File + identifier: SRR16681538 + location: https://zenodo.org/records/10405036/files/SRR16681538.featureCounts.tabular + - class: File + identifier: SRR16681539 + location: https://zenodo.org/records/10405036/files/SRR16681539.featureCounts.tabular + - class: File + identifier: SRR16681540 + location: https://zenodo.org/records/10405036/files/SRR16681540.featureCounts.tabular + - class: File + identifier: SRR16681541 + location: https://zenodo.org/records/10405036/files/SRR16681541.featureCounts.tabular + - class: File + identifier: SRR16681542 + location: https://zenodo.org/records/10405036/files/SRR16681542.featureCounts.tabular + - class: File + identifier: SRR16681543 + location: https://zenodo.org/records/10405036/files/SRR16681543.featureCounts.tabular + - class: File + identifier: SRR16681544 + location: https://zenodo.org/records/10405036/files/SRR16681544.featureCounts.tabular + - class: File + identifier: SRR16681545 + location: https://zenodo.org/records/10405036/files/SRR16681545.featureCounts.tabular + - class: File + identifier: SRR16681546 + location: https://zenodo.org/records/10405036/files/SRR16681546.featureCounts.tabular + - class: File + identifier: SRR16681547 + location: https://zenodo.org/records/10405036/files/SRR16681547.featureCounts.tabular + - class: File + identifier: SRR16681548 + location: https://zenodo.org/records/10405036/files/SRR16681548.featureCounts.tabular + - class: File + identifier: SRR16681549 + location: https://zenodo.org/records/10405036/files/SRR16681549.featureCounts.tabular + - class: File + identifier: SRR16681550 + location: https://zenodo.org/records/10405036/files/SRR16681550.featureCounts.tabular + - class: File + identifier: SRR16681551 + location: https://zenodo.org/records/10405036/files/SRR16681551.featureCounts.tabular + - class: File + identifier: SRR16681552 + location: 
https://zenodo.org/records/10405036/files/SRR16681552.featureCounts.tabular + - class: File + identifier: SRR16681553 + location: https://zenodo.org/records/10405036/files/SRR16681553.featureCounts.tabular + - class: File + identifier: SRR16681554 + location: https://zenodo.org/records/10405036/files/SRR16681554.featureCounts.tabular + - class: File + identifier: SRR16681555 + location: https://zenodo.org/records/10405036/files/SRR16681555.featureCounts.tabular + - class: File + identifier: SRR16681556 + location: https://zenodo.org/records/10405036/files/SRR16681556.featureCounts.tabular + - class: File + identifier: SRR16681557 + location: https://zenodo.org/records/10405036/files/SRR16681557.featureCounts.tabular + - class: File + identifier: SRR16681558 + location: https://zenodo.org/records/10405036/files/SRR16681558.featureCounts.tabular + - class: File + identifier: SRR16681559 + location: https://zenodo.org/records/10405036/files/SRR16681559.featureCounts.tabular + - class: File + identifier: SRR16681560 + location: https://zenodo.org/records/10405036/files/SRR16681560.featureCounts.tabular + - class: File + identifier: SRR16681561 + location: https://zenodo.org/records/10405036/files/SRR16681561.featureCounts.tabular + - class: File + identifier: SRR16681562 + location: https://zenodo.org/records/10405036/files/SRR16681562.featureCounts.tabular + - class: File + identifier: SRR16681563 + location: https://zenodo.org/records/10405036/files/SRR16681563.featureCounts.tabular + - class: File + identifier: SRR16681564 + location: https://zenodo.org/records/10405036/files/SRR16681564.featureCounts.tabular + - class: File + identifier: SRR16681565 + location: https://zenodo.org/records/10405036/files/SRR16681565.featureCounts.tabular + - class: File + identifier: SRR16681566 + location: https://zenodo.org/records/10405036/files/SRR16681566.featureCounts.tabular + 'featureCounts: Lengths': + class: Collection + collection_type: list + elements: + - class: File + 
identifier: gene_lengths + location: https://zenodo.org/records/10405036/files/gene_lengths.tabular + outputs: + count_data: + asserts: + has_text: + text: "SRR15462519" + minerva_table: + asserts: + has_text: + text: "TRIM25" diff --git a/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis.ga b/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis.ga new file mode 100644 index 00000000000000..e786597fa9945b --- /dev/null +++ b/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Analysis.ga @@ -0,0 +1,809 @@ +{ + "a_galaxy_workflow": "true", + "annotation": "Analyse Bulk RNA-Seq data in preparation for downstream Pathways analysis with MINERVA", + "creator": [ + { + "class": "Person", + "identifier": "0000-0002-4282-9103", + "name": "Iacopo Cristoferi" + }, + { + "class": "Person", + "identifier": "0000-0001-9760-8992", + "name": "Helena Rasche" + }, + { + "class": "Organization", + "name": "Clinical Bioinformatics Unit, Pathology Department, Eramus Medical Center" + } + ], + "format-version": "0.1", + "license": "GPL-3.0-or-later", + "name": "mRNA-Seq BY-COVID Pipeline: Analysis", + "steps": { + "0": { + "annotation": "count data collection with two column datasets (gene_id, count)", + "content_id": null, + "errors": null, + "id": 0, + "input_connections": {}, + "inputs": [ + { + "description": "count data collection with two column datasets (gene_id, count)", + "name": "featureCounts: Counts" + } + ], + "label": "featureCounts: Counts", + "name": "Input dataset collection", + "outputs": [], + "position": { + "left": 0, + "top": 26 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"tag\": null, \"collection_type\": \"list\"}", + "tool_version": null, + "type": "data_collection_input", + "uuid": "dd496c2b-e61f-4a54-8cd4-501cc302b758", + "when": null, + "workflow_outputs": [] + }, + 
"1": { + "annotation": "A two column factor table with (Sample Identifier, Condition)\n\nThis workflow assumes a 1 factor, 2 level analysis, and was specifically designed around SARS-CoV-2 analysis with two levels, e.g.\n```\nSampleName \tGroup\nSRR16683284 \tCOVID\nSRR16683283 \tCOVID SRR16683271 \thealthy\nSRR16683270 \thealthy \n```", + "content_id": null, + "errors": null, + "id": 1, + "input_connections": {}, + "inputs": [ + { + "description": "A two column factor table with (Sample Identifier, Condition)\n\nThis workflow assumes a 1 factor, 2 level analysis, and was specifically designed around SARS-CoV-2 analysis with two levels, e.g.\n```\nSampleName \tGroup\nSRR16683284 \tCOVID\nSRR16683283 \tCOVID SRR16683271 \thealthy\nSRR16683270 \thealthy \n```", + "name": "factordata" + } + ], + "label": "factordata", + "name": "Input dataset", + "outputs": [], + "position": { + "left": 840, + "top": 164 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"tag\": null}", + "tool_version": null, + "type": "data_input", + "uuid": "fa67df3e-0730-45b1-af83-ff184c28afcb", + "when": null, + "workflow_outputs": [] + }, + "2": { + "annotation": "featureCounts Lengths collection", + "content_id": null, + "errors": null, + "id": 2, + "input_connections": {}, + "inputs": [ + { + "description": "featureCounts Lengths collection", + "name": "featureCounts: Lengths" + } + ], + "label": "featureCounts: Lengths", + "name": "Input dataset collection", + "outputs": [], + "position": { + "left": 1130, + "top": 311 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"tag\": null, \"collection_type\": \"list\"}", + "tool_version": null, + "type": "data_collection_input", + "uuid": "bd753c88-7d30-4ade-b5e9-e1139390d3b4", + "when": null, + "workflow_outputs": [] + }, + "3": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/collection_column_join/collection_column_join/0.0.3", + "errors": null, + "id": 3, + "input_connections": { + 
"input_tabular": { + "id": 0, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "Column join", + "outputs": [ + { + "name": "tabular_output", + "type": "tabular" + } + ], + "position": { + "left": 280, + "top": 0 + }, + "post_job_actions": { + "HideDatasetActiontabular_output": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "tabular_output" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/collection_column_join/collection_column_join/0.0.3", + "tool_shed_repository": { + "changeset_revision": "3ddd99c7efee", + "name": "collection_column_join", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"tabular\", \"__workflow_invocation_uuid__\": \"b5e0048e20c111ee806d001e67d2ec02\", \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/hg19.len\", \"fill_char\": \".\", \"has_header\": \"1\", \"identifier_column\": \"1\", \"include_outputs\": null, \"input_tabular\": {\"__class__\": \"ConnectedValue\"}, \"old_col_in_header\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "0.0.3", + "type": "tool", + "uuid": "c0d05785-2f60-4f78-8e20-719eddd164bd", + "when": null, + "workflow_outputs": [] + }, + "4": { + "annotation": "", + "content_id": "__EXTRACT_DATASET__", + "errors": null, + "id": 4, + "input_connections": { + "input": { + "id": 2, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "Extract dataset", + "outputs": [ + { + "name": "output", + "type": "data" + } + ], + "position": { + "left": 1410, + "top": 295 + }, + "post_job_actions": { + "ChangeDatatypeActionoutput": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "output" + }, + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_id": "__EXTRACT_DATASET__", + "tool_state": "{\"input\": 
{\"__class__\": \"ConnectedValue\"}, \"which\": {\"which_dataset\": \"first\", \"__current_case__\": 0}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.0.1", + "type": "tool", + "uuid": "fac9c7f1-c3de-4125-9ab5-1c5fd5c7ba4b", + "when": null, + "workflow_outputs": [] + }, + "5": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/bgruening/text_processing/tp_sort_header_tool/1.1.1", + "errors": null, + "id": 5, + "input_connections": { + "infile": { + "id": 3, + "output_name": "tabular_output" + } + }, + "inputs": [], + "label": "countdata", + "name": "Sort", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 560, + "top": 20 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/bgruening/text_processing/tp_sort_header_tool/1.1.1", + "tool_shed_repository": { + "changeset_revision": "ddf54b12c295", + "name": "text_processing", + "owner": "bgruening", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"header\": \"0\", \"ignore_case\": false, \"infile\": {\"__class__\": \"ConnectedValue\"}, \"sortkeys\": [{\"__index__\": 0, \"column\": \"1\", \"order\": \"r\", \"style\": \"\"}], \"unique\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.1.1", + "type": "tool", + "uuid": "cef3f59c-a9a8-435c-b959-7884b12bb28d", + "when": null, + "workflow_outputs": [ + { + "label": "count_data", + "output_name": "outfile", + "uuid": "e8dcfaaf-0d8d-46eb-8cc9-ce2fbdfc45e5" + } + ] + }, + "6": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/annotatemyids/annotatemyids/3.16.0+galaxy1", + "errors": null, + "id": 6, + "input_connections": { + "id_file": { + "id": 3, + "output_name": "tabular_output" + } + }, + "inputs": [], + "label": "annodata", + "name": "annotateMyIDs", + "outputs": 
[ + { + "name": "out_tab", + "type": "tabular" + } + ], + "position": { + "left": 560, + "top": 199 + }, + "post_job_actions": { + "HideDatasetActionout_tab": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_tab" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/annotatemyids/annotatemyids/3.16.0+galaxy1", + "tool_shed_repository": { + "changeset_revision": "133f36c29579", + "name": "annotatemyids", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"tabular\", \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/hg19.len\", \"file_has_header\": true, \"id_file\": {\"__class__\": \"ConnectedValue\"}, \"id_type\": \"ENTREZID\", \"organism\": \"Hs\", \"output_cols\": [\"ENTREZID\", \"SYMBOL\", \"GENENAME\"], \"remove_dups\": false, \"rscriptOpt\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "3.16.0+galaxy1", + "type": "tool", + "uuid": "40e99045-e905-410f-a765-9ffac34426ce", + "when": null, + "workflow_outputs": [] + }, + "7": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/bgruening/text_processing/tp_replace_in_line/1.1.2", + "errors": null, + "id": 7, + "input_connections": { + "infile": { + "id": 5, + "output_name": "outfile" + } + }, + "inputs": [], + "label": null, + "name": "Replace Text", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 840, + "top": 10 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/bgruening/text_processing/tp_replace_in_line/1.1.2", + "tool_shed_repository": { + "changeset_revision": "ddf54b12c295", + "name": "text_processing", + "owner": "bgruening", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"infile\": {\"__class__\": \"ConnectedValue\"}, \"replacements\": 
[{\"__index__\": 0, \"find_pattern\": \" uncompressed.fastqsanger\", \"replace_pattern\": null}], \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.1.2", + "type": "tool", + "uuid": "58622be8-a7ee-4d09-86bc-6fc36e4f6439", + "when": null, + "workflow_outputs": [] + }, + "8": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/limma_voom/limma_voom/3.50.1+galaxy0", + "errors": null, + "id": 8, + "input_connections": { + "anno|geneanno": { + "id": 6, + "output_name": "out_tab" + }, + "input|counts": { + "id": 7, + "output_name": "outfile" + }, + "input|fact|finfo": { + "id": 1, + "output_name": "output" + } + }, + "inputs": [], + "label": "limma DEG analysis", + "name": "limma", + "outputs": [ + { + "name": "outTables", + "type": "input" + }, + { + "name": "outReport", + "type": "html" + } + ], + "position": { + "left": 1130, + "top": 32 + }, + "post_job_actions": { + "HideDatasetActionoutTables": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outTables" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/limma_voom/limma_voom/3.50.1+galaxy0", + "tool_shed_repository": { + "changeset_revision": "d6f5fa4ee473", + "name": "limma_voom", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"adv\": {\"lfc\": \"0.0\", \"pVal\": \"0.05\", \"pAdjust\": \"BH\", \"treat\": false, \"topgenes\": \"10\", \"normalisationOption\": \"TMM\", \"robOption\": true}, \"anno\": {\"annoOpt\": \"yes\", \"__current_case__\": 0, \"geneanno\": {\"__class__\": \"ConnectedValue\"}}, \"cont\": {\"cfile\": \"no\", \"__current_case__\": 1, \"rep_contrast\": [{\"__index__\": 0, \"contrast\": \"COVID-healthy\"}]}, \"deMethod\": {\"de_select\": \"voom\", \"__current_case__\": 0, \"weightOption\": false}, \"f\": {\"filt\": {\"filt_select\": \"yes\", \"__current_case__\": 0, \"cformat\": {\"format_select\": \"cpm\", \"__current_case__\": 0, \"cpmReq\": \"0.5\", \"cpmSampleReq\": \"1\"}}}, 
\"input\": {\"format\": \"matrix\", \"__current_case__\": 1, \"counts\": {\"__class__\": \"ConnectedValue\"}, \"fact\": {\"ffile\": \"yes\", \"__current_case__\": 0, \"finfo\": {\"__class__\": \"ConnectedValue\"}}}, \"out\": {\"plots\": \"i\", \"filtCounts\": false, \"normCounts\": false, \"libinfo\": false, \"rscript\": false, \"rdaOption\": false}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "3.50.1+galaxy0", + "type": "tool", + "uuid": "c53a2cee-7e2e-4e97-a946-0857a4ca88f7", + "when": null, + "workflow_outputs": [ + { + "label": "limma_report", + "output_name": "outReport", + "uuid": "1c8d7950-1003-4c86-9986-c6ed1264cd8b" + } + ] + }, + "9": { + "annotation": "", + "content_id": "__EXTRACT_DATASET__", + "errors": null, + "id": 9, + "input_connections": { + "input": { + "id": 8, + "output_name": "outTables" + } + }, + "inputs": [], + "label": null, + "name": "Extract dataset", + "outputs": [ + { + "name": "output", + "type": "data" + } + ], + "position": { + "left": 1410, + "top": 77 + }, + "post_job_actions": { + "ChangeDatatypeActionoutput": { + "action_arguments": { + "newtype": "tabular" + }, + "action_type": "ChangeDatatypeAction", + "output_name": "output" + }, + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_id": "__EXTRACT_DATASET__", + "tool_state": "{\"input\": {\"__class__\": \"ConnectedValue\"}, \"which\": {\"which_dataset\": \"first\", \"__current_case__\": 0}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.0.1", + "type": "tool", + "uuid": "abfacce9-feb6-444b-8b7f-d90c8d833a93", + "when": null, + "workflow_outputs": [] + }, + "10": { + "annotation": "", + "content_id": "Cut1", + "errors": null, + "id": 10, + "input_connections": { + "input": { + "id": 9, + "output_name": "output" + } + }, + "inputs": [], + "label": "MINERVA Formatting", + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + 
"type": "tabular" + } + ], + "position": { + "left": 1690, + "top": 99 + }, + "post_job_actions": { + "RenameDatasetActionout_file1": { + "action_arguments": { + "newname": "Minerva-Ready Table" + }, + "action_type": "RenameDatasetAction", + "output_name": "out_file1" + } + }, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"c2,c4,c7,c8\", \"delimiter\": \"T\", \"input\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.0.2", + "type": "tool", + "uuid": "71f54cbc-6a51-4703-8919-ee11f036c9fa", + "when": null, + "workflow_outputs": [ + { + "label": "minerva_table", + "output_name": "out_file1", + "uuid": "9ce4f48b-e742-4b7c-9bde-5d51f11068d3" + } + ] + }, + "11": { + "annotation": "", + "content_id": "join1", + "errors": null, + "id": 11, + "input_connections": { + "input1": { + "id": 9, + "output_name": "output" + }, + "input2": { + "id": 4, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "Join two Datasets", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 1690, + "top": 253 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_id": "join1", + "tool_state": "{\"field1\": \"1\", \"field2\": \"1\", \"fill_empty_columns\": {\"fill_empty_columns_switch\": \"no_fill\", \"__current_case__\": 0}, \"header\": \"\", \"input1\": {\"__class__\": \"ConnectedValue\"}, \"input2\": {\"__class__\": \"ConnectedValue\"}, \"partial\": \"\", \"unmatched\": \"\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "2.1.3", + "type": "tool", + "uuid": "8fa51a1e-13d2-4cc7-8d16-42987fe42372", + "when": null, + "workflow_outputs": [] + }, + "12": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.4", + "errors": null, + "id": 12, + 
"input_connections": { + "input": { + "id": 11, + "output_name": "out_file1" + } + }, + "inputs": [], + "label": null, + "name": "Compute", + "outputs": [ + { + "name": "out_file1", + "type": "input" + } + ], + "position": { + "left": 1970, + "top": 278 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/column_maker/Add_a_column1/1.4", + "tool_shed_repository": { + "changeset_revision": "9cd341095afd", + "name": "column_maker", + "owner": "devteam", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"avoid_scientific_notation\": \"no\", \"cond\": \"c8<0.05\", \"header_lines_conditional\": {\"header_lines_select\": \"no\", \"__current_case__\": 0}, \"input\": {\"__class__\": \"ConnectedValue\"}, \"round\": \"no\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.4", + "type": "tool", + "uuid": "6f0a6827-6b13-4f29-aa65-7c0f571c90a3", + "when": null, + "workflow_outputs": [] + }, + "13": { + "annotation": "", + "content_id": "Cut1", + "errors": null, + "id": 13, + "input_connections": { + "input": { + "id": 12, + "output_name": "out_file1" + } + }, + "inputs": [], + "label": null, + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 2250, + "top": 278 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"c1,c11,c12\", \"delimiter\": \"T\", \"input\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.0.2", + "type": "tool", + "uuid": "ec6527a0-b2c9-4672-9085-694359109ccc", + "when": null, + "workflow_outputs": [] + }, + "14": { + "annotation": "", + "content_id": 
"toolshed.g2.bx.psu.edu/repos/bgruening/text_processing/tp_sorted_uniq/1.1.0", + "errors": null, + "id": 14, + "input_connections": { + "infile": { + "id": 13, + "output_name": "out_file1" + } + }, + "inputs": [], + "label": null, + "name": "Unique", + "outputs": [ + { + "name": "outfile", + "type": "input" + } + ], + "position": { + "left": 2530, + "top": 268 + }, + "post_job_actions": { + "HideDatasetActionoutfile": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outfile" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/bgruening/text_processing/tp_sorted_uniq/1.1.0", + "tool_shed_repository": { + "changeset_revision": "ddf54b12c295", + "name": "text_processing", + "owner": "bgruening", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"adv_opts\": {\"adv_opts_selector\": \"advanced\", \"__current_case__\": 1, \"column_start\": \"1\", \"column_end\": \"1\"}, \"ignore_case\": false, \"infile\": {\"__class__\": \"ConnectedValue\"}, \"is_numeric\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.1.0", + "type": "tool", + "uuid": "ba06ee56-5e0b-4060-8f82-72d8f6216a3d", + "when": null, + "workflow_outputs": [] + }, + "15": { + "annotation": "", + "content_id": "Cut1", + "errors": null, + "id": 15, + "input_connections": { + "input": { + "id": 14, + "output_name": "outfile" + } + }, + "inputs": [], + "label": null, + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 2810, + "top": 278 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"c1,c3\", \"delimiter\": \"T\", \"input\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.0.2", + "type": "tool", + "uuid": 
"6aca0995-d028-4438-befd-b1bd5edf625a", + "when": null, + "workflow_outputs": [] + }, + "16": { + "annotation": "", + "content_id": "Cut1", + "errors": null, + "id": 16, + "input_connections": { + "input": { + "id": 14, + "output_name": "outfile" + } + }, + "inputs": [], + "label": null, + "name": "Cut", + "outputs": [ + { + "name": "out_file1", + "type": "tabular" + } + ], + "position": { + "left": 2810, + "top": 412 + }, + "post_job_actions": { + "HideDatasetActionout_file1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out_file1" + } + }, + "tool_id": "Cut1", + "tool_state": "{\"columnList\": \"c1,c2\", \"delimiter\": \"T\", \"input\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.0.2", + "type": "tool", + "uuid": "d1110fac-d46d-4bff-a407-47d09bd91626", + "when": null, + "workflow_outputs": [] + }, + "17": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/goseq/goseq/1.50.0+galaxy0", + "errors": null, + "id": 17, + "input_connections": { + "dge_file": { + "id": 15, + "output_name": "out_file1" + }, + "length_file": { + "id": 16, + "output_name": "out_file1" + } + }, + "inputs": [ + { + "description": "runtime parameter for tool goseq", + "name": "dge_file" + }, + { + "description": "runtime parameter for tool goseq", + "name": "length_file" + } + ], + "label": null, + "name": "goseq", + "outputs": [ + { + "name": "wallenius_tab", + "type": "tabular" + }, + { + "name": "top_plot", + "type": "pdf" + }, + { + "name": "cat_genes_tab", + "type": "tabular" + } + ], + "position": { + "left": 3090, + "top": 294 + }, + "post_job_actions": {}, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/goseq/goseq/1.50.0+galaxy0", + "tool_shed_repository": { + "changeset_revision": "602de62d995b", + "name": "goseq", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"adv\": {\"p_adj_method\": \"BH\", \"use_genes_without_cat\": 
false}, \"categorySource\": {\"catSource\": \"getgo\", \"__current_case__\": 0, \"genome\": \"hg38\", \"gene_id\": \"knownGene\", \"fetchcats\": [\"GO:CC\", \"GO:BP\", \"GO:MF\", \"KEGG\"]}, \"dge_file\": {\"__class__\": \"RuntimeValue\"}, \"length_file\": {\"__class__\": \"RuntimeValue\"}, \"methods\": {\"wallenius\": true, \"hypergeometric\": false, \"repcnt\": \"0\"}, \"out\": {\"topgo_plot\": true, \"make_plots\": false, \"cat_genes\": true, \"rdata_out\": false}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.50.0+galaxy0", + "type": "tool", + "uuid": "dfe128ab-0b7f-49f0-bb33-eb68559f6ebe", + "when": null, + "workflow_outputs": [] + } + }, + "tags": [ + "name:BY-COVID" + ], + "uuid": "bf94ada6-2c22-4cd7-b0a7-7b8ebd1556f4", + "version": 26 +} \ No newline at end of file diff --git a/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Counts.ga b/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Counts.ga new file mode 100644 index 00000000000000..4970c3a2c7cdad --- /dev/null +++ b/topics/transcriptomics/tutorials/minerva-pathways/workflows/Galaxy-Workflow-mRNA-Seq_BY-COVID_Pipeline__Counts.ga @@ -0,0 +1,560 @@ +{ + "a_galaxy_workflow": "true", + "annotation": "This portion of the workflow produces sets of feature Counts ready for analysis by limma/etc.", + "creator": [ + { + "class": "Person", + "identifier": "0000-0002-4282-9103", + "name": "Iacopo Cristoferi" + }, + { + "class": "Person", + "identifier": "0000-0001-9760-8992", + "name": "Helena Rasche" + }, + { + "class": "Organization", + "name": "Clinical Bioinformatics Unit, Pathology Department, Erasmus Medical Center" + } + ], + "format-version": "0.1", + "license": "GPL-3.0-or-later", + "name": "mRNA-Seq BY-COVID Pipeline: Counts", + "steps": { + "0": { + "annotation": "Input list of fastqsanger format sequencing data", + "content_id": null, + "errors": null, + "id": 0,
+ "input_connections": {}, + "inputs": [ + { + "description": "Input list of fastqsanger format sequencing data", + "name": "mRNA-Seq Reads" + } + ], + "label": "mRNA-Seq Reads", + "name": "Input dataset collection", + "outputs": [], + "position": { + "left": 0, + "top": 0 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"tag\": null, \"collection_type\": \"list\"}", + "tool_version": null, + "type": "data_collection_input", + "uuid": "dd496c2b-e61f-4a54-8cd4-501cc302b758", + "when": null, + "workflow_outputs": [] + }, + "1": { + "annotation": "Export of UCSC Genome, just the genes.", + "content_id": null, + "errors": null, + "id": 1, + "input_connections": {}, + "inputs": [ + { + "description": "Export of UCSC Genome, just the genes.", + "name": "UCSC Genome" + } + ], + "label": "UCSC Genome", + "name": "Input dataset", + "outputs": [], + "position": { + "left": 560, + "top": 734 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"tag\": null}", + "tool_version": null, + "type": "data_input", + "uuid": "71a430b7-df7c-46a5-8826-f881a122b376", + "when": null, + "workflow_outputs": [] + }, + "2": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/devteam/fastqc/fastqc/0.74+galaxy0", + "errors": null, + "id": 2, + "input_connections": { + "input_file": { + "id": 0, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "FastQC", + "outputs": [ + { + "name": "html_file", + "type": "html" + }, + { + "name": "text_file", + "type": "txt" + } + ], + "position": { + "left": 280, + "top": 5 + }, + "post_job_actions": { + "HideDatasetActionhtml_file": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "html_file" + }, + "HideDatasetActiontext_file": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "text_file" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/fastqc/fastqc/0.74+galaxy0", + "tool_shed_repository": { + 
"changeset_revision": "5ec9f6bceaee", + "name": "fastqc", + "owner": "devteam", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"fastqsanger.gz\", \"adapters\": null, \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/?.len\", \"contaminants\": null, \"input_file\": {\"__class__\": \"ConnectedValue\"}, \"input_file|__identifier__\": \"SRR16683252\", \"kmers\": \"7\", \"limits\": null, \"min_length\": null, \"nogroup\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "0.74+galaxy0", + "type": "tool", + "uuid": "fcd4b97f-f2cd-4779-ba55-619f89d281ab", + "when": null, + "workflow_outputs": [] + }, + "3": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/lparsons/cutadapt/cutadapt/4.4+galaxy0", + "errors": null, + "id": 3, + "input_connections": { + "library|input_1": { + "id": 0, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "Cutadapt", + "outputs": [ + { + "name": "out1", + "type": "fastqsanger" + }, + { + "name": "report", + "type": "txt" + } + ], + "position": { + "left": 280, + "top": 484 + }, + "post_job_actions": { + "HideDatasetActionout1": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "out1" + }, + "HideDatasetActionreport": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "report" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/lparsons/cutadapt/cutadapt/4.4+galaxy0", + "tool_shed_repository": { + "changeset_revision": "8c0175e03cee", + "name": "cutadapt", + "owner": "lparsons", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"input\", \"adapter_options\": {\"action\": \"trim\", \"internal\": \"\", \"error_rate\": \"0.1\", \"no_indels\": false, \"times\": \"1\", \"overlap\": \"3\", \"match_read_wildcards\": \" \", \"revcomp\": false}, \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/?.len\", \"filter_options\": 
{\"discard_trimmed\": false, \"discard_untrimmed\": false, \"minimum_length\": \"20\", \"maximum_length\": null, \"length_R2_options\": {\"length_R2_status\": \"False\", \"__current_case__\": 1}, \"max_n\": null, \"pair_filter\": \"any\", \"max_expected_errors\": null, \"discard_cassava\": false}, \"input_1|__identifier__\": \"SRR16683252\", \"library\": {\"type\": \"single\", \"__current_case__\": 0, \"input_1\": {\"__class__\": \"ConnectedValue\"}, \"r1\": {\"adapters\": [{\"__index__\": 0, \"adapter_source\": {\"adapter_source_list\": \"user\", \"__current_case__\": 0, \"adapter_name\": \"Nextera\", \"adapter\": \"CTGTCTCTTATA\"}, \"single_noindels\": false}, {\"__index__\": 1, \"adapter_source\": {\"adapter_source_list\": \"user\", \"__current_case__\": 0, \"adapter_name\": \"TruSeq\", \"adapter\": \"AGATCGGAAGAGCACACGTCTGAACTCCAGTCAC\"}, \"single_noindels\": false}], \"front_adapters\": [], \"anywhere_adapters\": [], \"cut\": \"0\"}}, \"output_selector\": [\"report\"], \"read_mod_options\": {\"quality_cutoff\": \"20\", \"nextseq_trim\": \"0\", \"trim_n\": false, \"strip_suffix\": null, \"shorten_options\": {\"shorten_values\": \"False\", \"__current_case__\": 1}, \"length_tag\": null, \"rename\": null, \"zero_cap\": false}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "4.4+galaxy0", + "type": "tool", + "uuid": "613277db-66d2-456e-ab58-b31110aa7710", + "when": null, + "workflow_outputs": [] + }, + "4": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/devteam/fastqc/fastqc/0.74+galaxy0", + "errors": null, + "id": 4, + "input_connections": { + "input_file": { + "id": 3, + "output_name": "out1" + } + }, + "inputs": [], + "label": null, + "name": "FastQC", + "outputs": [ + { + "name": "html_file", + "type": "html" + }, + { + "name": "text_file", + "type": "txt" + } + ], + "position": { + "left": 560, + "top": 154 + }, + "post_job_actions": { + "HideDatasetActionhtml_file": { + "action_arguments": {}, + "action_type": 
"HideDatasetAction", + "output_name": "html_file" + }, + "HideDatasetActiontext_file": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "text_file" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/devteam/fastqc/fastqc/0.74+galaxy0", + "tool_shed_repository": { + "changeset_revision": "5ec9f6bceaee", + "name": "fastqc", + "owner": "devteam", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"fastqsanger.gz\", \"adapters\": null, \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/?.len\", \"contaminants\": null, \"input_file\": {\"__class__\": \"ConnectedValue\"}, \"input_file|__identifier__\": \"SRR16683252\", \"kmers\": \"7\", \"limits\": null, \"min_length\": null, \"nogroup\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "0.74+galaxy0", + "type": "tool", + "uuid": "d98ef5cd-bcac-4144-8c3a-08f37719bcb8", + "when": null, + "workflow_outputs": [] + }, + "5": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/hisat2/hisat2/2.2.1+galaxy1", + "errors": null, + "id": 5, + "input_connections": { + "library|input_1": { + "id": 3, + "output_name": "out1" + } + }, + "inputs": [], + "label": null, + "name": "HISAT2", + "outputs": [ + { + "name": "output_alignments", + "type": "bam" + }, + { + "name": "summary_file", + "type": "txt" + } + ], + "position": { + "left": 560, + "top": 450 + }, + "post_job_actions": { + "HideDatasetActionoutput_alignments": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output_alignments" + }, + "HideDatasetActionsummary_file": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "summary_file" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/hisat2/hisat2/2.2.1+galaxy1", + "tool_shed_repository": { + "changeset_revision": "f4af63aaf57a", + "name": "hisat2", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": 
"{\"__input_ext\": \"input\", \"__workflow_invocation_uuid__\": \"b5e0048e20c111ee806d001e67d2ec02\", \"adv\": {\"input_options\": {\"input_options_selector\": \"defaults\", \"__current_case__\": 0}, \"alignment_options\": {\"alignment_options_selector\": \"defaults\", \"__current_case__\": 0}, \"scoring_options\": {\"scoring_options_selector\": \"defaults\", \"__current_case__\": 0}, \"spliced_options\": {\"spliced_options_selector\": \"defaults\", \"__current_case__\": 0}, \"reporting_options\": {\"reporting_options_selector\": \"defaults\", \"__current_case__\": 0}, \"output_options\": {\"output_options_selector\": \"defaults\", \"__current_case__\": 0}, \"sam_options\": {\"sam_options_selector\": \"defaults\", \"__current_case__\": 0}, \"other_options\": {\"other_options_selector\": \"defaults\", \"__current_case__\": 0}}, \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/?.len\", \"input_1|__identifier__\": \"SRR15462524.fastq.gz\", \"library\": {\"type\": \"single\", \"__current_case__\": 0, \"input_1\": {\"__class__\": \"ConnectedValue\"}, \"rna_strandness\": \"F\"}, \"reference_genome\": {\"source\": \"indexed\", \"__current_case__\": 0, \"index\": \"hg19\"}, \"sum\": {\"new_summary\": true, \"summary_file\": true}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "2.2.1+galaxy1", + "type": "tool", + "uuid": "ba1890a3-5f99-4f42-a963-f9b749477dba", + "when": null, + "workflow_outputs": [] + }, + "6": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/featurecounts/featurecounts/2.0.3+galaxy1", + "errors": null, + "id": 6, + "input_connections": { + "alignment": { + "id": 5, + "output_name": "output_alignments" + } + }, + "inputs": [], + "label": null, + "name": "featureCounts", + "outputs": [ + { + "name": "output_short", + "type": "tabular" + }, + { + "name": "output_summary", + "type": "tabular" + }, + { + "name": "output_feature_lengths", + "type": "tabular" + } + ], + "position": { + "left": 860, + 
"top": 249 + }, + "post_job_actions": { + "HideDatasetActionoutput_feature_lengths": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output_feature_lengths" + }, + "HideDatasetActionoutput_short": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output_short" + }, + "HideDatasetActionoutput_summary": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output_summary" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/featurecounts/featurecounts/2.0.3+galaxy1", + "tool_shed_repository": { + "changeset_revision": "6f66ae7c5f7a", + "name": "featurecounts", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"alignment\": {\"__class__\": \"ConnectedValue\"}, \"anno\": {\"anno_select\": \"builtin\", \"__current_case__\": 0, \"bgenome\": \"hg19\"}, \"extended_parameters\": {\"multifeatures\": {\"multifeat\": \"-O -M\", \"__current_case__\": 3, \"fraction\": false}, \"exon_exon_junction_read_counting_enabled\": {\"count_exon_exon_junction_reads\": \"\", \"__current_case__\": 1}, \"long_reads\": false, \"by_read_group\": false, \"largest_overlap\": false, \"min_overlap\": \"1\", \"frac_overlap\": \"0\", \"frac_overlap_feature\": \"0\", \"read_extension_5p\": \"0\", \"read_extension_3p\": \"0\", \"read_reduction\": \"\", \"R\": false}, \"format\": \"tabdel_short\", \"include_feature_length_file\": true, \"pe_parameters\": {\"paired_end_status\": \"single_end\", \"__current_case__\": 0}, \"read_filtering_parameters\": {\"mapping_quality\": \"0\", \"splitonly\": \"\", \"primary\": false, \"ignore_dup\": false}, \"strand_specificity\": \"1\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "2.0.3+galaxy1", + "type": "tool", + "uuid": "e185d096-a0fa-47b2-9a54-a217235e1693", + "when": null, + "workflow_outputs": [ + { + "label": "output_feature_lengths", + "output_name": "output_feature_lengths", + "uuid": 
"5cb5bd5d-df81-4463-8002-e89551780f01" + }, + { + "label": "output_short", + "output_name": "output_short", + "uuid": "5dec13e1-0011-472c-a72d-6715fe55c23c" + } + ] + }, + "7": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/nilesh/rseqc/rseqc_read_distribution/5.0.1+galaxy2", + "errors": null, + "id": 7, + "input_connections": { + "input": { + "id": 5, + "output_name": "output_alignments" + }, + "refgene": { + "id": 1, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "Read Distribution", + "outputs": [ + { + "name": "output", + "type": "txt" + } + ], + "position": { + "left": 860, + "top": 504 + }, + "post_job_actions": { + "HideDatasetActionoutput": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "output" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/nilesh/rseqc/rseqc_read_distribution/5.0.1+galaxy2", + "tool_shed_repository": { + "changeset_revision": "473382134e56", + "name": "rseqc", + "owner": "nilesh", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"input\", \"__workflow_invocation_uuid__\": \"b5e0048e20c111ee806d001e67d2ec02\", \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/hg19.len\", \"input\": {\"__class__\": \"ConnectedValue\"}, \"input|__identifier__\": \"SRR15462524.fastq.gz\", \"refgene\": {\"__class__\": \"ConnectedValue\"}, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "5.0.1+galaxy2", + "type": "tool", + "uuid": "dc003494-4baf-4b17-90d1-3e835cfcdba9", + "when": null, + "workflow_outputs": [] + }, + "8": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/nilesh/rseqc/rseqc_geneBody_coverage/5.0.1+galaxy2", + "errors": null, + "id": 8, + "input_connections": { + "batch_mode|input": { + "id": 5, + "output_name": "output_alignments" + }, + "refgene": { + "id": 1, + "output_name": "output" + } + }, + "inputs": [], + "label": null, + "name": "Gene Body Coverage (BAM)", + 
"outputs": [ + { + "name": "outputcurvespdf", + "type": "pdf" + }, + { + "name": "outputtxt", + "type": "txt" + } + ], + "position": { + "left": 860, + "top": 688 + }, + "post_job_actions": { + "HideDatasetActionoutputcurvespdf": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outputcurvespdf" + }, + "HideDatasetActionoutputtxt": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "outputtxt" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/nilesh/rseqc/rseqc_geneBody_coverage/5.0.1+galaxy2", + "tool_shed_repository": { + "changeset_revision": "473382134e56", + "name": "rseqc", + "owner": "nilesh", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"__input_ext\": \"input\", \"__workflow_invocation_uuid__\": \"b5e0048e20c111ee806d001e67d2ec02\", \"batch_mode\": {\"batch_mode_selector\": \"batch\", \"__current_case__\": 0, \"input\": {\"__class__\": \"ConnectedValue\"}}, \"chromInfo\": \"/opt/galaxy/tool-data/shared/ucsc/chrom/hg19.len\", \"input|__identifier__\": \"SRR15462524.fastq.gz\", \"minimum_length\": \"100\", \"refgene\": {\"__class__\": \"ConnectedValue\"}, \"rscript_output\": false, \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "5.0.1+galaxy2", + "type": "tool", + "uuid": "b38af1f6-6d3a-4a7d-ba53-0a2c18c297f0", + "when": null, + "workflow_outputs": [] + }, + "9": { + "annotation": "", + "content_id": "toolshed.g2.bx.psu.edu/repos/iuc/multiqc/multiqc/1.11+galaxy1", + "errors": null, + "id": 9, + "input_connections": { + "results_0|software_cond|output_0|input": { + "id": 2, + "output_name": "text_file" + }, + "results_0|software_cond|output_1|input": { + "id": 4, + "output_name": "text_file" + }, + "results_1|software_cond|input": { + "id": 3, + "output_name": "report" + }, + "results_2|software_cond|input": { + "id": 5, + "output_name": "summary_file" + }, + "results_3|software_cond|output_0|type|input": { + "id": 7, + "output_name": "output" + 
}, + "results_3|software_cond|output_1|type|input": { + "id": 8, + "output_name": "outputtxt" + }, + "results_4|software_cond|input": { + "id": 6, + "output_name": "output_summary" + } + }, + "inputs": [], + "label": "Multi QC raw reads", + "name": "MultiQC", + "outputs": [ + { + "name": "stats", + "type": "input" + }, + { + "name": "html_report", + "type": "html" + } + ], + "position": { + "left": 1160, + "top": 121 + }, + "post_job_actions": { + "HideDatasetActionstats": { + "action_arguments": {}, + "action_type": "HideDatasetAction", + "output_name": "stats" + } + }, + "tool_id": "toolshed.g2.bx.psu.edu/repos/iuc/multiqc/multiqc/1.11+galaxy1", + "tool_shed_repository": { + "changeset_revision": "abfd8a6544d7", + "name": "multiqc", + "owner": "iuc", + "tool_shed": "toolshed.g2.bx.psu.edu" + }, + "tool_state": "{\"comment\": \"\", \"export\": false, \"flat\": false, \"results\": [{\"__index__\": 0, \"software_cond\": {\"software\": \"fastqc\", \"__current_case__\": 8, \"output\": [{\"__index__\": 0, \"type\": \"data\", \"input\": {\"__class__\": \"ConnectedValue\"}}, {\"__index__\": 1, \"type\": \"data\", \"input\": {\"__class__\": \"ConnectedValue\"}}]}}, {\"__index__\": 1, \"software_cond\": {\"software\": \"cutadapt\", \"__current_case__\": 5, \"input\": {\"__class__\": \"ConnectedValue\"}}}, {\"__index__\": 2, \"software_cond\": {\"software\": \"hisat2\", \"__current_case__\": 13, \"input\": {\"__class__\": \"ConnectedValue\"}}}, {\"__index__\": 3, \"software_cond\": {\"software\": \"rseqc\", \"__current_case__\": 22, \"output\": [{\"__index__\": 0, \"type\": {\"type\": \"read_distribution\", \"__current_case__\": 6, \"input\": {\"__class__\": \"ConnectedValue\"}}}, {\"__index__\": 1, \"type\": {\"type\": \"gene_body_coverage\", \"__current_case__\": 1, \"input\": {\"__class__\": \"ConnectedValue\"}}}]}}, {\"__index__\": 4, \"software_cond\": {\"software\": \"featureCounts\", \"__current_case__\": 9, \"input\": {\"__class__\": \"ConnectedValue\"}}}], 
\"saveLog\": false, \"title\": \"\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": "1.11+galaxy1", + "type": "tool", + "uuid": "30a849cc-437d-4a40-861b-797e69f8a1e3", + "when": null, + "workflow_outputs": [ + { + "label": "html_report", + "output_name": "html_report", + "uuid": "9217af4e-e34c-4a49-9d67-4b3df511ac2c" + } + ] + } + }, + "tags": [ + "name:BY-COVID" + ], + "uuid": "e066322d-3c51-42bb-8693-f40b67b8851e", + "version": 4 +} \ No newline at end of file