-
Notifications
You must be signed in to change notification settings - Fork 0
/
goenrichment.xml
executable file
·151 lines (132 loc) · 7.5 KB
/
goenrichment.xml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
<tool id="goenrichment" name="GOEnrichment" version="2.0.1">
<description>performs GO enrichment analysis of a set of gene products</description>
<!-- Software dependency resolved for this tool; the package version is the same as the tool's own version attribute (2.0.1). -->
<requirements>
<requirement type="package" version="2.0.1">goenrichment</requirement>
</requirements>
<!--
  Command line template (Cheetah).
  The population option is only emitted when a population dataset was supplied.
  The summarize, singletons and relations booleans each expand to their flag
  (truevalue) or to an empty string (falsevalue), as declared in the inputs section.
-->
<command detect_errors="exit_code"><![CDATA[
goenrichment
    --go '${go}'
    --annotation '${annotation}'
    --study '${study}'
    #if str($population) != 'None'
        --population '${population}'
    #end if
    --correction ${correction}
    ${summarize}
    ${singletons}
    ${relations}
    --graph_format ${graph}
    --cut_off ${cutoff}
    --mf_result '${mf_result}'
    --bp_result '${bp_result}'
    --cc_result '${cc_result}'
    --mf_graph '${mf_graph}'
    --bp_graph '${bp_graph}'
    --cc_graph '${cc_graph}'
]]></command>
<inputs>
    <!-- Input datasets: ontology, annotations, study set and optional population set. -->
    <param name="go"
           type="data"
           format="obo,owl"
           label="Gene Ontology File"
           help="Gene Ontology file in OBO or OWL format (see http://geneontology.org/page/download-ontology)"/>
    <param name="annotation"
           type="data"
           format="tabular,txt"
           label="Gene Product Annotation File"
           help="Tabular file containing annotations from gene products to GO terms (in GAF or BLAST2GO format, or a simple two-column table)"/>
    <param name="study"
           type="data"
           format="txt"
           label="Study Set File"
           help="File containing the gene products corresponding to the study set (one per line)"/>
    <param name="population"
           type="data"
           format="txt"
           optional="true"
           label="Population Set File (Optional)"
           help="File containing the gene products corresponding to the population set (one per line). If no file is submitted, the population set will be the set of all gene products listed in the annotation file."/>

    <!-- Statistical settings. -->
    <param name="correction"
           type="select"
           label="Multiple Test Correction"
           help="The multiple test correction method to use (Benjamini-Hochberg is recommended).">
        <option value="Benjamini-Hochberg" selected="true"/>
        <option value="SDA"/>
        <option value="Bonferroni-Holm"/>
        <option value="Sidak"/>
        <option value="Bonferroni"/>
    </param>
    <param name="cutoff"
           type="select"
           label="P-Value Cut-Off"
           help="The corrected p-value (or q-value) cut-off to apply for the graph output.">
        <option value="1.0"/>
        <option value="0.1"/>
        <option value="0.05"/>
        <option value="0.01" selected="true"/>
    </param>

    <!-- Graph output format; the graph outputs switch their datatype on this value. -->
    <param name="graph"
           type="select"
           label="Output Graph Format"
           help="The format of the output graphs (png, svg, or tabular for importing into cytoscape).">
        <option value="png" selected="true"/>
        <option value="svg"/>
        <option value="tabular"/>
    </param>

    <!-- Boolean switches: each one contributes its flag to the command line when true and nothing when false. -->
    <param name="summarize"
           type="boolean"
           checked="true"
           truevalue="--summarize_output"
           falsevalue=""
           label="Summarize Output"
           help="Whether to produce a summarized list of GO terms or the full list of those that are statistically significant"/>
    <param name="singletons"
           type="boolean"
           checked="true"
           truevalue="--ignore_singletons"
           falsevalue=""
           label="Exclude Singletons"
           help="Whether to exclude GO terms that are annotated to a single gene product in the study set"/>
    <param name="relations"
           type="boolean"
           checked="false"
           truevalue="--use_all_relations"
           falsevalue=""
           label="Use All Relations"
           help="Whether to infer annotations through 'part_of' and other non-hierarchical relationships, or only through 'is_a' relations"/>
</inputs>
<outputs>
    <!--
      Tabular result files, one per GO type (MF, BP, CC).
      The output names must be mf_result / bp_result / cc_result: the command
      template references exactly these variables and the tests check the
      output named mf_result. Declaring them under any other name leaves the
      template variables undefined and the job cannot be built.
    -->
    <data name="mf_result" format="tabular" label="${study.name} MF Table"/>
    <data name="bp_result" format="tabular" label="${study.name} BP Table"/>
    <data name="cc_result" format="tabular" label="${study.name} CC Table"/>

    <!--
      Graph files, one per GO type. The datatype defaults to png and follows
      the value selected in the "graph" input parameter (svg or tabular).
    -->
    <data name="mf_graph" format="png" label="${study.name} MF Graph">
        <change_format>
            <when input="graph" value="svg" format="svg"/>
            <when input="graph" value="tabular" format="tabular"/>
        </change_format>
    </data>
    <data name="bp_graph" format="png" label="${study.name} BP Graph">
        <change_format>
            <when input="graph" value="svg" format="svg"/>
            <when input="graph" value="tabular" format="tabular"/>
        </change_format>
    </data>
    <data name="cc_graph" format="png" label="${study.name} CC Graph">
        <change_format>
            <when input="graph" value="svg" format="svg"/>
            <when input="graph" value="tabular" format="tabular"/>
        </change_format>
    </data>
</outputs>
<tests>
    <!-- Study set only: no population file is given. Summarization is switched off. -->
    <test>
        <param name="go" ftype="obo" value="go.obo"/>
        <param name="annotation" ftype="txt" value="annotations.tab"/>
        <param name="study" ftype="txt" value="study.txt"/>
        <param name="summarize" value="false"/>
        <output name="mf_result" ftype="tabular" file="MF_result.txt" lines_diff="0"/>
    </test>
    <!-- Same inputs plus an explicit population file; compared against the same expected MF table. -->
    <test>
        <param name="go" ftype="obo" value="go.obo"/>
        <param name="annotation" ftype="txt" value="annotations.tab"/>
        <param name="study" ftype="txt" value="study.txt"/>
        <param name="population" ftype="txt" value="population.txt"/>
        <param name="summarize" value="false"/>
        <output name="mf_result" ftype="tabular" file="MF_result.txt" lines_diff="0"/>
    </test>
</tests>
<help>
.. class:: infomark
GOEnrichment is a Java application that can be used to analyze gene product sets (e.g., from microarray or RNAseq experiments) for enriched GO terms.
-----
.. class:: infomark
GOEnrichment requires:
- A Gene Ontology file in either OBO or OWL format (see http://geneontology.org/page/download-ontology).
- A tabular annotation file in GAF (http://geneontology.org/page/download-annotations) format, BLAST2GO format, or a simple two-column table (e.g. from BioMart) with gene product ids in the first column and GO terms in the second one.
- A list of gene products comprising the study set (a flat text file with one gene product per line).
- Optionally, a list of gene products comprising the population set (if none is submitted, the population set will be the set of gene products listed in the annotation file).
-----
.. class:: infomark
GOEnrichment produces a tabular result file and a graph file for each GO type (MF - Molecular Function, BP - Biological Process and CC - Cellular Component):
- The result file is a tabular list of all GO terms present in the study set and their respective p-values.
- The graph file can be either a png image, an svg image, or a text file for importing into cytoscape (together with the result file).
-----
.. class:: infomark
The graph is colored by p-value: terms with a p-value above the cut-off appear in white, and the color gets darker as the p-value decreases
.. image:: https://github.com/DanFaria/GOEnrichment/raw/master/Scale.png
:width: 600
:height: 315
(see the scale at https://github.com/DanFaria/GOEnrichment/blob/master/Scale.png). In addition to the name of each GO term, the graph
shows its frequency in the study set. Dashed edges indicate that one or more intermediate terms were omitted from the graph.
-----
.. class:: warningmark
Gene products listed in either the study or population set files that are not present in the annotation file will be ignored.
</help>
<!-- Citation for the tool, given as a BibTeX entry that points at the GOEnrichment GitHub repository. -->
<citations>
<citation type="bibtex">
@misc{githubgoenrichment,
author = {Faria, Daniel},
year = {2017},
title = {GOEnrichment},
publisher = {GitHub},
journal = {GitHub repository},
url = {https://github.com/DanFaria/GOEnrichment},
}
</citation>
</citations>
</tool>