Mercurial > repos > bgruening > alevin
comparison alevin.xml @ 11:e661a3269313 draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/salmon commit 10ccc47885ce71e602d66e157bd475f1facbd042
author | bgruening |
---|---|
date | Mon, 05 Dec 2022 15:47:45 +0000 |
parents | e4c01dcece8b |
children | c9944a2600f1 |
comparison
equal
deleted
inserted
replaced
10:e4c01dcece8b | 11:e661a3269313 |
---|---|
1 <tool id="alevin" name="Alevin" version="@VERSION@+@GALAXY_VERSION@" profile="@PROFILE_VERSION@"> | 1 <tool id="alevin" name="Alevin" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE_VERSION@"> |
2 <description>Quantification and analysis of 3’ tagged-end single-cell sequencing data</description> | 2 <description>Quantification and analysis of 3-prime tagged-end single-cell sequencing data</description> |
3 <macros> | 3 <macros> |
4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
5 </macros> | 5 </macros> |
6 <expand macro="requirements"/> | 6 <expand macro="requirements"/> |
7 <command detect_errors="exit_code"><![CDATA[ | 7 <command detect_errors="exit_code"><![CDATA[ |
59 -i $index_path | 59 -i $index_path |
60 -r zcat ./unmate.fastq | 60 -r zcat ./unmate.fastq |
61 #end if | 61 #end if |
62 -o ./output | 62 -o ./output |
63 -p "\${GALAXY_SLOTS:-4}" | 63 -p "\${GALAXY_SLOTS:-4}" |
64 ${protocol} | 64 ${protocol_cond.protocol} |
65 #if $protocol_cond.protocol == '--indropV2' | |
66 --w1 '${protocol_cond.w1}' | |
67 #end if | |
65 --tgMap ./alevinmap.tsv | 68 --tgMap ./alevinmap.tsv |
66 #if $whitelist: | 69 #if $whitelist: |
67 --whitelist '${optional.whitelist}' | 70 --whitelist '${optional.whitelist}' |
68 #end if | 71 #end if |
69 #if $optional.numCellBootstraps: | 72 #if $optional.numCellBootstraps: |
83 #end if | 86 #end if |
84 #if $optional.keepCBFraction: | 87 #if $optional.keepCBFraction: |
85 --keepCBFraction '${optional.keepCBFraction}' | 88 --keepCBFraction '${optional.keepCBFraction}' |
86 #end if | 89 #end if |
87 ${optional.noDedup} | 90 ${optional.noDedup} |
88 ${optional.dumpBfh} | 91 #if 'dumpBfh' in $output_files: |
89 ${optional.dumpFeatures} | 92 --dumpBfh |
90 ${optional.dumpUmiGraph} | 93 #end if |
94 #if 'dumpFeatures' in $output_files: | |
95 --dumpFeatures | |
96 #end if | |
97 #if 'dumpUmiGraph' in $output_files: | |
98 --dumpUmiGraph | |
99 #end if | |
91 ${optional.dumpMtx} | 100 ${optional.dumpMtx} |
92 #if $optional.lowRegionMinNumBarcodes: | |
93 --lowregionMinNumBarcodes '${optional.lowRegionMinNumBarcodes}' | |
94 #end if | |
95 #if $optional.maxNumBarcodes: | 101 #if $optional.maxNumBarcodes: |
96 --maxNumBarcodes '${optional.maxNumBarcodes}' | 102 --maxNumBarcodes '${optional.maxNumBarcodes}' |
97 #end if | 103 #end if |
98 #if $optional.freqThreshold: | 104 #if $optional.freqThreshold: |
99 --freqThreshold '${optional.freqThreshold}' | 105 --freqThreshold '${optional.freqThreshold}' |
100 #end if | 106 #end if |
101 | 107 ## && gunzip output/alevin/quants_tier_mat.gz -> the output is binary file |
102 #if $optional.dumpMtx != "--dumpMtx": | 108 #if $optional.dumpMtx != "--dumpMtx": |
103 && python '$__tool_directory__/vpolo_convert.py' -m | 109 && python '$__tool_directory__/vpolo_convert.py' -m |
104 #else: | 110 #else: |
105 && gunzip output/alevin/quants_mat.mtx.gz | 111 && gunzip output/alevin/quants_mat.mtx.gz |
106 #end if | 112 #end if |
107 #if $optional.dumpUmiGraph: | 113 #if 'dumpUmiGraph' in $output_files: |
108 && python '$__tool_directory__/vpolo_convert.py' -u | 114 && python '$__tool_directory__/vpolo_convert.py' -u |
109 && sh '$__tool_directory__/umiout.sh' | 115 && sh '$__tool_directory__/umiout.sh' |
110 #end if | 116 #end if |
111 | 117 ## those gzip file include binary datasets |
112 && gunzip output/alevin/quants_tier_mat.gz | 118 ## #if $optional.numCellBootstraps: |
113 #if $optional.numCellBootstraps: | 119 ## && gunzip output/alevin/quants_mean_mat.gz |
114 && gunzip output/alevin/quants_mean_mat.gz | 120 ## && gunzip output/alevin/quants_var_mat.gz |
115 && gunzip output/alevin/quants_var_mat.gz | 121 ## #end if |
116 #end if | 122 #if 'auxiliar_info' in $output_files |
117 | 123 && tar -zcvf aux_info.tar.gz output/aux_info |
118 && gunzip output/aux_info/fld.gz | 124 #end if |
119 && gunzip output/aux_info/observed_bias.gz | |
120 && gunzip output/aux_info/observed_bias_3p.gz | |
121 ]]> | 125 ]]> |
122 </command> | 126 </command> |
123 <inputs> | 127 <inputs> |
124 <expand macro="index"/> | 128 <expand macro="index"/> |
125 <conditional name="pairstraight"> | 129 <conditional name="pairstraight"> |
126 <param name="readselect" label="Single or paired-end reads?" type="select"> | 130 <param name="readselect" label="Single or paired-end reads?" type="select"> |
127 <option value="paired">Paired-end</option> | 131 <option value="paired">Paired-end</option> |
128 <option value="unmated">Single-end</option> | 132 <option value="unmated">Single-end</option> |
129 </param> | 133 </param> |
130 <when value="paired"> | 134 <when value="paired"> |
131 <param name="file1" type="data" format="fastq,fastq.gz,fastqsanger.gz,fastq.bz2" help="CB+UMI raw sequence file(s)"/> | 135 <param name="file1" type="data" format="fastq,fastq.gz,fastqsanger.gz,fastq.bz2" label="Mate pair 1" help="CB+UMI raw sequence file(s)"/> |
132 <param name="file2" type="data" format="fastq,fastq.gz,fastqsanger.gz,fastq.bz2" help="Read-sequence file(s)"/> | 136 <param name="file2" type="data" format="fastq,fastq.gz,fastqsanger.gz,fastq.bz2" label="Mate pair 2" help="Read-sequence file(s)"/> |
133 <expand macro="stranded_pe"/> | 137 <expand macro="stranded_pe"/> |
134 </when> | 138 </when> |
135 <when value="unmated"> | 139 <when value="unmated"> |
136 <param name="unmatedreads" type="data" format="fastq,fastq.gz,fastqsanger.gz,fastq.bz2" label="Unmated reads files"/> | 140 <param name="unmatedreads" type="data" format="fastq,fastq.gz,fastqsanger.gz,fastq.bz2" label="Unmated reads files"/> |
137 <expand macro="stranded_se"/> | 141 <expand macro="stranded_se"/> |
138 </when> | 142 </when> |
139 </conditional> | 143 </conditional> |
140 <param name="protocol" type="select"> | 144 <conditional name="protocol_cond"> |
141 <option value="--dropseq">DropSeq Single Cell protocol</option> | 145 <param name="protocol" type="select" label="Type of single-cell protocol" help="In cases where single-cell protocol supports variable length cellbarcodes, alevin adds nucleotide padding to make the lengths uniform. Furthermore, the padding scheme ensures that there are no collisions added in the process."> |
142 <option value="--chromium">10x chromium v2 Single Cell protocol</option> | 146 <option value="--dropseq">DropSeq Single Cell protocol</option> |
143 <option value="--chromiumV3">10x chromium v3 Single Cell protocol</option> | 147 <option value="--chromium">10x chromium v2 Single Cell protocol</option> |
144 <option value="--gemcode">Gemcode v1 Single Cell protocol</option> | 148 <option value="--chromiumV3">10x chromium v3 Single Cell protocol</option> |
145 <option value="--celseq">CEL-Seq Single Cell protocol</option> | 149 <option value="--gemcode">Gemcode v1 Single Cell protocol</option> |
146 <option value="--celseq2">CEL-Seq2 Single Cell protocol</option> | 150 <option value="--celseq">CEL-Seq Single Cell protocol</option> |
151 <option value="--celseq2">CEL-Seq2 Single Cell protocol</option> | |
152 <option value="--sciseq3">Sci-RNA-seq3 protocol</option> | |
153 <option value="--indropV2">InDrop v2 protocol</option> | |
154 <option value="--splitSeqV1">SplitSeqV1 protocol</option> | |
155 <option value="--splitSeqV2">SplitSeqV2 protocol</option> | |
156 </param> | |
157 <when value="--dropseq"/> | |
158 <when value="--chromium"/> | |
159 <when value="--chromiumV3"/> | |
160 <when value="--gemcode"/> | |
161 <when value="--celseq"/> | |
162 <when value="--celseq2"/> | |
163 <when value="--sciseq3"/> | |
164 <when value="--indropV2"> | |
165 <param argument="--w1" type="text" value="" label="w1 adapters"> | |
166 <sanitizer invalid_char=""> | |
167 <valid initial="string.letters"/> | |
168 </sanitizer> | |
169 <validator type="regex">[ATGC]+</validator> | |
170 </param> | |
171 </when> | |
172 <when value="--splitSeqV1"/> | |
173 <when value="--splitSeqV2"/> | |
174 </conditional> | |
175 <param name="tgmap" type="data" format="tsv,tabular" label="Transcript to gene map file" help="Tsv with no header, containing two columns mapping each transcript present in the reference to the corresponding gene (the first column is a transcript and the second is the corresponding gene)."/> | |
176 <param name="output_files" type="select" multiple="true" display="checkboxes" label="Extra output files"> | |
177 <option value="salmon_log">Salmon Quant log file</option> | |
178 <option value="fragment_length">Observed fragment length distribution</option> | |
179 <option value="auxiliar_info">Auxiliar info files</option> | |
180 <option value="dumpUmiGraph">Per cell level parsimonious Umi graph (--dumpUmiGraph)</option> | |
181 <option value="dumpFeatures">Features used by the CB classification and their counts at each cell level (--dumpFeatures)</option> | |
182 <option value="dumpBfh">Full CB-EC-UMI-count data-structure (--dumpBfh)</option> | |
183 <option value="commands">Commands info file</option> | |
147 </param> | 184 </param> |
148 <param name="tgmap" type="data" format="tsv,tabular" label="Transcript to gene map file" help="Tsv with no header, containing two columns mapping each transcript present in the reference to the corresponding gene (the first column is a transcript and the second is the corresponding gene)."/> | 185 <section name="optional" title="Advanced options" expanded="false"> |
149 <param name="allout" type="boolean" label="Retrieve all output files" truevalue="Yes" falsevalue="No" checked="false" help="If not selected, all log, info.txt, and json files output by Alevin will not be retrieved"/> | 186 <param argument="--whitelist" type="data" format="tsv,tabular" optional="true" label="Whitelist file" help="Explicitly specify whitelist CP for cell detection and CB sequence correction. If not specified, putative CBs generated."/> |
150 <section name="optional" title="Optional commands" expanded="false"> | 187 <param argument="--noDedup" type="boolean" truevalue="--noDedup" falsevalue="" checked="false" label="Skip deduplication step" help="Causes pipeline to only perform CB correction, then maps the read-sequences to the transcriptome generating the interim data-structure of CB-EqClass-UMI-count. Used in parallel with --dumpBarcodeEq or --dumpBfh for the purposes of obtaining raw information or debugging."/> |
151 <param name="whitelist" type="data" format="tsv,tabular" optional="true" label="Whitelist file" help="Explicitly specify whitelist CP for cell detection and CB sequence correction. If not specified, putative CBs generated."/> | 188 <param argument="--mrna" type="data" format="tsv" optional="true" label="Mito-RNA genes file" help="Single column tsv of mitochondrial genes which are to be used as a feature for CB whitelising naive Bayes classification."/> |
152 <param name="noDedup" type="boolean" truevalue="--noDedup" falsevalue="" checked="false" help="Causes pipeline to only perform CB correction, then maps the read-sequences to the transcriptome generating the interim data-structure of CB-EqClass-UMI-count. Used in parallel with --dumpBarcodeEq or --dumpBfh for the purposes of obtaining raw information or debugging."/> | 189 <param argument="--rrna" type="data" format="tsv" optional="true" label="Ribosomal RNA file" help="Single column tsv of ribosomal genes which are to be used as a feature for CB whitelising naive Bayes classification."/> |
153 <param name="mrna" type="data" format="tsv" optional="true" help="Single column tsv of mitochondrial genes which are to be used as a feature for CB whitelising naive Bayes classification."/> | 190 <param argument="--dumpMtx" type="boolean" truevalue="--dumpMtx" falsevalue="" checked="false" label=" Dump cell v transcripts count matrix in MTX format" help="Converts the default binary format of alevin for gene-count matrix into a human readable mtx (matrix market exchange) sparse format."/> |
154 <param name="rrna" type="data" format="tsv" optional="true" help="Single column tsv of ribosomal genes which are to be used as a feature for CB whitelising naive Bayes classification."/> | 191 <param argument="--forceCells" type="integer" min="0" optional="true" label="Number of cells" help="Explicitly specify the number of cells."/> |
155 <param name="dumpBfh" type="boolean" truevalue="--dumpBfh" falsevalue="" checked="false" help="Dumps the full CB-EqClass-UMI-count data-structure for the purposed of allowing raw data analysis and debugging."/> | 192 <param argument="--expectCells" type="integer" min="0" optional="true" label="Upper bound on expected number of cells" help="define a close upper bound on expected number of cells."/> |
156 <param name="dumpFeatures" type="boolean" truevalue="--dumpFeatures" falsevalue="" checked="false" help="Dumps all features used by the CB classification and their counts at each cell level. Generally, this is used for the purposes of debugging."/> | 193 <param argument="--numCellBootstraps" type="integer" min="0" value="0" optional="true" label="Generate mean and variance for cell x gene matrix by boostrap" help="Performs certain number of bootstrap and generate the mean and variance of the count matrix"/> |
157 <param name="dumpUmiGraph" type="boolean" truevalue="--dumpUmiGraph" falsevalue="" checked="false" help="Dump the per-cell level umi graph"/> | 194 <param argument="--minScoreFraction" type="float" optional="true" label="Minimum allowed score for a mapping" help="This value controls the minimum allowed score for a mapping to be considered valid. It matters only when --validateMappings has been passed to Salmon. The maximum possible score for a fragment is ms = read_len * ma (or ms = (left_read_len + right_read_len) * ma for paired-end reads). |
158 <param name="dumpMtx" type="boolean" truevalue="--dumpMtx" falsevalue="" checked="false" help="Converts the default binary format of alevin for gene-count matrix into a human readable mtx (matrix market exchange) sparse format."/> | |
159 <param name="forceCells" type="integer" optional="true" help="Explicitly specify the number of cells."/> | |
160 <param name="expectCells" type="integer" optional="true" help="define a close upper bound on expected number of cells."/> | |
161 <param name="numCellBootstraps" type="integer" optional="true" help="Performs certain number of bootstrap and generate the mean and variance of the count matrix"/> | |
162 <param name="minScoreFraction" type="float" optional="true" help="This value controls the minimum allowed score for a mapping to be considered valid. It matters only when --validateMappings has been passed to Salmon. The maximum possible score for a fragment is ms = read_len * ma (or ms = (left_read_len + right_read_len) * ma for paired-end reads). | |
163 The argument to --minScoreFraction determines what fraction of the maximum score s a mapping must achieve to be potentially retained. For a minimum score fraction of f, only mappings with a score less than (f * s) will be kept. Mappings with lower scores will be considered as low-quality, and will be discarded."/> | 195 The argument to --minScoreFraction determines what fraction of the maximum score s a mapping must achieve to be potentially retained. For a minimum score fraction of f, only mappings with a score less than (f * s) will be kept. Mappings with lower scores will be considered as low-quality, and will be discarded."/> |
164 <param name="keepCBFraction" type="float" optional="true" help="Fraction of cellular barcodes to keep (Between 0 and 1)."/> | 196 <param argument="--keepCBFraction" type="float" min="0" max="1" optional="true" label="Fraction of cellular barcodes to keep" help="Use 1 to quantify all"/> |
165 <param name="lowRegionMinNumBarcodes" type="integer" optional="true" help="Minimum number of cell barcodes to use fo learning low confidence region (defaults to 200)"/> | 197 <param argument="--maxNumBarcodes" type="integer" min="0" value="100000" label="Maximum allowable limit to process the cell barcodes" help="Default: 100000"/> |
166 <param name="maxNumBarcodes" type="integer" optional="true" help="Maximum allowable limit to process the cell barcodes. Defaults to 100000"/> | 198 <param argument="--freqThreshold" type="integer" min="0" value="10" optional="true" label="Minimum frequency for a barcode to be considered" help="Default: 10"/> |
167 <param name="freqThreshold" type="integer" optional="true" help="Minimum frequency for a barcode to be considered. Defaults to 10"/> | |
168 </section> | 199 </section> |
169 </inputs> | 200 </inputs> |
170 <outputs> | 201 <outputs> |
171 <data name="quants_mat_tsv" label="quants_mat.tsv" format="txt" from_work_dir="quants_mat.tsv"> | 202 <data name="quants_mat_tsv" label="${tool.name} on ${on_string}: per-cell gene-count matrix (tabular)" format="txt" from_work_dir="quants_mat.tsv"> |
172 <filter>optional["dumpMtx"] is not True</filter> | 203 <filter>optional["dumpMtx"] is not True</filter> |
173 </data> | 204 </data> |
174 <data name="quants_mat_mtx" label="quants_mat.mtx" format="mtx" from_work_dir="output/alevin/quants_mat.mtx"> | 205 <data name="quants_mat_mtx" label="${tool.name} on ${on_string}: per-cell gene-count matrix (MTX)" format="mtx" from_work_dir="output/alevin/quants_mat.mtx"> |
175 <filter>optional["dumpMtx"]</filter> | 206 <filter>optional["dumpMtx"]</filter> |
176 </data> | 207 </data> |
177 <data name="raw_cb_frequency_txt" label="raw_cb_frequency.txt" format="txt" from_work_dir="output/alevin/raw_cb_frequency.txt"> | 208 <data name="quants_mat_gz" label="${tool.name} on ${on_string}: per-cell level gene-count matrix (binary)" format="gz" from_work_dir="output/alevin/quants_mat.gz"/> |
178 <filter>optional["dumpFeatures"]</filter> | 209 <data name="quants_mat_cols_txt" label="${tool.name} on ${on_string}: column headers (gene-ids)" format="txt" from_work_dir="output/alevin/quants_mat_cols.txt"/> |
179 </data> | 210 <data name="quants_mat_rows_txt" label="${tool.name} on ${on_string}: row index (CB-ids)" format="txt" from_work_dir="output/alevin/quants_mat_rows.txt"/> |
180 <data name="quants_mat_cols_txt" label="quants_mat_cols.txt" format="txt" from_work_dir="output/alevin/quants_mat_cols.txt"/> | 211 <data name="quants_tier_mat" label="${tool.name} on ${on_string}: tier categorization" format="gz" from_work_dir="output/alevin/quants_tier_mat.gz"/> |
181 <data name="quants_mat_rows_txt" label="quants_mat_rows.txt" format="txt" from_work_dir="output/alevin/quants_mat_rows.txt"/> | 212 <data name="featureDump_txt" label="${tool.name} on ${on_string}: cell-level information (featureDump)" format="txt" from_work_dir="output/alevin/featureDump.txt"/> |
182 <data name="quants_tier_mat" label="quants_tier_mat" format="mtx" from_work_dir="output/alevin/quants_tier_mat"/> | 213 <data name="raw_cb_frequency_txt" label="${tool.name} on ${on_string}: raw CB classification frequencies" format="txt" from_work_dir="output/alevin/raw_cb_frequency.txt"> |
183 <data name="alevin_log" label="alevin.log" format="txt" from_work_dir="output/alevin/alevin.log"> | 214 <filter>output_files and 'dumpFeatures' in output_files</filter> |
184 <filter>allout</filter> | 215 </data> |
185 </data> | 216 <data name="whitelist_txt" label="${tool.name} on ${on_string}: whitelist" format="txt" from_work_dir="output/alevin/whitelist.txt"/> |
186 <data name="featureDump_txt" label="featureDump.txt" format="txt" from_work_dir="output/alevin/featureDump.txt"/> | 217 |
187 <data name="whitelist_txt" label="whitelist.txt" format="txt" from_work_dir="output/alevin/whitelist.txt"/> | 218 <data name="auxiliar_files" label="${tool.name} on ${on_string}: auxiliar info files" format="tgz" from_work_dir="aux_info.tar.gz"> |
188 <data name="bfh_txt" label="bfh.txt" format="txt" from_work_dir="output/alevin/bfh.txt"> | 219 <filter>output_files and 'auxiliar_info' in output_files</filter> |
189 <filter>optional["dumpBfh"]</filter> | 220 </data> |
190 </data> | 221 <data name="salmon_quant_log" format="txt" label="${tool.name} on ${on_string}: Salmon log file" from_work_dir="output/logs/salmon_quant.log"> |
191 <data name="quants_mean_mat" label="quants_mean_mat" format="mtx" from_work_dir="output/alevin/quants_mean_mat"> | 222 <filter>output_files and 'salmon_log' in output_files</filter> |
223 </data> | |
224 <data name="cmd_info" label="${tool.name} on ${on_string}: command info (JSON)" format="json" from_work_dir="output/cmd_info.json"> | |
225 <filter>output_files and 'commands' in output_files</filter> | |
226 </data> | |
227 <data name="flenDist_txt" format="txt" label="${tool.name} on ${on_string}: observed fragment length distribution" from_work_dir="output/libParams/flenDist.txt"> | |
228 <filter>output_files and 'fragment_length' in output_files</filter> | |
229 </data> | |
230 <data name="bfh_txt" label="${tool.name} on ${on_string}: full CB-EC-UMI-count data-structure" format="txt" from_work_dir="output/alevin/bfh.txt"> | |
231 <filter>output_files and 'dumpBfh' in output_files</filter> | |
232 </data> | |
233 <data name="quants_mean_mat" label="${tool.name} on ${on_string}: count matrix mean file" format="gz" from_work_dir="output/alevin/quants_mean_mat.gz"> | |
192 <filter>optional["numCellBootstraps"]</filter> | 234 <filter>optional["numCellBootstraps"]</filter> |
193 </data> | 235 </data> |
194 <data name="quants_var_mat" label="quants_var_mat" format="mtx" from_work_dir="output/alevin/quants_var_mat"> | 236 <data name="quants_var_mat" label="${tool.name} on ${on_string}: count matrix variance file" format="gz" from_work_dir="output/alevin/quants_var_mat.gz"> |
195 <filter>optional["numCellBootstraps"]</filter> | 237 <filter>optional["numCellBootstraps"]</filter> |
196 </data> | 238 </data> |
197 <data name="quants_boot_rows_txt" label="quants_boot_rows.txt" format="txt" from_work_dir="output/alevin/quants_boot_rows.txt"> | 239 <data name="quants_boot_rows_txt" label="${tool.name} on ${on_string}: bootstraps rows" format="txt" from_work_dir="output/alevin/quants_boot_rows.txt"> |
198 <filter>optional["numCellBootstraps"]</filter> | 240 <filter>optional["numCellBootstraps"]</filter> |
199 </data> | 241 </data> |
200 <data name="alevinmeta_info_json" format="json" label="meta_info.json" from_work_dir="output/aux_info/alevin_meta_info.json"> | 242 <collection name="umigraphs" type="list" label="${tool.name} on ${on_string}: UMI graph PDFs"> |
201 <filter>allout</filter> | 243 <filter>output_files and 'dumpUmiGraph' in output_files</filter> |
202 </data> | 244 <discover_datasets pattern="(?P<name>.+)\.pdf" format="pdf" directory="fixed"/> |
203 <data name="ambig_info_tsv" format="tsv" label="ambig_info.tsv" from_work_dir="output/aux_info/ambig_info.tsv"> | |
204 <filter>allout</filter> | |
205 </data> | |
206 <data name="meta_info_json" format="json" label="meta_info.json" from_work_dir="output/aux_info/meta_info.json"> | |
207 <filter>allout</filter> | |
208 </data> | |
209 <data name="expected_bias" format="txt" label="expected_bias" from_work_dir="output/aux_info/fld"/> | |
210 <data name="observed_bias" format="txt" label="observed_bias" from_work_dir="output/aux_info/observed_bias"/> | |
211 <data name="observed_bias_3p" format="txt" label="observed_bias_3p" from_work_dir="output/aux_info/observed_bias_3p"/> | |
212 <data name="flenDist_txt" format="txt" label="flenDist.txt" from_work_dir="output/libParams/flenDist.txt"/> | |
213 <data name="salmon_quant_log" format="txt" label="salmon_quant.log" from_work_dir="output/logs/salmon_quant.log"> | |
214 <filter>allout</filter> | |
215 </data> | |
216 <collection name="umigraphs" type="list" label="Umi graph PDFs"> | |
217 <filter>optional["dumpUmiGraph"]</filter> | |
218 <discover_datasets pattern="__name_and_ext__" ext="pdf" directory="fixed"/> | |
219 </collection> | 245 </collection> |
220 <data name="cmd_info.json" label="cmd_info.json" format="json" from_work_dir="output/cmd_info.json"> | |
221 <filter>allout</filter> | |
222 </data> | |
223 </outputs> | 246 </outputs> |
224 <tests> | 247 <tests> |
248 <test expect_num_outputs="8"> | |
249 <conditional name="refTranscriptSource"> | |
250 <param name="TranscriptSource" value="history"/> | |
251 <section name="s_index"> | |
252 <param name="fasta" value="minitranscript.fa"/> | |
253 </section> | |
254 </conditional> | |
255 <conditional name="pairstraight"> | |
256 <param name="readselect" value="paired"/> | |
257 <param name="file1" value="fastqs/moreminifastq1.fastq.gz"/> | |
258 <param name="file2" value="fastqs/moreminifastq2.fastq.gz"/> | |
259 <param name="orientation" value="I"/> | |
260 <param name="strandedness" value="SR"/> | |
261 </conditional> | |
262 <conditional name="protocol_cond"> | |
263 <param name="protocol" value="--chromium"/> | |
264 </conditional> | |
265 <param name="tgmap" value="minitxp.tsv"/> | |
266 <param name="output_files" value="dumpFeatures"/> | |
267 <section name="optional"> | |
268 <param name="keepCBFraction" value="1"/> | |
269 <param name="freqThreshold" value="5"/> | |
270 <param name="dumpMtx" value="true"/> | |
271 </section> | |
272 <output name="quants_mat_mtx" file="alevin_mat_01.mtx" ftype="mtx" sort="true"/> | |
273 </test> | |
225 <test expect_num_outputs="11"> | 274 <test expect_num_outputs="11"> |
226 <conditional name="refTranscriptSource"> | 275 <conditional name="refTranscriptSource"> |
227 <param name="TranscriptSource" value="history"/> | 276 <param name="TranscriptSource" value="history"/> |
228 <section name="s_index"> | 277 <section name="s_index"> |
229 <param name="fasta" value="minitranscript.fa"/> | 278 <param name="fasta" value="minitranscript.fa"/> |
234 <param name="file1" value="fastqs/moreminifastq1.fastq.gz"/> | 283 <param name="file1" value="fastqs/moreminifastq1.fastq.gz"/> |
235 <param name="file2" value="fastqs/moreminifastq2.fastq.gz"/> | 284 <param name="file2" value="fastqs/moreminifastq2.fastq.gz"/> |
236 <param name="orientation" value="I"/> | 285 <param name="orientation" value="I"/> |
237 <param name="strandedness" value="SR"/> | 286 <param name="strandedness" value="SR"/> |
238 </conditional> | 287 </conditional> |
239 <param name="protocol" value="--chromium"/> | 288 <conditional name="protocol_cond"> |
289 <param name="protocol" value="--chromium"/> | |
290 </conditional> | |
240 <param name="tgmap" value="minitxp.tsv"/> | 291 <param name="tgmap" value="minitxp.tsv"/> |
292 <param name="output_files" value="dumpFeatures"/> | |
241 <section name="optional"> | 293 <section name="optional"> |
242 <param name="keepCBFraction" value="1"/> | 294 <param name="keepCBFraction" value="1"/> |
243 <param name="dumpFeatures" value="Yes"/> | 295 <param name="numCellBootstraps" value="2"/> |
244 <param name="freqThreshold" value="5"/> | 296 <param name="freqThreshold" value="5"/> |
245 <param name="dumpMtx" value="Yes"/> | 297 <param name="dumpMtx" value="true"/> |
246 </section> | 298 </section> |
247 <output name="quants_mat_mtx" file="alevin_mat.mtx" ftype="mtx" sort="true" lines_diff="62"/> | 299 <output name="quants_mat_mtx" file="alevin_mat_02.mtx" ftype="mtx" sort="true"/> |
300 </test> | |
301 <test expect_num_outputs="8"> | |
302 <conditional name="refTranscriptSource"> | |
303 <param name="TranscriptSource" value="history"/> | |
304 <section name="s_index"> | |
305 <param name="fasta" value="minitranscript.fa"/> | |
306 </section> | |
307 </conditional> | |
308 <conditional name="pairstraight"> | |
309 <param name="readselect" value="paired"/> | |
310 <param name="file1" value="fastqs/moreminifastq1.fastq.gz"/> | |
311 <param name="file2" value="fastqs/moreminifastq2.fastq.gz"/> | |
312 <param name="orientation" value="I"/> | |
313 <param name="strandedness" value="SR"/> | |
314 </conditional> | |
315 <conditional name="protocol_cond"> | |
316 <param name="protocol" value="-\-indropV2"/> | |
317 <param name="w1" value="ATCAT"/> | |
318 </conditional> | |
319 <param name="tgmap" value="minitxp.tsv"/> | |
320 <param name="output_files" value="dumpFeatures"/> | |
321 <section name="optional"> | |
322 <param name="keepCBFraction" value="1"/> | |
323 <param name="freqThreshold" value="5"/> | |
324 <param name="dumpMtx" value="true"/> | |
325 </section> | |
326 <output name="quants_mat_mtx" file="alevin_mat_indropV2.mtx" ftype="mtx" sort="true"/> | |
248 </test> | 327 </test> |
249 <test expect_num_outputs="14"> | 328 <test expect_num_outputs="14"> |
250 <conditional name="refTranscriptSource"> | 329 <conditional name="refTranscriptSource"> |
251 <param name="TranscriptSource" value="history"/> | 330 <param name="TranscriptSource" value="history"/> |
252 <section name="s_index"> | 331 <section name="s_index"> |
258 <param name="file1" value="fastqs/moreminifastq1.fastq.gz"/> | 337 <param name="file1" value="fastqs/moreminifastq1.fastq.gz"/> |
259 <param name="file2" value="fastqs/moreminifastq2.fastq.gz"/> | 338 <param name="file2" value="fastqs/moreminifastq2.fastq.gz"/> |
260 <param name="orientation" value="I"/> | 339 <param name="orientation" value="I"/> |
261 <param name="strandedness" value="SR"/> | 340 <param name="strandedness" value="SR"/> |
262 </conditional> | 341 </conditional> |
263 <param name="protocol" value="--chromium"/> | 342 <conditional name="protocol_cond"> |
343 <param name="protocol" value="--chromium"/> | |
344 </conditional> | |
264 <param name="tgmap" value="minitxp.tsv"/> | 345 <param name="tgmap" value="minitxp.tsv"/> |
346 <param name="output_files" value="dumpFeatures,salmon_log,fragment_length,auxiliar_info,dumpUmiGraph,dumpBfh,commands"/> | |
265 <section name="optional"> | 347 <section name="optional"> |
266 <param name="keepCBFraction" value="1"/> | 348 <param name="dumpMtx" value="true"/> |
267 <param name="dumpFeatures" value="Yes"/> | |
268 <param name="numCellBootstraps" value="2"/> | |
269 <param name="freqThreshold" value="5"/> | |
270 <param name="dumpMtx" value="Yes"/> | |
271 </section> | 349 </section> |
272 <output name="quants_mat_mtx" file="alevin_mat.mtx" ftype="mtx" sort="true" lines_diff="62"/> | 350 <output name="quants_mat_mtx" file="alevin_mat.mtx" ftype="mtx" sort="true"/> |
351 <output name="salmon_quant_log" ftype="txt"> | |
352 <assert_contents> | |
353 <has_text text="Index contained 322 targets"/> | |
354 <has_text text="Counted 14 total reads in the equivalence classes"/> | |
355 </assert_contents> | |
356 </output> | |
357 <output name="flenDist_txt" file="length_distribution.txt" ftype="txt"/> | |
358 <output name="auxiliar_files" ftype="tgz"> | |
359 <assert_contents> | |
360 <has_size value="1898" delta="100"/> | |
361 </assert_contents> | |
362 </output> | |
363 <output_collection name="umigraphs" type="list" count="14"> | |
364 <element name="AGTGGGATCTTAACCT"> | |
365 <assert_contents> | |
366 <has_size value="4017" delta="1000"/> | |
367 </assert_contents> | |
368 </element> | |
369 </output_collection> | |
370 <output name="bfh_txt" file="full_data_structure.txt" ftype="txt"/> | |
273 </test> | 371 </test> |
274 </tests> | 372 </tests> |
275 <help><![CDATA[ | 373 <help><![CDATA[ |
276 @salmonhelp@ | 374 @salmonhelp@ |
277 @alevinhelp@ | 375 @alevinhelp@ |