comparison rg_rnaStarSolo.xml @ 14:1cd2511a396e draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/rgrnastar commit 904cd12820a09a8e7ce7d01c64fa22f1ed93ed17
author iuc
date Wed, 22 Feb 2023 18:01:29 +0000
parents 9ee34ba73ebf
children b8f5f6e87f5c
comparison
equal deleted inserted replaced
13:9ee34ba73ebf 14:1cd2511a396e
120 #end if 120 #end if
121 ## Splice junctions are always under "raw" directory 121 ## Splice junctions are always under "raw" directory
122 122
123 --soloOutFormatFeaturesGeneField3 '${solo.soloOutFormatFeaturesGeneField3}' 123 --soloOutFormatFeaturesGeneField3 '${solo.soloOutFormatFeaturesGeneField3}'
124 124
125 ## Unmapped
126 '$solo.outSAMunmapped'
127 ## Read MAPQ
128 --outSAMmapqUnique ${solo.outSAMmapqUnique}
125 ## Limits 129 ## Limits
126 @LIMITS@ 130 @LIMITS@
127 131
128 ##outWig: 132 ##outWig:
129 @OUTWIG@ 133 @OUTWIG@
187 <when value="indexed"> 191 <when value="indexed">
188 <conditional name="GTFconditional"> 192 <conditional name="GTFconditional">
189 <param name="GTFselect" type="select" 193 <param name="GTFselect" type="select"
190 label="Reference genome with annotation" 194 label="Reference genome with annotation"
191 help="Select the '... with builtin gene-model' option to select from the list of available indexes that were built with splice junction information. Select the '... without builtin gene-model' option to select from the list of available indexes without annotated splice junctions, and provide your own splice junction annonations."> 195 help="Select the '... with builtin gene-model' option to select from the list of available indexes that were built with splice junction information. Select the '... without builtin gene-model' option to select from the list of available indexes without annotated splice junctions, and provide your own splice junction annonations.">
192 <option value="without-gtf" selected='true'>use genome reference without builtin gene-model</option> 196 <option value="without-gtf-with-gtf" selected='true'>use genome reference without builtin gene-model</option>
193 <option value="with-gtf">use genome reference with builtin gene-model</option> 197 <option value="with-gtf">use genome reference with builtin gene-model</option>
194 </param> 198 </param>
195 <when value="with-gtf"> 199 <when value="with-gtf">
196 <expand macro="index_selection" with_gene_model="1" /> 200 <expand macro="index_selection" with_gene_model="1" />
197 </when> 201 </when>
198 <when value="without-gtf"> 202 <when value="without-gtf-with-gtf">
199 <expand macro="index_selection" with_gene_model="0" /> 203 <expand macro="index_selection" with_gene_model="0" />
200 <expand macro="SJDBOPTIONS"/> 204 <expand macro="SJDBOPTIONS"/>
201 </when> 205 </when>
202 </conditional> 206 </conditional>
203 </when> 207 </when>
323 <param name="cell_ids" format="txt,tsv" type="data" label="File containing cell IDs of the samples. One ID per line in order of samples in the above collection."/> 327 <param name="cell_ids" format="txt,tsv" type="data" label="File containing cell IDs of the samples. One ID per line in order of samples in the above collection."/>
324 <conditional name="umidedup"> 328 <conditional name="umidedup">
325 <param argument="--soloUMIdedup" type="select" label="UMI deduplication (collapsing) algorithm" help="All has all UMIs with 1 mismatch distance to each other collapsed, Directional follows the 'directional' method given in UMI-tools, Exact collapses only exactly matching UMIs."> 329 <param argument="--soloUMIdedup" type="select" label="UMI deduplication (collapsing) algorithm" help="All has all UMIs with 1 mismatch distance to each other collapsed, Directional follows the 'directional' method given in UMI-tools, Exact collapses only exactly matching UMIs.">
326 <expand macro="umidedup_options" /> 330 <expand macro="umidedup_options" />
327 <option value="Exact" >Exact</option> 331 <option value="Exact" >Exact</option>
328 <option value="NoDedup" >CellRanger2-4 algorithm</option> 332 <option value="NoDedup" >Do not deduplicate UMIs</option>
329 </param> 333 </param>
330 <when value="1MM_All"/> 334 <when value="1MM_All"/>
331 <when value="1MM_Directional_UMItools"/> 335 <when value="1MM_Directional_UMItools"/>
332 <when value="1MM_Directional"/> 336 <when value="1MM_Directional"/>
333 <when value="Exact"/> 337 <when value="Exact"/>
386 <param argument="--outSAMattributes" type="select" display="checkboxes" multiple="true" optional="true" 390 <param argument="--outSAMattributes" type="select" display="checkboxes" multiple="true" optional="true"
387 label="Read alignment tags to include in the BAM output"> 391 label="Read alignment tags to include in the BAM output">
388 <expand macro="common_SAM_attributes"/> 392 <expand macro="common_SAM_attributes"/>
389 <option value="CR">CR Cellular barcode sequence bases (uncorrected)</option> 393 <option value="CR">CR Cellular barcode sequence bases (uncorrected)</option>
390 <option value="CY">CY Phred quality of the cellular barcode sequence in the CR tag</option> 394 <option value="CY">CY Phred quality of the cellular barcode sequence in the CR tag</option>
395 <option value="UR">UR UMI (uncorrected)</option>
396 <option value="UY">UY Phred quality of the UMI</option>
391 <option value="GX">GX Gene ID</option> 397 <option value="GX">GX Gene ID</option>
392 <option value="GN">GN Gene name</option> 398 <option value="GN">GN Gene name</option>
393 <option value="CB">CB Cell identifier (corrected)</option> 399 <option value="CB">CB Cell identifier (corrected)</option>
394 <option value="UB">UB UMI (corrected)</option> 400 <option value="UB">UB UMI (corrected)</option>
401 <option value="sM">sM assessment of CB and UMI</option>
402 <option value="sS">sS sequence of the entire barcode (CB,UMI,adapter...)</option>
403 <option value="sQ">quality of the entire barcode</option>
395 </param> 404 </param>
396 <param name="quantModeGene" type="boolean" truevalue="GeneCounts" falsevalue="" checked="false" label="Output global gene count" help="Can be used by MultiQC" /> 405 <param name="quantModeGene" type="boolean" truevalue="GeneCounts" falsevalue="" checked="false" label="Output global gene count" help="Can be used by MultiQC" />
406 <param argument="--outSAMunmapped" type="boolean" truevalue="--outSAMunmapped Within" falsevalue="--outSAMunmapped None" checked="false" label="Output unmapped reads in the BAM" />
407 <expand macro="outSAMmapqUnique"/>
397 <expand macro="limits" /> 408 <expand macro="limits" />
398 </section> 409 </section>
399 <expand macro="outWig"/> 410 <expand macro="outWig"/>
400 </inputs> 411 </inputs>
401 <outputs> 412 <outputs>
455 <expand macro="dbKeyActions" /> 466 <expand macro="dbKeyActions" />
456 </data> 467 </data>
457 <data format="txt" name="output_stats" label="${tool.name} on ${on_string}: Barcode/Feature Statistic Summaries"/> 468 <data format="txt" name="output_stats" label="${tool.name} on ${on_string}: Barcode/Feature Statistic Summaries"/>
458 <data name="reads_per_gene" format="tabular" label="${tool.name} on ${on_string}: combined reads per gene" from_work_dir="ReadsPerGene.out.tab"> 469 <data name="reads_per_gene" format="tabular" label="${tool.name} on ${on_string}: combined reads per gene" from_work_dir="ReadsPerGene.out.tab">
459 <filter>solo['quantModeGene']</filter> 470 <filter>solo['quantModeGene']</filter>
460 <expand macro="dbKeyActions" />
461 <expand macro="outCountActions" /> 471 <expand macro="outCountActions" />
462 </data> 472 </data>
463 <expand macro="outWigOutputs"/> 473 <expand macro="outWigOutputs"/>
464 </outputs> 474 </outputs>
465 <!-- Generating test data that is big enough for STARsolo to detect and small enough 475 <!-- Generating test data that is big enough for STARsolo to detect and small enough
535 <output name="reads_per_gene" > 545 <output name="reads_per_gene" >
536 <assert_contents> 546 <assert_contents>
537 <has_line_matching expression="ENSG00000279493\s+0\s+0\s+0" /> 547 <has_line_matching expression="ENSG00000279493\s+0\s+0\s+0" />
538 <has_line_matching expression="ENSG00000275464\s+38\s+1\s+40" /> 548 <has_line_matching expression="ENSG00000275464\s+38\s+1\s+40" />
539 </assert_contents> 549 </assert_contents>
550 <metadata name="column_names" value="GeneID,Counts_unstrand,Counts_firstStrand,Counts_secondStrand" />
540 </output> 551 </output>
541 </test> 552 </test>
542 <test expect_num_outputs="6"> 553 <test expect_num_outputs="6">
543 <!-- test 2 --> 554 <!-- test 2 -->
544 <!-- same as above, but using custom and no reads_per_gene--> 555 <!-- same as above, but using custom, no reads_per_gene and include unmapped reads-->
545 <conditional name="refGenomeSource"> 556 <conditional name="refGenomeSource">
546 <param name="geneSource" value="history" /> 557 <param name="geneSource" value="history" />
547 <param name="genomeFastaFiles" value="filtered3.Homo_sapiens.GRCh38.dna.chromosome.21.fa.gz" /> 558 <param name="genomeFastaFiles" value="filtered3.Homo_sapiens.GRCh38.dna.chromosome.21.fa.gz" />
548 <param name="genomeSAindexNbases" value="4" /> 559 <param name="genomeSAindexNbases" value="4" />
549 <param name="sjdbOverhang" value="100" /> 560 <param name="sjdbOverhang" value="100" />
566 </conditional> 577 </conditional>
567 </conditional> 578 </conditional>
568 <section name="solo" > 579 <section name="solo" >
569 <param name="soloStrand" value="Forward" /> 580 <param name="soloStrand" value="Forward" />
570 <param name="soloFeatures" value="Gene" /> 581 <param name="soloFeatures" value="Gene" />
582 <param name="outSAMunmapped" value="true" />
571 </section> 583 </section>
572 <output name="output_barcodes_filtered" > 584 <output name="output_barcodes_filtered" >
573 <assert_contents> 585 <assert_contents>
574 <!-- first and last line --> 586 <!-- first and last line -->
575 <has_line line="ACACCGGTCTAACGGT" /> 587 <has_line line="ACACCGGTCTAACGGT" />
595 <assert_contents> 607 <assert_contents>
596 <has_line_matching expression="\s+noUnmapped\s+5823" /> 608 <has_line_matching expression="\s+noUnmapped\s+5823" />
597 <has_line_matching expression="\s+yesUMIs\s+8" /> 609 <has_line_matching expression="\s+yesUMIs\s+8" />
598 </assert_contents> 610 </assert_contents>
599 </output> 611 </output>
600 <output name="output_BAM" value="filtered3.bam" compare="sim_size" delta="600" /> 612 <output name="output_BAM">
613 <assert_contents>
614 <has_size value="884669" delta="80000" />
615 </assert_contents>
616 </output>
601 </test> 617 </test>
602 <test expect_num_outputs="6"> 618 <test expect_num_outputs="6">
603 <!-- test 3 --> 619 <!-- test 3 -->
604 <!-- Multiple repeats test --> 620 <!-- Multiple repeats test -->
605 <conditional name="refGenomeSource"> 621 <conditional name="refGenomeSource">
1151 <has_line_matching expression="10\s+2\s+1" /> 1167 <has_line_matching expression="10\s+2\s+1" />
1152 <has_n_lines n="107" /> 1168 <has_n_lines n="107" />
1153 </assert_contents> 1169 </assert_contents>
1154 </output> 1170 </output>
1155 </test> 1171 </test>
1172 <test expect_num_outputs="7">
1173 <!-- test 11 indexed -->
1174 <conditional name="refGenomeSource">
1175 <param name="geneSource" value="indexed" />
1176 <conditional name="GTFconditional">
1177 <param name="GTFselect" value="without-gtf-with-gtf" />
1178 <param name="genomeDir" value="000" />
1179 <param name="sjdbOverhang" value="75"/>
1180 <param name="sjdbGTFfile" value="test1.gtf" ftype="gtf"/>
1181 </conditional>
1182 </conditional>
1183 <conditional name="sc" >
1184 <param name="solo_type" value="CB_UMI_Simple" />
1185 <conditional name="input_types">
1186 <param name="use" value="repeat" />
1187 <param name="input1" value="pbmc_1k_v2_L001.R1.10k.fastq.gz" ftype="fastqsanger.gz" />
1188 <param name="input2" value="pbmc_1k_v2_L001.R2.10k.fastq.gz" ftype="fastqsanger.gz" />
1189 </conditional>
1190 <param name="soloCBwhitelist" value="filtered.barcodes.txt" />
1191 <conditional name="params">
1192 <param name="chemistry" value="Cv3" />
1193 </conditional>
1194 <conditional name="umidedup">
1195 <param name="soloUMIdedup" value="1MM_All" />
1196 </conditional>
1197 </conditional>
1198 <section name="solo" >
1199 <conditional name="filter">
1200 <param name="filter_type" value="no_filter" />
1201 </conditional>
1202 <param name="soloStrand" value="Forward" />
1203 <param name="soloFeatures" value="Gene" />
1204 <param name="quantModeGene" value="true" />
1205 </section>
1206 <output name="output_barcodes" >
1207 <assert_contents>
1208 <!-- first and last line -->
1209 <has_line line="AAACCTGAGCGCTCCA" />
1210 <has_line line="TTTGGTTAGTGGGCTA" />
1211 <has_n_lines n="394" />
1212 </assert_contents>
1213 </output>
1214 <output name="output_genes">
1215 <assert_contents>
1216 <has_line_matching expression="GENE1\s+GENE1\s+Gene\s+Expression" />
1217 <has_n_lines n="1" />
1218 </assert_contents>
1219 </output>
1220 <output name="output_matrix" >
1221 <assert_contents>
1222 <has_line_matching expression="1\s+394\s+31" />
1223 <has_line_matching expression="1\s+2\s+1" />
1224 <has_n_lines n="34" />
1225 </assert_contents>
1226 </output>
1227 <output name="output_stats" >
1228 <assert_contents>
1229 <has_line_matching expression="\s+noUnmapped\s+6335" />
1230 <has_line_matching expression="\s+yesUMIs\s+33" />
1231 </assert_contents>
1232 </output>
1233 <output name="output_BAM">
1234 <assert_contents>
1235 <has_size value="7133" delta="1000"/>
1236 </assert_contents>
1237 </output>
1238 <output name="reads_per_gene" >
1239 <assert_contents>
1240 <has_line_matching expression="GENE1\s+41\s+41\s+0" />
1241 </assert_contents>
1242 </output>
1243 </test>
1156 </tests> 1244 </tests>
1157 <help><![CDATA[ 1245 <help><![CDATA[
1158 **What it does** 1246 **What it does**
1159 1247
1160 **STARSolo** is a turnkey solution for analyzing droplet single cell RNA sequencing data (e.g. 10X Genomics Chromium System) built directly into STAR_ code. STARsolo takes raw FASTQ reads files as input, and performs the following operations: 1248 **STARSolo** is a turnkey solution for analyzing droplet single cell RNA sequencing data (e.g. 10X Genomics Chromium System) built directly into STAR_ code. STARsolo takes raw FASTQ reads files as input, and performs the following operations: