Mercurial > repos > iuc > rna_starsolo
comparison rg_rnaStarSolo.xml @ 14:1cd2511a396e draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/rgrnastar commit 904cd12820a09a8e7ce7d01c64fa22f1ed93ed17
author | iuc |
---|---|
date | Wed, 22 Feb 2023 18:01:29 +0000 |
parents | 9ee34ba73ebf |
children | b8f5f6e87f5c |
comparison
equal
deleted
inserted
replaced
13:9ee34ba73ebf | 14:1cd2511a396e |
---|---|
120 #end if | 120 #end if |
121 ## Splice junctions are always under "raw" directory | 121 ## Splice junctions are always under "raw" directory |
122 | 122 |
123 --soloOutFormatFeaturesGeneField3 '${solo.soloOutFormatFeaturesGeneField3}' | 123 --soloOutFormatFeaturesGeneField3 '${solo.soloOutFormatFeaturesGeneField3}' |
124 | 124 |
125 ## Unmapped | |
126 '$solo.outSAMunmapped' | |
127 ## Read MAPQ | |
128 --outSAMmapqUnique ${solo.outSAMmapqUnique} | |
125 ## Limits | 129 ## Limits |
126 @LIMITS@ | 130 @LIMITS@ |
127 | 131 |
128 ##outWig: | 132 ##outWig: |
129 @OUTWIG@ | 133 @OUTWIG@ |
187 <when value="indexed"> | 191 <when value="indexed"> |
188 <conditional name="GTFconditional"> | 192 <conditional name="GTFconditional"> |
189 <param name="GTFselect" type="select" | 193 <param name="GTFselect" type="select" |
190 label="Reference genome with annotation" | 194 label="Reference genome with annotation" |
191 help="Select the '... with builtin gene-model' option to select from the list of available indexes that were built with splice junction information. Select the '... without builtin gene-model' option to select from the list of available indexes without annotated splice junctions, and provide your own splice junction annonations."> | 195 help="Select the '... with builtin gene-model' option to select from the list of available indexes that were built with splice junction information. Select the '... without builtin gene-model' option to select from the list of available indexes without annotated splice junctions, and provide your own splice junction annonations."> |
192 <option value="without-gtf" selected='true'>use genome reference without builtin gene-model</option> | 196 <option value="without-gtf-with-gtf" selected='true'>use genome reference without builtin gene-model</option> |
193 <option value="with-gtf">use genome reference with builtin gene-model</option> | 197 <option value="with-gtf">use genome reference with builtin gene-model</option> |
194 </param> | 198 </param> |
195 <when value="with-gtf"> | 199 <when value="with-gtf"> |
196 <expand macro="index_selection" with_gene_model="1" /> | 200 <expand macro="index_selection" with_gene_model="1" /> |
197 </when> | 201 </when> |
198 <when value="without-gtf"> | 202 <when value="without-gtf-with-gtf"> |
199 <expand macro="index_selection" with_gene_model="0" /> | 203 <expand macro="index_selection" with_gene_model="0" /> |
200 <expand macro="SJDBOPTIONS"/> | 204 <expand macro="SJDBOPTIONS"/> |
201 </when> | 205 </when> |
202 </conditional> | 206 </conditional> |
203 </when> | 207 </when> |
323 <param name="cell_ids" format="txt,tsv" type="data" label="File containing cell IDs of the samples. One ID per line in order of samples in the above collection."/> | 327 <param name="cell_ids" format="txt,tsv" type="data" label="File containing cell IDs of the samples. One ID per line in order of samples in the above collection."/> |
324 <conditional name="umidedup"> | 328 <conditional name="umidedup"> |
325 <param argument="--soloUMIdedup" type="select" label="UMI deduplication (collapsing) algorithm" help="All has all UMIs with 1 mismatch distance to each other collapsed, Directional follows the 'directional' method given in UMI-tools, Exact collapses only exactly matching UMIs."> | 329 <param argument="--soloUMIdedup" type="select" label="UMI deduplication (collapsing) algorithm" help="All has all UMIs with 1 mismatch distance to each other collapsed, Directional follows the 'directional' method given in UMI-tools, Exact collapses only exactly matching UMIs."> |
326 <expand macro="umidedup_options" /> | 330 <expand macro="umidedup_options" /> |
327 <option value="Exact" >Exact</option> | 331 <option value="Exact" >Exact</option> |
328 <option value="NoDedup" >CellRanger2-4 algorithm</option> | 332 <option value="NoDedup" >Do not deduplicate UMIs</option> |
329 </param> | 333 </param> |
330 <when value="1MM_All"/> | 334 <when value="1MM_All"/> |
331 <when value="1MM_Directional_UMItools"/> | 335 <when value="1MM_Directional_UMItools"/> |
332 <when value="1MM_Directional"/> | 336 <when value="1MM_Directional"/> |
333 <when value="Exact"/> | 337 <when value="Exact"/> |
386 <param argument="--outSAMattributes" type="select" display="checkboxes" multiple="true" optional="true" | 390 <param argument="--outSAMattributes" type="select" display="checkboxes" multiple="true" optional="true" |
387 label="Read alignment tags to include in the BAM output"> | 391 label="Read alignment tags to include in the BAM output"> |
388 <expand macro="common_SAM_attributes"/> | 392 <expand macro="common_SAM_attributes"/> |
389 <option value="CR">CR Cellular barcode sequence bases (uncorrected)</option> | 393 <option value="CR">CR Cellular barcode sequence bases (uncorrected)</option> |
390 <option value="CY">CY Phred quality of the cellular barcode sequence in the CR tag</option> | 394 <option value="CY">CY Phred quality of the cellular barcode sequence in the CR tag</option> |
395 <option value="UR">UR UMI (uncorrected)</option> | |
396 <option value="UY">UY Phred quality of the UMI</option> | |
391 <option value="GX">GX Gene ID</option> | 397 <option value="GX">GX Gene ID</option> |
392 <option value="GN">GN Gene name</option> | 398 <option value="GN">GN Gene name</option> |
393 <option value="CB">CB Cell identifier (corrected)</option> | 399 <option value="CB">CB Cell identifier (corrected)</option> |
394 <option value="UB">UB UMI (corrected)</option> | 400 <option value="UB">UB UMI (corrected)</option> |
401 <option value="sM">sM assessment of CB and UMI</option> | |
402 <option value="sS">sS sequence of the entire barcode (CB,UMI,adapter...)</option> | |
403 <option value="sQ">quality of the entire barcode</option> | |
395 </param> | 404 </param> |
396 <param name="quantModeGene" type="boolean" truevalue="GeneCounts" falsevalue="" checked="false" label="Output global gene count" help="Can be used by MultiQC" /> | 405 <param name="quantModeGene" type="boolean" truevalue="GeneCounts" falsevalue="" checked="false" label="Output global gene count" help="Can be used by MultiQC" /> |
406 <param argument="--outSAMunmapped" type="boolean" truevalue="--outSAMunmapped Within" falsevalue="--outSAMunmapped None" checked="false" label="Output unmapped reads in the BAM" /> | |
407 <expand macro="outSAMmapqUnique"/> | |
397 <expand macro="limits" /> | 408 <expand macro="limits" /> |
398 </section> | 409 </section> |
399 <expand macro="outWig"/> | 410 <expand macro="outWig"/> |
400 </inputs> | 411 </inputs> |
401 <outputs> | 412 <outputs> |
455 <expand macro="dbKeyActions" /> | 466 <expand macro="dbKeyActions" /> |
456 </data> | 467 </data> |
457 <data format="txt" name="output_stats" label="${tool.name} on ${on_string}: Barcode/Feature Statistic Summaries"/> | 468 <data format="txt" name="output_stats" label="${tool.name} on ${on_string}: Barcode/Feature Statistic Summaries"/> |
458 <data name="reads_per_gene" format="tabular" label="${tool.name} on ${on_string}: combined reads per gene" from_work_dir="ReadsPerGene.out.tab"> | 469 <data name="reads_per_gene" format="tabular" label="${tool.name} on ${on_string}: combined reads per gene" from_work_dir="ReadsPerGene.out.tab"> |
459 <filter>solo['quantModeGene']</filter> | 470 <filter>solo['quantModeGene']</filter> |
460 <expand macro="dbKeyActions" /> | |
461 <expand macro="outCountActions" /> | 471 <expand macro="outCountActions" /> |
462 </data> | 472 </data> |
463 <expand macro="outWigOutputs"/> | 473 <expand macro="outWigOutputs"/> |
464 </outputs> | 474 </outputs> |
465 <!-- Generating test data that is big enough for STARsolo to detect and small enough | 475 <!-- Generating test data that is big enough for STARsolo to detect and small enough |
535 <output name="reads_per_gene" > | 545 <output name="reads_per_gene" > |
536 <assert_contents> | 546 <assert_contents> |
537 <has_line_matching expression="ENSG00000279493\s+0\s+0\s+0" /> | 547 <has_line_matching expression="ENSG00000279493\s+0\s+0\s+0" /> |
538 <has_line_matching expression="ENSG00000275464\s+38\s+1\s+40" /> | 548 <has_line_matching expression="ENSG00000275464\s+38\s+1\s+40" /> |
539 </assert_contents> | 549 </assert_contents> |
550 <metadata name="column_names" value="GeneID,Counts_unstrand,Counts_firstStrand,Counts_secondStrand" /> | |
540 </output> | 551 </output> |
541 </test> | 552 </test> |
542 <test expect_num_outputs="6"> | 553 <test expect_num_outputs="6"> |
543 <!-- test 2 --> | 554 <!-- test 2 --> |
544 <!-- same as above, but using custom and no reads_per_gene--> | 555 <!-- same as above, but using custom, no reads_per_gene and include unmapped reads--> |
545 <conditional name="refGenomeSource"> | 556 <conditional name="refGenomeSource"> |
546 <param name="geneSource" value="history" /> | 557 <param name="geneSource" value="history" /> |
547 <param name="genomeFastaFiles" value="filtered3.Homo_sapiens.GRCh38.dna.chromosome.21.fa.gz" /> | 558 <param name="genomeFastaFiles" value="filtered3.Homo_sapiens.GRCh38.dna.chromosome.21.fa.gz" /> |
548 <param name="genomeSAindexNbases" value="4" /> | 559 <param name="genomeSAindexNbases" value="4" /> |
549 <param name="sjdbOverhang" value="100" /> | 560 <param name="sjdbOverhang" value="100" /> |
566 </conditional> | 577 </conditional> |
567 </conditional> | 578 </conditional> |
568 <section name="solo" > | 579 <section name="solo" > |
569 <param name="soloStrand" value="Forward" /> | 580 <param name="soloStrand" value="Forward" /> |
570 <param name="soloFeatures" value="Gene" /> | 581 <param name="soloFeatures" value="Gene" /> |
582 <param name="outSAMunmapped" value="true" /> | |
571 </section> | 583 </section> |
572 <output name="output_barcodes_filtered" > | 584 <output name="output_barcodes_filtered" > |
573 <assert_contents> | 585 <assert_contents> |
574 <!-- first and last line --> | 586 <!-- first and last line --> |
575 <has_line line="ACACCGGTCTAACGGT" /> | 587 <has_line line="ACACCGGTCTAACGGT" /> |
595 <assert_contents> | 607 <assert_contents> |
596 <has_line_matching expression="\s+noUnmapped\s+5823" /> | 608 <has_line_matching expression="\s+noUnmapped\s+5823" /> |
597 <has_line_matching expression="\s+yesUMIs\s+8" /> | 609 <has_line_matching expression="\s+yesUMIs\s+8" /> |
598 </assert_contents> | 610 </assert_contents> |
599 </output> | 611 </output> |
600 <output name="output_BAM" value="filtered3.bam" compare="sim_size" delta="600" /> | 612 <output name="output_BAM"> |
613 <assert_contents> | |
614 <has_size value="884669" delta="80000" /> | |
615 </assert_contents> | |
616 </output> | |
601 </test> | 617 </test> |
602 <test expect_num_outputs="6"> | 618 <test expect_num_outputs="6"> |
603 <!-- test 3 --> | 619 <!-- test 3 --> |
604 <!-- Multiple repeats test --> | 620 <!-- Multiple repeats test --> |
605 <conditional name="refGenomeSource"> | 621 <conditional name="refGenomeSource"> |
1151 <has_line_matching expression="10\s+2\s+1" /> | 1167 <has_line_matching expression="10\s+2\s+1" /> |
1152 <has_n_lines n="107" /> | 1168 <has_n_lines n="107" /> |
1153 </assert_contents> | 1169 </assert_contents> |
1154 </output> | 1170 </output> |
1155 </test> | 1171 </test> |
1172 <test expect_num_outputs="7"> | |
1173 <!-- test 11 indexed --> | |
1174 <conditional name="refGenomeSource"> | |
1175 <param name="geneSource" value="indexed" /> | |
1176 <conditional name="GTFconditional"> | |
1177 <param name="GTFselect" value="without-gtf-with-gtf" /> | |
1178 <param name="genomeDir" value="000" /> | |
1179 <param name="sjdbOverhang" value="75"/> | |
1180 <param name="sjdbGTFfile" value="test1.gtf" ftype="gtf"/> | |
1181 </conditional> | |
1182 </conditional> | |
1183 <conditional name="sc" > | |
1184 <param name="solo_type" value="CB_UMI_Simple" /> | |
1185 <conditional name="input_types"> | |
1186 <param name="use" value="repeat" /> | |
1187 <param name="input1" value="pbmc_1k_v2_L001.R1.10k.fastq.gz" ftype="fastqsanger.gz" /> | |
1188 <param name="input2" value="pbmc_1k_v2_L001.R2.10k.fastq.gz" ftype="fastqsanger.gz" /> | |
1189 </conditional> | |
1190 <param name="soloCBwhitelist" value="filtered.barcodes.txt" /> | |
1191 <conditional name="params"> | |
1192 <param name="chemistry" value="Cv3" /> | |
1193 </conditional> | |
1194 <conditional name="umidedup"> | |
1195 <param name="soloUMIdedup" value="1MM_All" /> | |
1196 </conditional> | |
1197 </conditional> | |
1198 <section name="solo" > | |
1199 <conditional name="filter"> | |
1200 <param name="filter_type" value="no_filter" /> | |
1201 </conditional> | |
1202 <param name="soloStrand" value="Forward" /> | |
1203 <param name="soloFeatures" value="Gene" /> | |
1204 <param name="quantModeGene" value="true" /> | |
1205 </section> | |
1206 <output name="output_barcodes" > | |
1207 <assert_contents> | |
1208 <!-- first and last line --> | |
1209 <has_line line="AAACCTGAGCGCTCCA" /> | |
1210 <has_line line="TTTGGTTAGTGGGCTA" /> | |
1211 <has_n_lines n="394" /> | |
1212 </assert_contents> | |
1213 </output> | |
1214 <output name="output_genes"> | |
1215 <assert_contents> | |
1216 <has_line_matching expression="GENE1\s+GENE1\s+Gene\s+Expression" /> | |
1217 <has_n_lines n="1" /> | |
1218 </assert_contents> | |
1219 </output> | |
1220 <output name="output_matrix" > | |
1221 <assert_contents> | |
1222 <has_line_matching expression="1\s+394\s+31" /> | |
1223 <has_line_matching expression="1\s+2\s+1" /> | |
1224 <has_n_lines n="34" /> | |
1225 </assert_contents> | |
1226 </output> | |
1227 <output name="output_stats" > | |
1228 <assert_contents> | |
1229 <has_line_matching expression="\s+noUnmapped\s+6335" /> | |
1230 <has_line_matching expression="\s+yesUMIs\s+33" /> | |
1231 </assert_contents> | |
1232 </output> | |
1233 <output name="output_BAM"> | |
1234 <assert_contents> | |
1235 <has_size value="7133" delta="1000"/> | |
1236 </assert_contents> | |
1237 </output> | |
1238 <output name="reads_per_gene" > | |
1239 <assert_contents> | |
1240 <has_line_matching expression="GENE1\s+41\s+41\s+0" /> | |
1241 </assert_contents> | |
1242 </output> | |
1243 </test> | |
1156 </tests> | 1244 </tests> |
1157 <help><![CDATA[ | 1245 <help><![CDATA[ |
1158 **What it does** | 1246 **What it does** |
1159 | 1247 |
1160 **STARSolo** is a turnkey solution for analyzing droplet single cell RNA sequencing data (e.g. 10X Genomics Chromium System) built directly into STAR_ code. STARsolo takes raw FASTQ reads files as input, and performs the following operations: | 1248 **STARSolo** is a turnkey solution for analyzing droplet single cell RNA sequencing data (e.g. 10X Genomics Chromium System) built directly into STAR_ code. STARsolo takes raw FASTQ reads files as input, and performs the following operations: |