| 3 | 1 <tool id="kb_python" name="kb_python" version="@VERSION@+galaxy2"> | 
| 0 | 2 	<description>performs gene and feature quantification on single-cell sequencing data.</description> | 
|  | 3 	<macros> | 
| 2 | 4 		<import>macros.xml</import> | 
|  | 5 	</macros> | 
|  | 6 	<requirements> | 
|  | 7 		<requirement type="package" version="@VERSION@"	>kb-python</requirement> | 
|  | 8 		<requirement type="package" version="1.0.0">jupyter</requirement> | 
|  | 9 	</requirements> | 
|  | 10 | 
| 0 | 11 	<stdio> | 
|  | 12 		<exit_code range="1:" /> | 
|  | 13 		<exit_code range=":-1" /> | 
|  | 14 		<regex match="Error:" /> | 
|  | 15 		<regex match="Exception:" /> | 
|  | 16 		<regex match="Exception :" /> | 
|  | 17 	</stdio> | 
|  | 18 	<command detect_errors="exit_code"><![CDATA[ | 
|  | 19 		mkdir ./index | 
|  | 20 		&& mkdir ./kb_outs | 
|  | 21 		#if $refTranscriptSource.TranscriptSource == "history": | 
|  | 22 			&& ln -s '${refTranscriptSource.h_index.index_file}' './index/kb_ref.idx' | 
|  | 23 			&& ln -s '${refTranscriptSource.h_index.t2g_file}' './index/t2g.txt' | 
|  | 24 			#if $workflow == "lamanno" or $workflow == "nucleus": | 
|  | 25 				&& ln -s '${refTranscriptSource.h_index.history_lamanno.cdna_t2c}' './index/cdna_t2c.txt' | 
|  | 26 				&& ln -s '${refTranscriptSource.h_index.history_lamanno.intron_t2c}' './index/intron_t2c.txt' | 
|  | 27 			#end if | 
|  | 28 			#set $index_path = './index' | 
|  | 29 		#else if $refTranscriptSource.TranscriptSource == "built": | 
|  | 30 			&& kb ref -i ./index/kb_ref.idx | 
|  | 31 				-g ./index/t2g.txt | 
|  | 32 				-f1 ./index/cdna.fa | 
|  | 33 				--workflow $workflow | 
|  | 34 				#if $workflow == "lamanno" or $workflow == "nucleus": | 
|  | 35 					-f2 ./index/intron.fa | 
|  | 36 					-c1 ./index/cdna_t2c.txt | 
|  | 37 					-c2 ./index/intron_t2c.txt | 
|  | 38 					--workflow $workflow | 
|  | 39 				#end if | 
| 3 | 40 				#if $workflow != "kite" and $workflow != "kite:10xFB": | 
| 0 | 41 					'${refTranscriptSource.s_index.genomic_fasta}' | 
|  | 42 					'${refTranscriptSource.s_index.genomic_gtf}' | 
|  | 43 				#else: | 
|  | 44 					'${refTranscriptSource.s_index.kite_table}' | 
|  | 45 				#end if | 
|  | 46 				#set $index_path = './index' | 
|  | 47         #end if | 
|  | 48 		&& kb count | 
|  | 49 		-t \${GALAXY_SLOTS:-1} | 
|  | 50 		-i $index_path/kb_ref.idx | 
|  | 51 		-g $index_path/t2g.txt | 
|  | 52 		#if $workflow == "lamanno" or  $workflow == "nucleus": | 
|  | 53 			-c1 $index_path/cdna_t2c.txt | 
|  | 54 			-c2 $index_path/intron_t2c.txt | 
|  | 55 		#end if | 
|  | 56 		-x $technology | 
|  | 57         #if $whitelist: | 
|  | 58             --whitelist '${optional.whitelist}' | 
|  | 59         #end if | 
| 1 | 60 		${optional.multimap} | 
|  | 61 		${optional.report} | 
| 0 | 62 		--workflow $workflow | 
|  | 63 		#if $extra_dtype != "none": | 
|  | 64 			$extra_dtype | 
|  | 65 		#end if | 
|  | 66 		-o ./kb_outs | 
|  | 67 		--cellranger | 
|  | 68 		$FASTQ1 | 
|  | 69 		$FASTQ2 | 
|  | 70 		]]> | 
|  | 71 	</command> | 
|  | 72 	<inputs> | 
|  | 73 		<param name="workflow" label="Select the workflow you want to use:" type="select" multiple="false" format="text" help="Type of workflow. Use `lamanno` for RNA velocity based on La Manno et al. 2018 logic. | 
|  | 74 		Use `nucleus` for RNA velocity on single-nucleus RNA-seq reads. Use `kite` for feature barcoding. Use `kite:10xFB` for 10x Genomics Feature Barcoding technology."> | 
|  | 75 			<option value="standard">standard</option> | 
|  | 76 			<option value="lamanno">lamanno</option> | 
|  | 77 			<option value="nucleus">nucleus</option> | 
|  | 78 			<option value="kite">kite</option> | 
| 3 | 79 			<option value="kite:10xFB">kite:10xFB (CITe-seq with Feature barcoding)</option> | 
| 0 | 80 		</param> | 
|  | 81 		<expand macro="index"/> | 
|  | 82 		<param name="technology" label="Select the scRNA-seq technology:" type="select" multiple="false" format="text" help="Choose the scRNA-seq technology used to generate the fastq data."> | 
|  | 83 			<option value="10XV1">10XV1</option> | 
|  | 84 			<option value="10XV2">10XV2</option> | 
|  | 85 			<option value="10XV3">10XV3</option> | 
|  | 86 			<option value="CELSEQ">CELSEQ</option> | 
|  | 87 			<option value="CELSEQ2">CELSEQ2</option> | 
|  | 88 			<option value="DROPSEQ">DROPSEQ</option> | 
|  | 89 			<option value="INDROPSV1">INDROPSV1</option> | 
|  | 90 			<option value="INDROPSV2">INDROPSV2</option> | 
|  | 91 			<option value="INDROPSV3">INDROPSV3</option> | 
|  | 92 			<option value="SCRUBSEQ">SCRUBSEQ</option> | 
|  | 93 			<option value="SURECELL">SURECELL</option> | 
|  | 94 		</param> | 
|  | 95 		<param name="FASTQ1" label="Select the R1 fastq file:" type="data" format="fastqsanger.gz" multiple="false"/> | 
|  | 96 		<param name="FASTQ2" label="Select the R2 fastq file:" type="data" format="fastqsanger.gz" multiple="false"/> | 
|  | 97 		<param name="extra_dtype" type="select" label="Do you want any additional output data type beside CellRanger?"> | 
|  | 98 			<option value="none" selected = "true">No</option> | 
|  | 99 			<option value="--loom">Loom</option> | 
|  | 100 			<option value="--h5ad">H5ad</option> | 
|  | 101 		</param> | 
|  | 102 		<section name="optional" title="Optional commands" expanded="false"> | 
|  | 103 			<param name="whitelist" type="data" format="tsv,tabular" optional="true" label="Whitelist file" help="Whitelisted barcodes to correct to. If not provided and bustools supports the technology, a pre-packaged whitelist is used. If not, the bustools | 
|  | 104 			whitelist command is used."/> | 
| 1 | 105 			<param name="multimap" type="boolean" optional="true" truevalue="--mm" falsevalue="" label="Include multi pseudoaligned reads?" help="Do you want to include reads that pseudoalign to multiple genes?"/> | 
|  | 106 			<param name="report" type="boolean" optional="true"  truevalue="--report" falsevalue=""  label="Create an html report?"  help="If true, will create an html report with mapping statistics and cell" checked="false"/> | 
| 0 | 107 		</section> | 
|  | 108 	</inputs> | 
|  | 109     <outputs> | 
|  | 110 		<data name="barcodes" label="cellranger barcodes" format="txt" from_work_dir="kb_outs/counts_unfiltered/cellranger/barcodes.tsv"/> | 
|  | 111 		<data name="genes" label="cellranger genes" format="txt" from_work_dir="kb_outs/counts_unfiltered/cellranger/genes.tsv"/> | 
|  | 112 		<data name="matrix" label="cellranger matrix" format="mtx" from_work_dir="kb_outs/counts_unfiltered/cellranger/matrix.mtx" /> | 
|  | 113 		<data name="inspect" label="inspect_report" format="json" from_work_dir="kb_outs/inspect.json"/> | 
|  | 114 		<data name="runinfo" label="run info" format="json" from_work_dir="kb_outs/run_info.json"/> | 
|  | 115 		<data name="kbinfo" label="kb info" format="json" from_work_dir="kb_outs/kb_info.json"/> | 
| 1 | 116 		<data name="kb_ref" label="kb_ref.idx" format="kallisto.idx" from_work_dir="index/kb_ref.idx"> | 
|  | 117 			<filter>refTranscriptSource['TranscriptSource'] == "built"</filter> | 
|  | 118 		</data> | 
|  | 119 		<data name="t2g" label="t2g.txt" format="txt" from_work_dir="index/t2g.txt"> | 
|  | 120 			<filter>refTranscriptSource['TranscriptSource'] == "built"</filter> | 
|  | 121 		</data> | 
| 0 | 122 		<data name="cdna_t2c" label="-c1 cdna_t2c.txt" format="txt" from_work_dir="index/cdna_t2c.txt"> | 
| 1 | 123 			<filter>refTranscriptSource['TranscriptSource'] == "built"</filter> | 
| 0 | 124 			<filter>workflow == "lamanno"</filter> | 
|  | 125 		</data> | 
|  | 126 		<data name="intron_t2c" label="-c2 intron_t2c.txt" format="txt" from_work_dir="index/intron_t2c.txt"> | 
| 1 | 127 			<filter>refTranscriptSource['TranscriptSource'] == "built"</filter> | 
| 0 | 128 			<filter>workflow == "lamanno"</filter> | 
|  | 129 		</data> | 
|  | 130 		<data name="adata" label="adata.h5ad" format="h5ad" from_work_dir="kb_outs/counts_unfiltered/adata.h5ad"> | 
|  | 131 			<filter	>extra_dtype == "--h5ad"</filter> | 
|  | 132 		</data> | 
|  | 133 		<data name="adata" label="adata.loom" format="loom" from_work_dir="kb_outs/counts_unfiltered/adata.loom"> | 
|  | 134 			<filter>extra_dtype == "--loom"</filter> | 
|  | 135 		</data> | 
| 1 | 136 		<data name="report" label="report.html" format="html" from_work_dir="kb_outs/report.html"> | 
|  | 137 			<filter>optional["report"]</filter> | 
|  | 138 		</data> | 
| 0 | 139 	</outputs> | 
|  | 140 	<tests> | 
|  | 141 		<expand macro="tests"/> | 
|  | 142 	</tests> | 
|  | 143 	<help><![CDATA[ | 
|  | 144 		This is a galaxy wrapper for kallisto-bustools (kb) for quantification of different types of single-cell sequencing data. The main kallisto-bustools homepage can be found under: | 
|  | 145 		'kallisto-bustools<https://www.kallistobus.tools/>'. | 
|  | 146 | 
|  | 147 		The kb count command runs the kallisto and bustools programs. It can be used for pre-processing of data from a variety of single-cell RNA-seq technologies, | 
|  | 148 		and for a number of different workflows (e.g. production of gene count matrices, RNA velocity analyses, etc.). | 
|  | 149 | 
|  | 150 		The kb package is developed and maintained by the Pachterlab under the MIT License. | 
|  | 151 	  ]]></help> | 
|  | 152 	<citations> | 
|  | 153         <citation type="doi">https://doi.org/10.1101/673285</citation> | 
|  | 154     </citations> | 
|  | 155 </tool> |