view UMI_riboseq_tool/UMI_riboseq.xml @ 12:3bd2e8301575 draft

author jackcurragh
date Mon, 25 Jul 2022 11:46:24 +0000
parents d003917eaf2c
children be4f6b1e3f75
line wrap: on
line source

<tool id="UMI_riboseq" name="UMIs to Header" version="0.1.8">
    <!-- Declares the biopython package, version 1.75, as a dependency of this tool. -->
    <requirement type="package" version="1.75">biopython</requirement>
<!-- Runs python3 with, in order: the input reads, the output path, the gzip flag,
     the 5' UMI length and the 3' UMI length. A non-zero exit code is treated as failure.
     The dataset paths are single-quoted so the shell passes each one as a single argument.
     NOTE(review): the script path ends at '$__tool_directory__/' with no file name;
     confirm the script name before release. -->
<command detect_errors="exit_code">
<![CDATA[ python3 '$__tool_directory__/' '$reads' '$output' $gzip $five_prime_UMI_length $three_prime_UMI_length]]>
    <!-- Input reads dataset; accepts fastqsanger and fastqsanger.gz. -->
    <param format="fastqsanger,fastqsanger.gz" name="reads" type="data" label="fastqsanger,fastqsanger.gz"/>
    <!-- Boolean flag passed to the script as the literal "true" or "false"; enabled by default. -->
    <param name="gzip" type="boolean" truevalue="true" falsevalue="false" checked="true" label="Gzip the outputted FASTQ" />
    <!-- UMI lengths at each end of the read. Attribute values must be quoted for the file to be well-formed XML. -->
    <param name="five_prime_UMI_length" type="integer" value="2" label="Number of UMI bases at the 5' end" help="2 for McGlincy Ingolia Protocol" />
    <param name="three_prime_UMI_length" type="integer" value="5" label="Number of UMI bases at the 3' end" help="5 for McGlincy Ingolia Protocol" />

    <!-- Output FASTQ dataset. It is declared as fastqsanger by default and switched to
         fastqsanger.gz when the "gzip" option is enabled, so that the recorded datatype
         matches the compressed file (assumes the script gzips its output when the flag
         is "true", as the option label states; confirm against the script). -->
    <data format="fastqsanger" name="output">
        <change_format>
            <when input="gzip" value="true" format="fastqsanger.gz"/>
        </change_format>
    </data>
        <!-- First input/expected-output pair: reads from sub_10k_reads.fq.gz, result compared with the file "output".
             NOTE(review): the enclosing test wrapper elements are not visible here; confirm they exist in the real file. -->
        <param name="reads" value="sub_10k_reads.fq.gz"/>
        <output name="output" file="output"/>
        <!-- Second input/expected-output pair: reads from sub_10k_reads2.fq, result compared with the file "output2". -->
        <param name="reads" value="sub_10k_reads2.fq"/>
        <output name="output" file="output2"/>
<![CDATA[ The inputs are fastq/fastq.gz files with reads containing UMIs (already demultiplexed and with adapters removed).
          The output of the script is a fastq/fastq.gz file in which the UMIs (7 nt in total: 5' NN and 3' NNNNN preceding a barcode consisting of 5 nt) are in the header of each read. It is designed for the protocol: McGlincy NJ, Ingolia NT. Transcriptome-wide measurement of translation by ribosome profiling. Methods. 2017;126:112-129. doi:10.1016/j.ymeth.2017.05.028 ]]>
<citation type="bibtex"> @misc{FedorovaAD2022, author = {Fedorova Alla}, year = {2022}, title = {UMI_for_riboseq}, publisher = {GitHub}, journal = {GitHub repository}, url = {}, }