Mercurial > repos > portiahollyoak > temp
comparison temp.xml @ 12:ca36262102d8 draft
planemo upload for repository https://github.com/portiahollyoak/Tools commit 5d021f520b653582862ec98dd812a051b804aa50
author | portiahollyoak |
---|---|
date | Fri, 29 Apr 2016 05:47:54 -0400 |
parents | e19d9742c99b |
children | 72156de89c7a |
comparison
equal
deleted
inserted
replaced
11:e19d9742c99b | 12:ca36262102d8 |
---|---|
1 <tool id ="run_TEMP" name="Run TEMP" version=" 0.1.2"> | 1 <tool id ="run_TEMP" name="Run TEMP" version=" 0.1.4"> |
2 <description></description> | 2 <description></description> |
3 <requirements> | 3 <requirements> |
4 <!-- The following are classical toolshed packages and should be removed | 4 <!-- The following are classical toolshed packages and should be removed |
5 once conda is deemed stable--> | 5 once conda is deemed stable--> |
6 <requirement type="package" version="1.6.922">bioperl</requirement> | 6 <requirement type="package" version="1.6.922">bioperl</requirement> |
15 </requirements> | 15 </requirements> |
16 <stdio> | 16 <stdio> |
17 <exit_code range="1:" /> | 17 <exit_code range="1:" /> |
18 </stdio> | 18 </stdio> |
19 <command><![CDATA[ | 19 <command><![CDATA[ |
20 | |
21 ln -f -s "$alignment.metadata.bam_index" alignment.sorted.bam.bai && | 20 ln -f -s "$alignment.metadata.bam_index" alignment.sorted.bam.bai && |
22 ln -f -s "$alignment" alignment.sorted.bam && | 21 ln -f -s "$alignment" alignment.sorted.bam && |
23 bash $__tool_directory__/scripts/TEMP_Insertion.sh -x 30 -i alignment.sorted.bam -s $__tool_directory__/scripts -r "$consensus_te_seqs" -t "$bed_te_locations" -m 3 -f "$median_insertsize" -c \${GALAXY_SLOTS:-2} && | 22 bash $__tool_directory__/scripts/TEMP_Insertion.sh -x "$minimum_score_difference" -i alignment.sorted.bam -s $__tool_directory__/scripts -r "$consensus_te_seqs" -t "$te_locations" -m "$mismatches" -f "$median_insertsize" -c \${GALAXY_SLOTS:-2} && |
24 bash $__tool_directory__/scripts/TEMP_Absence.sh -i alignment.sorted.bam -s $__tool_directory__/scripts -r "$bed_te_locations" -t "$reference2bit" -f 500 -c \${GALAXY_SLOTS:-2} && | 23 bash $__tool_directory__/scripts/TEMP_Absence.sh -x "$minimum_score_difference" -i alignment.sorted.bam -s $__tool_directory__/scripts -r "$te_locations" -t "$reference2bit" -f 500 -c \${GALAXY_SLOTS:-2} && |
25 mv alignment.insertion.bp.bed $insertion_bed && | 24 zip archive.zip *insertion* *excision* *absence* && mv archive.zip $archive && |
26 mv alignment.insertion.refined.bp $insertion_bed_refined && | |
27 mv alignment.insertion.refined.bp.summary $insertion_summary && | 25 mv alignment.insertion.refined.bp.summary $insertion_summary && |
28 mv alignment.absence.refined.bp.summary $absence_summary && | 26 mv alignment.absence.refined.bp.summary $absence_summary |
29 zip archive.zip *insertion* *excision* *absence* && | |
30 mv archive.zip $archive | |
31 ]]></command> | 27 ]]></command> |
32 <inputs> | 28 <inputs> |
33 <param format="bam" name="alignment" type="data" label="Alignment bam file"/> | 29 <param format="bam" name="alignment" type="data" label="Alignment bam file"/> |
34 <param format="twobit" name="reference2bit" type="data" label="Reference twobit file"/> | 30 <param format="twobit" name="reference2bit" type="data" label="Reference twobit file"/> |
35 <param format="fasta" name="consensus_te_seqs" type="data" label="Consensus TE Seqs fasta file"/> | 31 <param format="fasta" name="consensus_te_seqs" type="data" label="Consensus TE Seqs fasta file"/> |
36 <param format="bed" name="bed_te_locations" type="data" label="TE Locations bed file"/> | 32 <param format="bed" name="te_locations" type="data" label="TE Locations bed file"/> |
37 <!-- | |
38 <param format="tabular" name="te_families" type="data" label="TE Families"/> | |
39 <param format="gff" name="gff_te_locations" type="data" label="Reference TE insertion Locations with Family ID names GFF file"/> | |
40 --> | |
41 <param format="txt" name="median_insertsize" type="data" label="Median Insert Length"/> | 33 <param format="txt" name="median_insertsize" type="data" label="Median Insert Length"/> |
34 <param name="mismatches" min="0" max="5" type="integer" value="3" label="Allow this many mismatches when aligning to TEs"/> | |
35 <param name="minimum_score_difference" type="integer" min="10" max="37" value="30" label="Minimum score difference between optimal and suboptimal alignment to consider read uniquely mapped"></param> | |
42 </inputs> | 36 </inputs> |
43 <outputs> | 37 <outputs> |
44 <data format="bed" type="data" name="insertion_bed" label="Insertion BED file" /> | |
45 <data format="bed" type="data" name="insertion_bed_refined" label="Insertion BED file (refined)" /> | |
46 <data format="bed" type="data" name="insertion_summary" label="Insertion summary file" /> | 38 <data format="bed" type="data" name="insertion_summary" label="Insertion summary file" /> |
47 <data format="bed" type="data" name="absence_summary" label="Absence summary file" /> | 39 <data format="bed" type="data" name="absence_summary" label="Absence summary file" /> |
48 <data format="zip" type="data" name="archive" label="Compressed output files" /> | 40 <data format="zip" type="data" name="archive" label="Compressed output files" /> |
49 </outputs> | 41 </outputs> |
50 <tests> | 42 <tests> |
51 <test> | 43 <test> |
52 <param name="alignment" value="test_chromosome.sorted.bam" ftype="bam"/> | 44 <param name="alignment" value="chr2l_bwa_mem.bam" ftype="bam"/> |
53 <param name="reference2bit" value="dm3_chr2L.2bit" ftype="twobit"/> | 45 <param name="reference2bit" value="dm6_chr2l.twobit" ftype="twobit"/> |
54 <param name="consensus_te_seqs" value="test_consensus.fa" ftype="fasta"/> | 46 <param name="consensus_te_seqs" value="test_consensus.fa" ftype="fasta"/> |
55 <param name="bed_te_locations" value="test_TE_annotation.bed" ftype="bed"/> | 47 <param name="te_locations" value="test_TE_annotation.gff3" ftype="bed"/> |
56 <output name="insertion_bed" file="test_chromosome.insertion.bp.bed" ftype="bed" /> | 48 <param name="median_insertsize" value="median_insert_size" ftype="txt"/> |
57 <output name="insertion_bed_refined" file="test_chromosome.insertion.refined.bp" ftype="bed"/> | |
58 <output name="insertion_summary" file="test_chromosome.insertion.refined.bp.summary" ftype="bed"/> | 49 <output name="insertion_summary" file="test_chromosome.insertion.refined.bp.summary" ftype="bed"/> |
59 <output name="absence_summary" file="test_chromosome.absence.refined.bp.summary" ftype="bed"/> | 50 <output name="absence_summary" file="test_chromosome.absence.refined.bp.summary" ftype="bed"/> |
60 </test> | 51 </test> |
61 </tests> | 52 </tests> |
62 <help> <![CDATA[ | 53 <help> <![CDATA[ |
69 Author: Jiali Zhuang (jiali.zhuang@umassmed.edu) and Jie Wang (jie.wangj@umassmed.edu) Weng Lab, University of Massachusetts Medical School, Worcester, MA, USA | 60 Author: Jiali Zhuang (jiali.zhuang@umassmed.edu) and Jie Wang (jie.wangj@umassmed.edu) Weng Lab, University of Massachusetts Medical School, Worcester, MA, USA |
70 | 61 |
71 For TE insertion analysis run TEMP_Insertion.sh in script. | 62 For TE insertion analysis run TEMP_Insertion.sh in script. |
72 For TE absence analysis run TEMP_Absence.sh in script. | 63 For TE absence analysis run TEMP_Absence.sh in script. |
73 | 64 |
65 Output files | |
66 ------------- | |
67 | |
68 | |
69 For TE insertion analysis there are 14 columns in the summary file:: | |
70 | |
71 Column 1: The chromosome where the detected insertion happens. | |
72 Column 2: The coordinate of the start position of the detected insertion. | |
73 Column 3: The coordinate of the end position of the detected insertion. | |
74 Column 4: The TE family that the detected insertion belongs to. | |
75 Column 5: The direction of the insertion. “Plus” means that the TE is integrated with the plus strand of the genome while “minus” means the TE is integrated with the minus strand. | |
76 Column 6: The class of the insertion. “1p1” means that the detected insertion is supported by reads at both sides. “2p” means the detected insertion is supported by more than 1 read at only 1 side. “Singleton” means the detected insertion is supported by only 1 read at 1 side. | |
77 Column 7: The total number of read pairs that support the detected insertion. | |
78 Column 8: The estimated population frequency of the detected insertion. | |
79 Columns 9 & 10: The coordinate of a junction and the number of the reads supporting it. If the junction is not found column 9 will be the arithmetic mean of the start and end coordinates and column 10 will have the value 0. | |
80 Columns 11 & 12: Same as Columns 9 & 10 except for the junction on the other strand. | |
81 Column 13: The number of reads supporting the detected insertion at the 5’ end of the TE (not including junction spanning reads). | |
82 Column 13: The number of reads supporting the detected insertion at the 3’ end of the TE (not including junction spanning reads). | |
83 | |
84 | |
85 For TE absence analysis there are 9 columns in the summary file:: | |
86 | |
87 Column 1: The chromosome where the detected absence happens. | |
88 Column 2: The coordinate of the start position of the detected absence. | |
89 Column 3: The coordinate of the end position of the detected absence. | |
90 Column 4: The TE family that the detected insertion belongs to. | |
91 Column 5: Junctions at 5’ of the excised TE. The two numbers are the coordinates of the junctions on the two strands. | |
92 Column 6: Junctions at 3’ of the excised TE. The two numbers are the coordinates of the junctions on the two strands. | |
93 Column 7: The number of reads supporting the absence. | |
94 Column 8: The number of reads supporting the reference (no absence). | |
95 Column 9: Estimated population frequency of the detected absence event. | |
96 | |
74 | 97 |
75 ]]> </help> | 98 ]]> </help> |
99 <citations> | |
100 <citation type="doi">10.1093/nar/gku323</citation> | |
101 </citations> | |
76 </tool> | 102 </tool> |