# HG changeset patch # User charles-bernard # Date 1475959125 14400 # Node ID 3909de8ec6446a6b0e1ad5e08451dab24ecd7ee6 # Parent 3771cb0a9e12627cd73b5a24e8ef31a58d873954 Uploaded diff -r 3771cb0a9e12 -r 3909de8ec644 alfa/alfa/alfa_wrapper.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/alfa/alfa/alfa_wrapper.xml Sat Oct 08 16:38:45 2016 -0400 @@ -0,0 +1,333 @@ + + - Compute and display distribution of reads by genomic categories + + + + bedtools + + + + + + + alfa_wrapper.sh ${ALFA_config} $logReport + + + + + + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + +
+ +
+ + + +
+ +
+ + + + + + + + + + + + + + + + + + +
+
+ + + + + + outputFiles['plot'] is True and outputOptions['plotFormat'] == 'pdf' + + + outputFiles['plot'] is True and outputOptions['plotFormat'] == 'png' + + + outputFiles['plot'] is True and outputOptions['plotFormat'] == 'png' + + + outputFiles['plot'] is True and outputOptions['plotFormat'] == 'svg' + + + outputFiles['plot'] is True and outputOptions['plotFormat'] == 'svg' + + + outputFiles['countFile'] is True + + + outputFiles['index'] is True + + + outputFiles['index'] is True + + + + + + projectName=$projectName + + ##__INPUT 1__## + annotationSource=$annotation.annotationSource['annotationSourceSelection'] + #if str ( $annotation.annotationSource['annotationSourceSelection'] ) == "index" + annotationFile=None + strandedIndex=$annotation.annotationSource['strandedIndex'] + unstrandedIndex=$annotation.annotationSource['unstrandedIndex'] + #else + #if str ( $annotation.annotationSource['annotationSourceSelection'] ) == "personal_gtf" + annotationFile=$annotation.annotationSource['annotationFile'] + #else + annotationFile=$annotation.annotationSource['annotationFile'] + #end if + strandedIndex=None + unstrandedIndex=None + #end if + + ##__INPUT 2__## + readsType=$reads.readsType['readsTypeSelection'] + #for $i, $r in enumerate ( $reads.readsType['readsList'] ) + readsFile[$i]=$r.readsFile + readsLabel[$i]=$r.readsLabel + #end for + strandness=$reads['strandness'] + + ##__OUTPUT FILES__## + plotChoice=$outputFiles['plot'] + countFileChoice=$outputFiles['countFile'] + indexChoice=$outputFiles['index'] + + outputPdf=$outputPdf + outputCategoriesPng=$outputCategoriesPng + outputBiotypesPng=$outputBiotypesPng + outputCategoriesSvg=$outputCategoriesSvg + outputBiotypesSvg=$outputBiotypesSvg + outputCountFile=$outputCountFile + outputStrandedIndex=$outputStrandedIndex + outputUnstrandedIndex=$outputUnstrandedIndex + + ##__OUTPUT OPTIONS__## + categoriesDepth=$outputOptions['categoriesDepth'] + plotFormat=$outputOptions['plotFormat'] + plotThresholdChoice=$outputOptions.plotThreshold['plotThresholdChoice'] + #if str ( $outputOptions.plotThreshold['plotThresholdChoice'] ) == "True" + yMin=$outputOptions.plotThreshold.yMin + yMax=$outputOptions.plotThreshold.yMax + #else + yMin=None + yMax=None + #end if + + + + + + +
+ + + + +
+
+ + + + + + + + +
+
+ + + +
+
+ + + + + +
+ + + + + + + +
+
+ + +**ALFA acronym** + +- Annotation.Landscape.For.Aligned reads + +---- + +**What it does** + + | ALFA provides a global overview of features distribution composing New Generation Sequencing dataset(s). + | + | Given a set of aligned reads (BAM files) and an annotation file (GTF format), the tool produces plots of the raw and normalized distributions of those reads among genomic categories (stop codon, 5'-UTR, CDS, intergenic, etc.) and biotypes (protein coding genes, miRNA, tRNA, etc.). Whatever the sequencing technique, whatever the organism. + +---- + +**Official documentation of the tool** + + +- https://github.com/biocompibens/ALFA + +---- + +**Detailed example** + +- https://github.com/biocompibens/ALFA#detailed-example + +---- + +**Nota Bene** + +1. **Input 1: Annotation File** + + + | ALFA requires as first input an annotation file (sequence, genome...) in gtf format in order to generate indexes that will be used in a 2nd step of the program. + | Indexes are files which list all the coordinates of all categories (stop codon, 5'-UTR, CDS, intergenic...) and biotypes (protein coding genes, miRNA, tRNA, ...) encountered in the annotated sequence. + +.. class:: warningmark + +Gtf File must be sorted. + +.. class:: infomark + +Generation of indexes from an annotation file may be time consuming (i.e ~10min for the human genome). Thus, ALFA allows the user to submit directly indexes generated in previous runs. + +2. **Input 2: Reads** + + | ALFA requires as second input a single or a set of mapped reads file(s) in either bam or bedgraph format. These files are required to intersect the coordinates of the mapped reads with the associated categories and biotypes on the annotated sequence. + | The strandness option determines which strand of the annotated sequence will be taken into account during this intersection. + +.. class:: warningmark + +Bam or Bedgraph file(s) must be sorted. + + + +3. **Output files** + + | The result of the intersection is a count file displaying the count of nucleotides in the reads for each genomic categories and biotypes. From this count file, plots of the raw and normalized distributions of the reads among these categories are generated. + | In the output files section, the user can choose what kind of files he desires as ALFA output. Categories Count File and Plots are proposed by default. + +.. class:: infomark + +The user can also select the 'indexes' option as output. This option is interesting if you plan to run ALFA again with the same submitted annotation file. *See Nota Bene/Input 1: Annotation File for more information.* + + +- `How the plots look like`_ + +.. _How the plots look like: https://github.com/biocompibens/ALFA#plots + +- `How they are generated`_ + +.. _How they are generated: https://github.com/biocompibens/ALFA#detailed-example + +---- + +**ALFA Developpers** + + | Benoît Noël and Mathieu Bahin: *compbio team, Institut de Biologie de l'Ecole Normale Supérieure de Paris* + + + + + + @MISC{ + author="Benoît Noël and Mathieu Bahin" + title="ALFA: Annotation Landscape For Aligned reads" + crossref="https://github.com/biocompibens/ALFA" + institution="Institut de Biologie de l'Ecole Normale Supérieure de Paris" + } + + +
\ No newline at end of file