# HG changeset patch # User jjohnson # Date 1629385997 0 # Node ID 604d9b0ad9a45cc2121232a44bbb28fdd1742e71 "planemo upload commit 77a5370a0978b5332bb3a9f063588a52a468ea08" diff -r 000000000000 -r 604d9b0ad9a4 fgbio_trim_fastq.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/fgbio_trim_fastq.xml Thu Aug 19 15:13:17 2021 +0000 @@ -0,0 +1,68 @@ + + Sorts the records in a FASTQ file based on the lexicographic ordering of their read names + + macros.xml + + + fgbio --version + + + + + + + + + + + + + + + + + + + + + + + + + + + (output_options['multiple_output'] is False) + + + + (library['type'] == 'paired' or library['type'] == 'paired_collection') + + + + + + diff -r 000000000000 -r 604d9b0ad9a4 macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Thu Aug 19 15:13:17 2021 +0000 @@ -0,0 +1,254 @@ + + 1.3.0 + 1 + + + fgbio + + + + + + @online{fgbio, + author = {Tim Fennell, Nils Homer}, + title = {fgbio}, + year = 2015, + url = {https://github.com/fulcrumgenomics/fgbio}, + urldate = {2021-03-01} + } + + + (([1-9][0-9]*[TBMS])*([+]|[1-9][0-9]*)[TBMS]) + @READ_STRUCTURE_PATTERN@(\s@READ_STRUCTURE_PATTERN@)* + + ^@READ_STRUCTURES_PATTERN@$ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + ^[A-Za-z][A-Za-z]$ + + + + + + + + + + + + + + + + + + + + + + pairs much like the CIGAR string in BAM files. Four kinds of operators are recognized: + + - T identifies a template read + - B identifies a sample barcode read + - M identifies a unique molecular index read + - S identifies a set of bases that should be skipped or ignored + +The last pair may be specified using a + sign instead of number to denote “all remaining bases”. This is useful if, e.g., fastqs have been trimmed and contain reads of varying length. For example to convert a paired-end run with an index read and where the first 5 bases of R1 are a UMI and the second five bases are monotemplate you might specify: + +:: + + --input r1.fq r2.fq i1.fq --read-structures 5M5S+T +T +B + +Alternative if you know your reads are of fixed length you could specify: + +:: + + --input r1.fq r2.fq i1.fq --read-structures 5M5S65T 75T 8B + + +]]> + + + + + +