Galaxy |

Changeset 0:2dfbcb88d16a (2020-05-13)

Next changeset 1:bf4ee2810759 (2020-07-16)

Commit message:
"planemo upload for repository https://github.com/mhammell-laboratory/TEtranscripts commit 0afd89b76ba658b8bc9faa1463a1aa160ddb2339"

added:
test-data/control1.bam
test-data/control2.bam
test-data/gtf.gtf
test-data/te.gtf
test-data/treatment1.bam
test-data/treatment2.bam
tetranscript.xml

diff -r 000000000000 -r 2dfbcb88d16a test-data/control1.bam

Binary file test-data/control1.bam has changed

diff -r 000000000000 -r 2dfbcb88d16a test-data/control2.bam

Binary file test-data/control2.bam has changed

diff -r 000000000000 -r 2dfbcb88d16a test-data/gtf.gtf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/gtf.gtf Wed May 13 12:57:29 2020 -0400

b'@@ -0,0 +1,779 @@\n+chrX\trefGene\texon\t14118058\t14118761\t.\t+\t.\tgene_id "l(1)G0007"; transcript_id "NM_167396"; exon_number "3"; exon_id "NM_167396.3"; gene_name "l(1)G0007";\n+chrX\trefGene\t3UTR\t14118656\t14118761\t.\t+\t.\tgene_id "l(1)G0007"; transcript_id "NM_167396"; exon_number "3"; exon_id "NM_167396.3"; gene_name "l(1)G0007";\n+chr2L\trefGene\texon\t18711071\t18711733\t.\t-\t.\tgene_id "Irk3"; transcript_id "NM_136059"; exon_number "1"; exon_id "NM_136059.1"; gene_name "Irk3";\n+chr2L\trefGene\t3UTR\t18711071\t18711336\t.\t-\t.\tgene_id "Irk3"; transcript_id "NM_136059"; exon_number "1"; exon_id "NM_136059.1"; gene_name "Irk3";\n+chr2L\trefGene\texon\t11128807\t11129335\t.\t+\t.\tgene_id "Nup160"; transcript_id "NM_135649"; exon_number "14"; exon_id "NM_135649.14"; gene_name "Nup160";\n+chr2L\trefGene\t3UTR\t11128927\t11129335\t.\t+\t.\tgene_id "Nup160"; transcript_id "NM_135649"; exon_number "14"; exon_id "NM_135649.14"; gene_name "Nup160";\n+chr2L\trefGene\texon\t10324379\t10324990\t.\t+\t.\tgene_id "CG4995"; transcript_id "NM_135536"; exon_number "5"; exon_id "NM_135536.5"; gene_name "CG4995";\n+chr2L\trefGene\tCDS\t10324379\t10324962\t.\t+\t2\tgene_id "CG4995"; transcript_id "NM_135536"; exon_number "5"; exon_id "NM_135536.5"; gene_name "CG4995";\n+chr2L\trefGene\t3UTR\t10324966\t10324990\t.\t+\t.\tgene_id "CG4995"; transcript_id "NM_135536"; exon_number "5"; exon_id "NM_135536.5"; gene_name "CG4995";\n+chr2L\trefGene\tstop_codon\t10324963\t10324965\t.\t+\t0\tgene_id "CG4995"; transcript_id "NM_135536"; exon_number "1"; exon_id "NM_135536.1"; gene_name "CG4995";\n+chr2L\trefGene\texon\t6487562\t6488372\t.\t-\t.\tgene_id "KFase"; transcript_id "NM_135192"; exon_number "1"; exon_id "NM_135192.1"; gene_name "KFase";\n+chr2L\trefGene\t3UTR\t6487562\t6487596\t.\t-\t.\tgene_id "KFase"; transcript_id "NM_135192"; exon_number "1"; exon_id "NM_135192.1"; gene_name "KFase";\n+chr2L\trefGene\texon\t6063562\t6063771\t.\t-\t.\tgene_id "Fbw5"; transcript_id 
"NM_135145"; exon_number "1"; exon_id "NM_135145.1"; gene_name "Fbw5";\n+chr2L\trefGene\t3UTR\t6063562\t6063687\t.\t-\t.\tgene_id "Fbw5"; transcript_id "NM_135145"; exon_number "1"; exon_id "NM_135145.1"; gene_name "Fbw5";\n+chr2L\trefGene\texon\t4461657\t4462563\t.\t-\t.\tgene_id "CG15443"; transcript_id "NM_134995"; exon_number "1"; exon_id "NM_134995.1"; gene_name "CG15443";\n+chr2L\trefGene\t3UTR\t4461657\t4461823\t.\t-\t.\tgene_id "CG15443"; transcript_id "NM_134995"; exon_number "1"; exon_id "NM_134995.1"; gene_name "CG15443";\n+chr2L\trefGene\texon\t5521281\t5522007\t.\t-\t.\tgene_id "CG7371"; transcript_id "NM_135087"; exon_number "1"; exon_id "NM_135087.1"; gene_name "CG7371";\n+chr2L\trefGene\t3UTR\t5521281\t5521377\t.\t-\t.\tgene_id "CG7371"; transcript_id "NM_135087"; exon_number "1"; exon_id "NM_135087.1"; gene_name "CG7371";\n+chr2L\trefGene\tstop_codon\t5521378\t5521380\t.\t-\t0\tgene_id "CG7371"; transcript_id "NM_135087"; exon_number "1"; exon_id "NM_135087.1"; gene_name "CG7371";\n+chr2L\trefGene\texon\t4969285\t4970216\t.\t+\t.\tgene_id "CG3756"; transcript_id "NM_135041"; exon_number "2"; exon_id "NM_135041.2"; gene_name "CG3756";\n+chr2L\trefGene\t3UTR\t4970147\t4970216\t.\t+\t.\tgene_id "CG3756"; transcript_id "NM_135041"; exon_number "2"; exon_id "NM_135041.2"; gene_name "CG3756";\n+chr2L\trefGene\texon\t4815680\t4815891\t.\t+\t.\tgene_id "CG15629"; transcript_id "NM_135015"; exon_number "4"; exon_id "NM_135015.4"; gene_name "CG15629";\n+chr2L\trefGene\tCDS\t4815680\t4815779\t.\t+\t1\tgene_id "CG15629"; transcript_id "NM_135015"; exon_number "4"; exon_id "NM_135015.4"; gene_name "CG15629";\n+chr2R\trefGene\texon\t3709615\t3709990\t.\t-\t.\tgene_id "cathD"; transcript_id "NM_143756"; exon_number "1"; exon_id "NM_143756.1"; gene_name "cathD";\n+chr2R\trefGene\t3UTR\t3709615\t3709729\t.\t-\t.\tgene_id "cathD"; transcript_id "NM_143756"; exon_number "1"; exon_id "NM_143756.1"; gene_name 
"cathD";\n+chr2R\trefGene\texon\t11428922\t11430003\t.\t+\t.\tgene_id "Vha36-1"; transcript_id "NM_143730"; exon_number "1"; exon_id "NM_143730.1"; gene_name "Vha36-1";\n+chr2R\trefGene\tCDS\t11429042\t11429779\t.\t+\t0\tgene_id "Vha36-1"; transcript_id "NM_143730"; exon_number "1"; exon_id "NM_143730.1"'..b'M_167248.1"; gene_name "sesB";\n+chrX\trefGene\t3UTR\t10675026\t10675653\t.\t-\t.\tgene_id "sesB"; transcript_id "NM_167248"; exon_number "1"; exon_id "NM_167248.1"; gene_name "sesB";\n+chrX\trefGene\texon\t10675026\t10676128\t.\t-\t.\tgene_id "sesB"; transcript_id "NM_078554"; exon_number "1"; exon_id "NM_078554.1"; gene_name "sesB";\n+chrX\trefGene\t3UTR\t10675026\t10675653\t.\t-\t.\tgene_id "sesB"; transcript_id "NM_078554"; exon_number "1"; exon_id "NM_078554.1"; gene_name "sesB";\n+chrX\trefGene\texon\t10675026\t10676128\t.\t-\t.\tgene_id "sesB"; transcript_id "NM_167246"; exon_number "1"; exon_id "NM_167246.1"; gene_name "sesB";\n+chrX\trefGene\t3UTR\t10675026\t10675653\t.\t-\t.\tgene_id "sesB"; transcript_id "NM_167246"; exon_number "1"; exon_id "NM_167246.1"; gene_name "sesB";\n+chrX\trefGene\texon\t12607694\t12609320\t.\t-\t.\tgene_id "Smr"; transcript_id "NM_001272562"; exon_number "8"; exon_id "NM_001272562.8"; gene_name "Smr";\n+chrX\trefGene\tCDS\t12607694\t12609320\t.\t-\t1\tgene_id "Smr"; transcript_id "NM_001272562"; exon_number "8"; exon_id "NM_001272562.8"; gene_name "Smr";\n+chrX\trefGene\texon\t12607694\t12609302\t.\t-\t.\tgene_id "Smr"; transcript_id "NM_167334"; exon_number "8"; exon_id "NM_167334.8"; gene_name "Smr";\n+chrX\trefGene\tCDS\t12607694\t12609302\t.\t-\t1\tgene_id "Smr"; transcript_id "NM_167334"; exon_number "8"; exon_id "NM_167334.8"; gene_name "Smr";\n+chrX\trefGene\texon\t12607694\t12609302\t.\t-\t.\tgene_id "Smr"; transcript_id "NM_167335"; exon_number "8"; exon_id "NM_167335.8"; gene_name "Smr";\n+chrX\trefGene\tCDS\t12607694\t12609302\t.\t-\t1\tgene_id "Smr"; transcript_id "NM_167335"; exon_number "8"; exon_id 
"NM_167335.8"; gene_name "Smr";\n+chrX\trefGene\texon\t12607694\t12609302\t.\t-\t.\tgene_id "Smr"; transcript_id "NM_080536"; exon_number "8"; exon_id "NM_080536.8"; gene_name "Smr";\n+chrX\trefGene\tCDS\t12607694\t12609302\t.\t-\t1\tgene_id "Smr"; transcript_id "NM_080536"; exon_number "8"; exon_id "NM_080536.8"; gene_name "Smr";\n+chrX\trefGene\texon\t16199192\t16201410\t.\t+\t.\tgene_id "CG3679"; transcript_id "NM_001272674"; exon_number "3"; exon_id "NM_001272674.3"; gene_name "CG3679";\n+chrX\trefGene\t3UTR\t16200248\t16201410\t.\t+\t.\tgene_id "CG3679"; transcript_id "NM_001272674"; exon_number "3"; exon_id "NM_001272674.3"; gene_name "CG3679";\n+chrX\trefGene\texon\t16779109\t16779892\t.\t+\t.\tgene_id "Rcp"; transcript_id "NM_132947"; exon_number "3"; exon_id "NM_132947.3"; gene_name "Rcp";\n+chrX\trefGene\t3UTR\t16779550\t16779892\t.\t+\t.\tgene_id "Rcp"; transcript_id "NM_132947"; exon_number "3"; exon_id "NM_132947.3"; gene_name "Rcp";\n+chrX\trefGene\texon\t16779109\t16779892\t.\t+\t.\tgene_id "Rcp"; transcript_id "NM_206770"; exon_number "4"; exon_id "NM_206770.4"; gene_name "Rcp";\n+chrX\trefGene\t3UTR\t16779550\t16779892\t.\t+\t.\tgene_id "Rcp"; transcript_id "NM_206770"; exon_number "4"; exon_id "NM_206770.4"; gene_name "Rcp";\n+chrX\trefGene\texon\t19510696\t19511958\t.\t-\t.\tgene_id "CG12788"; transcript_id "NM_001272782"; exon_number "1"; exon_id "NM_001272782.1"; gene_name "CG12788";\n+chrX\trefGene\t3UTR\t19510696\t19510942\t.\t-\t.\tgene_id "CG12788"; transcript_id "NM_001272782"; exon_number "1"; exon_id "NM_001272782.1"; gene_name "CG12788";\n+chrX\trefGene\texon\t19510696\t19512220\t.\t-\t.\tgene_id "Tim9b"; transcript_id "NM_001031903"; exon_number "1"; exon_id "NM_001031903.1"; gene_name "Tim9b";\n+chrX\trefGene\t3UTR\t19510696\t19511983\t.\t-\t.\tgene_id "Tim9b"; transcript_id "NM_001031903"; exon_number "1"; exon_id "NM_001031903.1"; gene_name "Tim9b";\n+chrX\trefGene\texon\t19510696\t19512220\t.\t-\t.\tgene_id "CG12788"; transcript_id 
"NM_001272783"; exon_number "1"; exon_id "NM_001272783.1"; gene_name "CG12788";\n+chrX\trefGene\t3UTR\t19510696\t19510942\t.\t-\t.\tgene_id "CG12788"; transcript_id "NM_001272783"; exon_number "1"; exon_id "NM_001272783.1"; gene_name "CG12788";\n+chrX\trefGene\texon\t19510696\t19512220\t.\t-\t.\tgene_id "CG12788"; transcript_id "NM_134485"; exon_number "1"; exon_id "NM_134485.1"; gene_name "CG12788";\n+chrX\trefGene\t3UTR\t19510696\t19510942\t.\t-\t.\tgene_id "CG12788"; transcript_id "NM_134485"; exon_number "1"; exon_id "NM_134485.1"; gene_name "CG12788";\n'

diff -r 000000000000 -r 2dfbcb88d16a test-data/te.gtf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/te.gtf Wed May 13 12:57:29 2020 -0400

b'@@ -0,0 +1,866 @@\n+chr4\tdm3_rmsk\texon\t343119\t348355\t.\t+\t.\tgene_id "Stalker2_I"; transcript_id "Stalker2_I_dup2"; family_id "Gypsy"; class_id "LTR";\n+chr4\tdm3_rmsk\texon\t954243\t955152\t.\t-\t.\tgene_id "DMCR1A"; transcript_id "DMCR1A_dup25"; family_id "CR1"; class_id "LINE";\n+chr4\tdm3_rmsk\texon\t1281301\t1285200\t.\t-\t.\tgene_id "TART"; transcript_id "TART_dup3"; family_id "telomeric"; class_id "LINE";\n+chr4\tdm3_rmsk\texon\t1298748\t1302519\t.\t-\t.\tgene_id "HETA"; transcript_id "HETA_dup2"; family_id "telomeric"; class_id "LINE";\n+chr4\tdm3_rmsk\texon\t1325146\t1336223\t.\t-\t.\tgene_id "TART"; transcript_id "TART_dup10"; family_id "telomeric"; class_id "LINE";\n+chr4\tdm3_rmsk\texon\t1338128\t1349150\t.\t-\t.\tgene_id "TART"; transcript_id "TART_dup15"; family_id "telomeric"; class_id "LINE";\n+chrU\tdm3_rmsk\texon\t191398\t191854\t.\t+\t.\tgene_id "BURDOCK_I"; transcript_id "BURDOCK_I_dup3"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t276311\t276724\t.\t+\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup5"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t276725\t281011\t.\t+\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup7"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t357869\t358422\t.\t-\t.\tgene_id "DMCR1A"; transcript_id "DMCR1A_dup58"; family_id "CR1"; class_id "LINE";\n+chrU\tdm3_rmsk\texon\t444361\t445162\t.\t-\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup10"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t445163\t445576\t.\t-\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup8"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t560147\t564265\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup5"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t585727\t586749\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup7"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t923349\t923833\t.\t-\t.\tgene_id "T412LTR"; transcript_id 
"T412LTR"; family_id "LTR"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t923724\t930674\t.\t-\t.\tgene_id "DM412"; transcript_id "DM412_dup20"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t930358\t930842\t.\t-\t.\tgene_id "T412LTR"; transcript_id "T412LTR_dup1"; family_id "LTR"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t977434\t977847\t.\t+\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup9"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t977848\t984017\t.\t+\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup11"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1068318\t1074427\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup12"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1145421\t1151606\t.\t-\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup14"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1183521\t1184031\t.\t-\t.\tgene_id "DNAREP1_DM"; transcript_id "DNAREP1_DM_dup737"; family_id "Penelope"; class_id "LINE";\n+chrU\tdm3_rmsk\texon\t1210262\t1212598\t.\t-\t.\tgene_id "Gypsy12_LTR"; transcript_id "Gypsy12_LTR_dup7"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1217990\t1220370\t.\t-\t.\tgene_id "Gypsy12_LTR"; transcript_id "Gypsy12_LTR_dup8"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1223765\t1226146\t.\t-\t.\tgene_id "Gypsy12_LTR"; transcript_id "Gypsy12_LTR_dup9"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1293346\t1293758\t.\t+\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup12"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1293759\t1298196\t.\t+\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup15"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1308708\t1311586\t.\t-\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup17"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1420117\t1423754\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup22"; family_id "Gypsy"; class_id 
"LTR";\n+chrU\tdm3_rmsk\texon\t1443400\t1449972\t.\t-\t.\tgene_id "NOMAD_I"; transcript_id "NOMAD_I_dup15"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3_rmsk\texon\t1572762\t1573180\t.\t-\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup24"; family_id "Gypsy"; class_id "LTR";\n+chrU\tdm3'..b'8"; family_id "Copia"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t24345996\t24346636\t.\t+\t.\tgene_id "Gypsy12_LTR"; transcript_id "Gypsy12_LTR_dup545"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t24360836\t24361477\t.\t+\t.\tgene_id "QUASIMODO_I"; transcript_id "QUASIMODO_I_dup723"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t24576989\t24577527\t.\t+\t.\tgene_id "IDEFIX_LTR"; transcript_id "IDEFIX_LTR_dup341"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t24811648\t24812150\t.\t+\t.\tgene_id "QUASIMODO_LTR"; transcript_id "QUASIMODO_LTR_dup391"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25197241\t25197870\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1185"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25294542\t25294915\t.\t+\t.\tgene_id "IDEFIX_LTR"; transcript_id "IDEFIX_LTR_dup342"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25304648\t25305061\t.\t+\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup253"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25305062\t25305121\t.\t+\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup679"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25319135\t25319332\t.\t-\t.\tgene_id "Copia2_LTR_DM"; transcript_id "Copia2_LTR_DM_dup129"; family_id "Copia"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25431843\t25432469\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1194"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t25722607\t25722945\t.\t+\t.\tgene_id "TIRANT_I"; transcript_id "TIRANT_I_dup139"; family_id "Gypsy"; class_id 
"LTR";\n+chrUextra\tdm3_rmsk\texon\t25919521\t25919667\t.\t-\t.\tgene_id "Copia2_LTR_DM"; transcript_id "Copia2_LTR_DM_dup130"; family_id "Copia"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t26246267\t26246681\t.\t+\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup255"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t26246682\t26246789\t.\t+\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup682"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t26305984\t26306164\t.\t-\t.\tgene_id "QUASIMODO_LTR"; transcript_id "QUASIMODO_LTR_dup396"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t26399753\t26400360\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1224"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t26779758\t26780354\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1237"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t26821013\t26821485\t.\t-\t.\tgene_id "Gypsy4_I"; transcript_id "Gypsy4_I_dup648"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t27117304\t27117501\t.\t-\t.\tgene_id "Copia2_LTR_DM"; transcript_id "Copia2_LTR_DM_dup132"; family_id "Copia"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t27229943\t27230524\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1247"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t27234053\t27234637\t.\t+\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1248"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t27886616\t27886879\t.\t-\t.\tgene_id "IDEFIX_LTR"; transcript_id "IDEFIX_LTR_dup350"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t27905485\t27905571\t.\t-\t.\tgene_id "DM297_I"; transcript_id "DM297_I_dup690"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t27905572\t27905891\t.\t-\t.\tgene_id "DM297_LTR"; transcript_id "DM297_LTR_dup262"; family_id "Gypsy"; class_id 
"LTR";\n+chrUextra\tdm3_rmsk\texon\t28209068\t28209265\t.\t+\t.\tgene_id "Copia2_LTR_DM"; transcript_id "Copia2_LTR_DM_dup133"; family_id "Copia"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t28715167\t28715519\t.\t+\t.\tgene_id "TABOR_I"; transcript_id "TABOR_I_dup112"; family_id "Gypsy"; class_id "LTR";\n+chrUextra\tdm3_rmsk\texon\t28866030\t28866253\t.\t+\t.\tgene_id "SAR_DM"; transcript_id "SAR_DM_dup7047"; family_id "Satellite"; class_id "Satellite";\n+chrUextra\tdm3_rmsk\texon\t28961580\t28961826\t.\t-\t.\tgene_id "STALKER4_I"; transcript_id "STALKER4_I_dup1265"; family_id "Gypsy"; class_id "LTR";\n'

diff -r 000000000000 -r 2dfbcb88d16a test-data/treatment1.bam

Binary file test-data/treatment1.bam has changed

diff -r 000000000000 -r 2dfbcb88d16a test-data/treatment2.bam

Binary file test-data/treatment2.bam has changed

diff -r 000000000000 -r 2dfbcb88d16a tetranscript.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tetranscript.xml Wed May 13 12:57:29 2020 -0400

[

b'@@ -0,0 +1,299 @@\n+<?xml version="1.0"?>\n+<tool id="tetoolkit_tetranscripts" name="TEtranscripts" version="@TOOL_VERSION@+@WRAPPER_VERSION@">\n+ <description>annotates reads to genes and transposable elements</description>\n+ <macros>\n+ <token name="@TOOL_VERSION@">2.1.4</token>\n+ <token name="@WRAPPER_VERSION@">galaxy0</token>\n+ </macros>\n+ <requirements>\n+ <requirement type="package" version="@TOOL_VERSION@">tetranscripts</requirement>\n+ </requirements>\n+ <version_command>TEtranscripts --version</version_command>\n+ <command detect_errors="exit_code"><![CDATA[\n+ ## initialize\n+ ## file extension is required\n+ ln -s \'$GTF\' \'gene_annotation.gtf\' &&\n+ ln -s \'$TE\' \'transposable_annotation.gtf\' &&\n+\n+ ## run\n+ TEtranscripts\n+ ## required\n+ -t\n+ #for $s in $sample_rep\n+ \'${s.t}\'\n+ #end for\n+ -c\n+ #for $s in $sample_rep\n+ \'${s.c}\'\n+ #end for\n+ --GTF \'gene_annotation.gtf\'\n+ --TE \'transposable_annotation.gtf\'\n+ ## optional\n+ --stranded \'$io.stranded\'\n+ $io.sortByPos\n+ --project \'result\'\n+ --mode \'$ap.mode\'\n+ --minread $ap.minread\n+ #if $ap.fragmentLength\n+ --fragmentLength $ap.fragmentLength\n+ #end if\n+ --iteration $ap.iteration\n+ --padj $ap.padj\n+ --foldchange $ap.foldchange\n+ #if \'log\' in $ap.out\n+ --verbose 3\n+ |& tee log.txt\n+ #end if\n+ ]]></command>\n+ <inputs>\n+ <repeat name="sample_rep" min="2" title="Select input data">\n+ <param argument="-t" type="data" format="bam" label="Treatment sample file"/>\n+ <param argument="-c" type="data" format="bam" label="Control sample file"/>\n+ </repeat>\n+ <param argument="--GTF" type="data" format="gtf" label="Select GTF file for gene annotations"/>\n+ <param argument="--TE" type="data" format="gtf" label="Select GTF file for transposable element annotations"/>\n+ <section name="io" title="Input options">\n+ <param argument="--stranded" type="select" label="Select library type">\n+ <option value="no">Library is unstranded (no)</option>\n+ <option 
value="forward">Second-strand cDNA library e.g. QIAseq stranded (forward)</option>\n+ <option value="reverse">First-strand cDNA library e.g. Illumina TruSeq stranded (reverse)</option>\n+ </param>\n+ <param argument="--sortByPos" type="boolean" truevalue="--sortByPos" falsevalue="" label="Are input files sorted by chromosome position?"/>\n+ </section>\n+ <section name="ap" title="Advanced parameters">\n+ <param argument="--mode" type="select" label="Set TE counting mode">\n+ <option value="multi">Distribute among all alignments (multi)</option>\n+ <option value="uniq">Unique mappers only (uniq)</option>\n+ </param>\n+ <param argument="--minread" type="integer" value="1" min="0" label="Set read count cutoff"/>\n+ <param argument="--fragmentLength" type="integer" min="0" optional="true" label="Set average length of fragment used for single-end sequencing" help="For paired-end, estimated from the input alignment file. For single-end, ignored by default."/>\n+ <param argument="--iteration" type="integer" value="100" min="0" label="Set maximum number of iterations used to optimize multi-reads assignment"/>\n+ <param argument="--padj" type="float" value="0.05" min="0.0" max="1.0" label="Set FDR cutoff for significance"/>\n+ <param argument="--foldchange" type="float" value="1.0" min="0.0" label="Set fold-change ratio (absolute) cutoff for differential expression"/>\n+ <param name="out" type="select" multiple="true'..b'hing expression="gene.+"/>\n+ \n+ <has_text_matching expression="TIRANT.+"/>\n+ </assert_contents>\n+ </output>\n+ <output name="out_deseq2">\n+ <assert_contents>\n+ <has_n_lines n="14"/>\n+ <has_text_matching expression="data.+"/>\n+ </assert_contents>\n+ </output>\n+ <output name="out_log">\n+ <assert_contents>\n+ <has_text_matching expression="INFO.+"/>\n+ </assert_contents>\n+ </output>\n+ <output name="out_gta">\n+ <assert_contents>\n+ <has_n_lines n="23"/>\n+ <has_line line="baseMean	log2FoldChange	lfcSE	stat	pvalue	padj"/>\n+ \n+ <has_text_matching 
expression="TART.+"/>\n+ </assert_contents>\n+ </output>\n+ <output name="out_sgt">\n+ <assert_contents>\n+ <has_n_lines n="2"/>\n+ <has_line line="baseMean	log2FoldChange	lfcSE	stat	pvalue	padj"/>\n+ <has_text_matching expression="Gypsy12.+"/>\n+ </assert_contents>\n+ </output>\n+ </test>\n+ </tests>\n+ <help><![CDATA[\n+.. class:: infomark\n+\n+**What it does**\n+\n+TEtranscripts is a software package that utilizes both unambiguously (uniquely) and ambiguously (multi-) mapped reads to perform differential enrichment analyses from high throughput sequencing experiments. Currently, most expression analysis software packages are not optimized for handling the complexities involved in quantifying highly repetitive regions of the genome, especially transposable elements (TE), from short sequencing reads. Although transposable elements make up between 20 and 80% of many eukaryotic genomes and contribute significantly to the cellular transcriptome output, the difficulty in quantifying their abundances from high throughput sequencing experiments has led them to be largely ignored in most studies. TEtranscripts provides a noticeable improvement in the recovery of TE transcripts from RNA-Seq experiments and identification of peaks associated with repetitive regions of the genome.\n+\n+**Input**\n+\n+GTF files for gene annotation can be obtained from `UCSC RefSeq <http://genome.ucsc.edu/cgi-bin/hgTables>`_, Ensembl, `iGenomes <http://support.illumina.com/sequencing/sequencing_software/igenome.html>`_ or other annotation databases. GTF files for TE annotations are custom-generated from `UCSC RepeatMasker <http://genome.ucsc.edu/cgi-bin/hgTables>`_ or other annotation databases. They contain two custom attributes, class_id and family_id, corresponding to the class (e.g. LINE) and family (e.g. L1) of the corresponding transposable element. A unique ID (e.g. 
L1Md_Gf_dup1) is also assigned for each TE annotation in the transcript_id attribute.\n+\n+**Output**\n+\n+TEtranscripts quantifies both gene and transposable element (TE) transcript abundances from RNA-Seq experiments, utilizing both uniquely and ambiguously mapped short read sequences. It processes the short-read alignments (BAM files) and proportionally assigns read counts to the corresponding gene or TE based on the user-provided annotation files (GTF files). In addition, TEtranscripts combines multiple libraries and performs differential analysis using DESeq2.\n+\n+.. class:: infomark\n+\n+**References**\n+\n+More information is available on the `project website <http://hammelllab.labsites.cshl.edu/software/#TEtranscripts>`_ and `GitHub <https://github.com/mhammell-laboratory/TEtranscripts>`_.\n+ ]]></help>\n+ <citations>\n+ <citation type="doi">10.1093/bioinformatics/btv422</citation>\n+ <citation type="doi">10.1007/978-1-4939-7710-9_11</citation>\n+ </citations>\n+</tool>\n\\ No newline at end of file\n'