Repository 'apollo_export'
hg clone https://toolshed.g2.bx.psu.edu/repos/gga/apollo_export

Changeset 13:b763acecfb57 (2020-06-29)
Previous changeset 12:257230cd202f (2020-04-24) Next changeset 14:0d4234488bd0 (2020-08-19)
Commit message:
"planemo upload for repository https://github.com/galaxy-genome-annotation/galaxy-tools/tree/master/tools/apollo commit 7bf18c69becc57152efdadedf7ebd0bcfa382a15"
modified:
create_features_from_gff3.py
export.py
export.xml
fetch_organism_jbrowse.py
macros.xml
test-data/create_org/output.json
test-data/create_org/output2.json
test-data/export/cdna.fa
test-data/export/cds.fa
test-data/export/pep.fa
added:
test-data/load_gff3/output.txt
removed:
test-data/load_gff3/output.tsv
b
diff -r 257230cd202f -r b763acecfb57 create_features_from_gff3.py
--- a/create_features_from_gff3.py Fri Apr 24 08:55:57 2020 -0400
+++ b/create_features_from_gff3.py Mon Jun 29 09:11:39 2020 -0400
b
@@ -1,5 +1,6 @@
 #!/usr/bin/env python
 import argparse
+import json
 import logging
 
 from apollo import accessible_organisms
@@ -16,6 +17,8 @@
     parser = argparse.ArgumentParser(description='Sample script to add an attribute to a feature via web services')
     parser.add_argument('email', help='User Email')
     parser.add_argument('--source', help='URL where the input dataset can be found.')
+    parser.add_argument('--use_name', action='store_true', help='Use the given name instead of generating one.')
+    parser.add_argument('--disable_cds_recalculation', action='store_true', help='Disable CDS recalculation and instead use the one provided.')
     OrgOrGuess(parser)
 
     parser.add_argument('gff3', type=argparse.FileType('r'), help='GFF3 file')
@@ -42,4 +45,5 @@
     if not orgs:
         raise Exception("You do not have write permission on this organism")
 
-    wa.annotations.load_gff3(org_cn, args.gff3, args.source)
+    load_result = wa.annotations.load_gff3(org_cn, args.gff3, args.source, use_name=args.use_name, disable_cds_recalculation=args.disable_cds_recalculation)
+    print(json.dumps(load_result, indent=2))
b
diff -r 257230cd202f -r b763acecfb57 export.py
--- a/export.py Fri Apr 24 08:55:57 2020 -0400
+++ b/export.py Mon Jun 29 09:11:39 2020 -0400
[
@@ -52,28 +52,28 @@
 
         uuid_gff = wa.io.write_downloadable(org['commonName'], 'GFF3', export_gff3_fasta=True, sequences=seqs)
         if 'error' in uuid_gff or 'uuid' not in uuid_gff:
-            raise Exception("Apollo failed to prepare the file for download: %s" % uuid_gff)
+            raise Exception("Apollo failed to prepare the GFF3 file for download: %s" % uuid_gff)
         args.gff.write(wa.io.download(uuid_gff['uuid'], output_format="text"))
 
         time.sleep(1)
 
         uuid_vcf = wa.io.write_downloadable(org['commonName'], 'VCF', sequences=seqs)
         if 'error' in uuid_vcf or 'uuid' not in uuid_vcf:
-            raise Exception("Apollo failed to prepare the file for download: %s" % uuid_vcf)
+            raise Exception("Apollo failed to prepare the VCF file for download: %s" % uuid_vcf)
         args.vcf.write(wa.io.download(uuid_vcf['uuid'], output_format="text"))
 
         time.sleep(1)
 
         uuid_fa = wa.io.write_downloadable(org['commonName'], 'FASTA', sequences=seqs, seq_type='cdna')
         if 'error' in uuid_fa or 'uuid' not in uuid_fa:
-            raise Exception("Apollo failed to prepare the file for download: %s" % uuid_fa)
+            raise Exception("Apollo failed to prepare the cdna FASTA file for download: %s" % uuid_fa)
         args.fasta_cdna.write(wa.io.download(uuid_fa['uuid'], output_format="text"))
 
         time.sleep(1)
 
         uuid_fa = wa.io.write_downloadable(org['commonName'], 'FASTA', sequences=seqs, seq_type='cds')
         if 'error' in uuid_fa or 'uuid' not in uuid_fa:
-            raise Exception("Apollo failed to prepare the file for download: %s" % uuid_fa)
+            raise Exception("Apollo failed to prepare the cds FASTA file for download: %s" % uuid_fa)
         args.fasta_cds.write(wa.io.download(uuid_fa['uuid'], output_format="text"))
 
         time.sleep(1)
b
diff -r 257230cd202f -r b763acecfb57 export.xml
--- a/export.xml Fri Apr 24 08:55:57 2020 -0400
+++ b/export.xml Mon Jun 29 09:11:39 2020 -0400
b
@@ -49,7 +49,6 @@
               <assert_contents>
                   <has_text text="##sequence-region Merlin 1 172788" />
                   <has_text text="owner=admin@local.host;" />
-                  <has_text text="Name=cds-not-under-exon" />
               </assert_contents>
           </output>
           <output name="fasta_pep" file="export/pep.fa" lines_diff="12"/>
@@ -59,7 +58,6 @@
           <output name="json_out">
               <assert_contents>
                   <has_text text="test_organism" />
-                  <has_text text="apollo_shared_dir/org1" />
               </assert_contents>
           </output>
       </test>
b
diff -r 257230cd202f -r b763acecfb57 fetch_organism_jbrowse.py
--- a/fetch_organism_jbrowse.py Fri Apr 24 08:55:57 2020 -0400
+++ b/fetch_organism_jbrowse.py Mon Jun 29 09:11:39 2020 -0400
b
@@ -57,7 +57,7 @@
 
 
 if __name__ == '__main__':
-    parser = argparse.ArgumentParser(description='Sample script to add an attribute to a feature via web services')
+    parser = argparse.ArgumentParser(description='Script to fetch organism data dir from apollo')
     OrgOrGuess(parser)
     parser.add_argument('target_dir', help='Target directory')
     parser.add_argument('email', help='User Email')
b
diff -r 257230cd202f -r b763acecfb57 macros.xml
--- a/macros.xml Fri Apr 24 08:55:57 2020 -0400
+++ b/macros.xml Mon Jun 29 09:11:39 2020 -0400
b
@@ -1,10 +1,10 @@
 <?xml version="1.0"?>
 <macros>
-  <token name="@WRAPPER_VERSION@">4.2.1</token>
+  <token name="@WRAPPER_VERSION@">4.2.3</token>
 
   <xml name="requirements">
     <requirements>
-      <requirement type="package" version="4.2.1">apollo</requirement>
+      <requirement type="package" version="4.2.3">apollo</requirement>
       <yield/>
     </requirements>
   </xml>
b
diff -r 257230cd202f -r b763acecfb57 test-data/create_org/output.json
--- a/test-data/create_org/output.json Fri Apr 24 08:55:57 2020 -0400
+++ b/test-data/create_org/output.json Mon Jun 29 09:11:39 2020 -0400
b
@@ -1,7 +1,7 @@
 {
   "commonName": "Test org",
   "blatdb": "/data/temporary/apollo_data/1384-Test_org/searchDatabaseData/genome.2bit",
-  "metadata": "{\"creator\":\"20\"}",
+  "metadata": "{\"creator\":\"xx\"}",
   "annotationCount": 0,
   "currentOrganism": true,
   "obsolete": false,
@@ -11,6 +11,6 @@
   "valid": true,
   "genus": "genus",
   "species": null,
-  "id": 23,
+  "id": "xx",
   "nonDefaultTranslationTable": null
 }
b
diff -r 257230cd202f -r b763acecfb57 test-data/create_org/output2.json
--- a/test-data/create_org/output2.json Fri Apr 24 08:55:57 2020 -0400
+++ b/test-data/create_org/output2.json Mon Jun 29 09:11:39 2020 -0400
b
@@ -1,7 +1,7 @@
 {
   "commonName": "Test org",
   "blatdb": "/data/temporary/apollo_data/1384-Test_org/searchDatabaseData/genome.2bit",
-  "metadata": "{\"creator\":\"20\"}",
+  "metadata": "{\"creator\":\"xx\"}",
   "annotationCount": 0,
   "currentOrganism": true,
   "obsolete": false,
@@ -11,6 +11,6 @@
   "valid": true,
   "genus": "genus2",
   "species": "sp",
-  "id": 23,
+  "id": "xx",
   "nonDefaultTranslationTable": null
 }
b
diff -r 257230cd202f -r b763acecfb57 test-data/export/cdna.fa
--- a/test-data/export/cdna.fa Fri Apr 24 08:55:57 2020 -0400
+++ b/test-data/export/cdna.fa Mon Jun 29 09:11:39 2020 -0400
[
@@ -1,4 +1,4 @@
->ff2fe902-7bab-431c-be82-30ed072915d1 (mRNA) 690 residues [Merlin:2-691 + strand] [cdna] name=Unknown
+>df4157db-1481-4120-858c-e6a4c0f78547 (mRNA) 690 residues [Merlin:2-691 + strand] [cdna] name=Merlin_1_mRNA-00001
 CGTTTAGACAAAGGTACATTATTGTATCGTGGCCAAAAATTAGACCTTCCTACATTCGAG
 CATAACGCAGAGAATAAGTTGTTCTATTTCAGAAACTACGTTTCAACTTCATTAAAGCCT
 CTGATCTTTGGTGAATTTGGTCGTATGTTTATGGCACTAGATGACGATACTACAATTTAT
@@ -11,13 +11,13 @@
 CTGTTCATGGAAACAGGTGAAGTAGTAAAACTGTCCGGATTCATGCAGTTCGTCAACGAA
 TCTGCATACGATGAAGAGCAAAACCAGATGGCTGCTGAGATTCTGTCTGGATTCTTGGAC
 ATTGATGACATGCCACGTAAGTTCCGCTAG
->f2e1909a-1d40-4a49-a67b-5fe2afdc4957 (mRNA) 288 residues [Merlin:752-1039 + strand] [cdna] name=Unknown
+>eedd9b31-f1dd-487c-a3ab-6435b2214685 (mRNA) 288 residues [Merlin:752-1039 + strand] [cdna] name=mrna-name-00001
 ATGAAATCAATTTTTCGTATCAACGGTGTAGAAATTGTAGTTGAAGATGTAGTTCCTATG
 TCTTATGAATTCAATGAAGTTGTTTTCAAAGAGCTTAAGAAAATTTTAGGCGATAAGAAG
 CTTCAAAGTACTCCAATTGGACGTTTTGGAATGAAAGAAAACGTTGATACTTATATTGAA
 AGTGTAGTGACAGGGCAGTTAGAAGGTGAATTTTCTGTAGCAGTTCAAACTGTAGAAAAT
 GATGAAGTTATTTTAACTTTACCAGCTTTCGTAATTTTCCGCAAATAA
->12fe0db6-c8e1-4bc9-b594-87c92c6c9669 (mRNA) 945 residues [Merlin:1067-2011 - strand] [cdna] name=Unknown
+>8cd6db6d-b818-4b65-b6f2-de79844a5641 (mRNA) 945 residues [Merlin:1067-2011 - strand] [cdna] name=Merlin_3_mRNA-00001
 ATGCTAACTTTAGATGAATTTAAAAACCAAGCGGGTAATATAGACTTTCAGCGTACTAAT
 ATGTTTAGTTGTGTATTTGCAACTACTCCGTCAGCAAAGTCTCAACAATTACTCGATCAA
 TTTGGCGGTATGCTCTTTAATAACCTTCCGTTGAATAATGACTGGCTTGGATTAACACAA
@@ -34,7 +34,7 @@
 GATTGGATTGAAGATAGAGCTGTTAATTCTATAACTGGAATTAATAGTGAAATGTCTCTT
 AATGGAAGTTTAAGTAGATTATCTAGACTTGGAGGAGCTGCTGGAGGGTTGTCTCACGTC
 ATTAATTCGACCCGAAACTCTACTTCGAAAATACTTGGATTGTAA
->58fc8255-95ed-4417-a373-238f826810ac (mRNA) 1056 residues [Merlin:2011-3066 - strand] [cdna] name=Unknown
+>125a44c4-44da-4854-9d3b-ae2aa0221120 (mRNA) 1056 residues [Merlin:2011-3066 - strand] [cdna] name=Merlin_4_mRNA-00001
 ATGAGCATTAAAGTCAGAGAATTAGATGATAAGACTGATGCTTTAATTAGCGGAGTTAAA
 ACCTCCGCTGGTCAAAGTTCACAATCAGCAAAAATAAAATCCACTATAACTGCGCAATAT
 CCGTCTGAACGTTCAGCTGGTAATGACACATCTGGTTCTTTACGAGTTCATGATCTTTAT
@@ -53,7 +53,7 @@
 TGTCAAATTCAGAGTATCCGTTTTGATAAAACTCCAAATGGAAACTTTAACGGTTTAGCT
 ATAGCTCCAAACCTGCCAAGTACATTCACATTAGAAATTACTATGCGTGAAATCTTGACA
 TTGAACCGAGCTTCAGTATATGCGGAAGGATTCTGA
->c009dd7a-3284-4e7f-9ee1-3b56e2598e07 (mRNA) 1662 residues [Merlin:3066-4796 - strand] [cdna] name=multiexongene
+>87414073-7db0-4a60-903f-5e3593e55884 (mRNA) 1662 residues [Merlin:3066-4796 - strand] [cdna] name=Merlin_5_mRNA-00001
 ATGAAAAGCGAAAACATGTCCACAATGAGACGTCGTAAAGTTATCGCTGATTCAAAGGGT
 GAAAGAGATGCAGCCTCGACTGCATCTGATCAAGTAGACTCTTTAGAATTAATCGGCCTT
 AAACTTGATGATGTACAAAGCGCTAATGAACTAGTTGCTGAAGTAATTGAAGAAAAGGGC
@@ -82,7 +82,7 @@
 AAAGCTGAAAATGCTAAAGAGCAATCTAAAAAATCAACCGGTGATATGAATGTTGCTAAC
 ACTCAGGTTAATAACGTAAATAATAGTAAGACTATTCACCAGGTTCAAACAGTCACGGCT
 ACTCCAGCTCCTGGAGTATTCGGGGCAACAGGAGTTAATTAA
->2706ea76-172a-48c1-b940-eb603996f082 (mRNA) 1056 residues [Merlin:5011-6066 - strand] [cdna] name=cds-not-under-exon
+>1dcb3fc3-3307-4476-9c8a-04d252f9371f (mRNA) 1056 residues [Merlin:5011-6066 - strand] [cdna] name=Merlin_42_mRNA-00001
 CTTTAATGACGCTGGTGAATCAATAAAAGAGATGATCGGTGCAATTTATGAATCAAAACC
 TCTTATAGCACCTGCGATGAACACAATCAACACATATGTTCCTCGAGTTCCATGGACGAG
 TAACATAACTGAATACAAGAAATATGTTCGAGATGTTGCATTAGCAGTAGATAATGACCA
b
diff -r 257230cd202f -r b763acecfb57 test-data/export/cds.fa
--- a/test-data/export/cds.fa Fri Apr 24 08:55:57 2020 -0400
+++ b/test-data/export/cds.fa Mon Jun 29 09:11:39 2020 -0400
[
@@ -1,4 +1,4 @@
->ff2fe902-7bab-431c-be82-30ed072915d1 (mRNA) 690 residues [Merlin:2-691 + strand] [cds] name=Unknown
+>df4157db-1481-4120-858c-e6a4c0f78547 (mRNA) 690 residues [Merlin:2-691 + strand] [cds] name=Merlin_1_mRNA-00001
 CGTTTAGACAAAGGTACATTATTGTATCGTGGCCAAAAATTAGACCTTCCTACATTCGAG
 CATAACGCAGAGAATAAGTTGTTCTATTTCAGAAACTACGTTTCAACTTCATTAAAGCCT
 CTGATCTTTGGTGAATTTGGTCGTATGTTTATGGCACTAGATGACGATACTACAATTTAT
@@ -11,12 +11,30 @@
 CTGTTCATGGAAACAGGTGAAGTAGTAAAACTGTCCGGATTCATGCAGTTCGTCAACGAA
 TCTGCATACGATGAAGAGCAAAACCAGATGGCTGCTGAGATTCTGTCTGGATTCTTGGAC
 ATTGATGACATGCCACGTAAGTTCCGCTAG
->f2e1909a-1d40-4a49-a67b-5fe2afdc4957 (mRNA) 9 residues [Merlin:752-1039 + strand] [cds] name=Unknown
-AAATTTTAG
->12fe0db6-c8e1-4bc9-b594-87c92c6c9669 (mRNA) 108 residues [Merlin:1067-2011 - strand] [cds] name=Unknown
-CACCTCAATTATCACTGCCGGTACTCAACAGCTGGTAAGAAAGTCTGGTGTATCGAAATA
-TCTTATTGGAGCAATGAGCAATCGTGTTGTTCAGTCTTTATTAGGTGA
->58fc8255-95ed-4417-a373-238f826810ac (mRNA) 1056 residues [Merlin:2011-3066 - strand] [cds] name=Unknown
+>eedd9b31-f1dd-487c-a3ab-6435b2214685 (mRNA) 288 residues [Merlin:752-1039 + strand] [cds] name=mrna-name-00001
+ATGAAATCAATTTTTCGTATCAACGGTGTAGAAATTGTAGTTGAAGATGTAGTTCCTATG
+TCTTATGAATTCAATGAAGTTGTTTTCAAAGAGCTTAAGAAAATTTTAGGCGATAAGAAG
+CTTCAAAGTACTCCAATTGGACGTTTTGGAATGAAAGAAAACGTTGATACTTATATTGAA
+AGTGTAGTGACAGGGCAGTTAGAAGGTGAATTTTCTGTAGCAGTTCAAACTGTAGAAAAT
+GATGAAGTTATTTTAACTTTACCAGCTTTCGTAATTTTCCGCAAATAA
+>8cd6db6d-b818-4b65-b6f2-de79844a5641 (mRNA) 945 residues [Merlin:1067-2011 - strand] [cds] name=Merlin_3_mRNA-00001
+ATGCTAACTTTAGATGAATTTAAAAACCAAGCGGGTAATATAGACTTTCAGCGTACTAAT
+ATGTTTAGTTGTGTATTTGCAACTACTCCGTCAGCAAAGTCTCAACAATTACTCGATCAA
+TTTGGCGGTATGCTCTTTAATAACCTTCCGTTGAATAATGACTGGCTTGGATTAACACAA
+GGTGAGTTCACATCAGGACTCACCTCAATTATCACTGCCGGTACTCAACAGCTGGTAAGA
+AAGTCTGGTGTATCGAAATATCTTATTGGAGCAATGAGCAATCGTGTTGTTCAGTCTTTA
+TTAGGTGAATTTGAAGTCGGAACTTATTTGTTAGACTTCTTTAACATGGCTTATCCGCAA
+TCTGGATTGATGATTTATTCGGTCAAAATTCCAGAGAACAGATTGTCTCATGAAATGGAT
+TTCAACCATAACTCACCGAATATTAGAATAACTGGACGTGAACTCGATCCGTTAACTATA
+TCATTCAGAATGGATCCCGAAGCAAGTAACTATCGTGCAATGCAAGATTGGGTGAACTCC
+GTTCAAGACCCGGTTACTGGATTGCGAGCATTACCAACTGACGTCGAAGCTGACATTCAG
+GTTAACCTTCATGCTCGAAATGGATTACCTCATACTGTGATAATGTTCACAGGTTGTGTT
+CCTGTTGCGTGTGGAGCTCCTGAGCTTACATATGAAGGAGATAACCAAATTGCGGTTTTC
+GATGTTACATTTGCTTACAGAGTAATGCAAACGGGTGCTGTTGGACGTCAAGCTGCTCTT
+GATTGGATTGAAGATAGAGCTGTTAATTCTATAACTGGAATTAATAGTGAAATGTCTCTT
+AATGGAAGTTTAAGTAGATTATCTAGACTTGGAGGAGCTGCTGGAGGGTTGTCTCACGTC
+ATTAATTCGACCCGAAACTCTACTTCGAAAATACTTGGATTGTAA
+>125a44c4-44da-4854-9d3b-ae2aa0221120 (mRNA) 1056 residues [Merlin:2011-3066 - strand] [cds] name=Merlin_4_mRNA-00001
 ATGAGCATTAAAGTCAGAGAATTAGATGATAAGACTGATGCTTTAATTAGCGGAGTTAAA
 ACCTCCGCTGGTCAAAGTTCACAATCAGCAAAAATAAAATCCACTATAACTGCGCAATAT
 CCGTCTGAACGTTCAGCTGGTAATGACACATCTGGTTCTTTACGAGTTCATGATCTTTAT
@@ -35,7 +53,7 @@
 TGTCAAATTCAGAGTATCCGTTTTGATAAAACTCCAAATGGAAACTTTAACGGTTTAGCT
 ATAGCTCCAAACCTGCCAAGTACATTCACATTAGAAATTACTATGCGTGAAATCTTGACA
 TTGAACCGAGCTTCAGTATATGCGGAAGGATTCTGA
->c009dd7a-3284-4e7f-9ee1-3b56e2598e07 (mRNA) 1662 residues [Merlin:3066-4796 - strand] [cds] name=multiexongene
+>87414073-7db0-4a60-903f-5e3593e55884 (mRNA) 1662 residues [Merlin:3066-4796 - strand] [cds] name=Merlin_5_mRNA-00001
 ATGAAAAGCGAAAACATGTCCACAATGAGACGTCGTAAAGTTATCGCTGATTCAAAGGGT
 GAAAGAGATGCAGCCTCGACTGCATCTGATCAAGTAGACTCTTTAGAATTAATCGGCCTT
 AAACTTGATGATGTACAAAGCGCTAATGAACTAGTTGCTGAAGTAATTGAAGAAAAGGGC
@@ -64,5 +82,17 @@
 AAAGCTGAAAATGCTAAAGAGCAATCTAAAAAATCAACCGGTGATATGAATGTTGCTAAC
 ACTCAGGTTAATAACGTAAATAATAGTAAGACTATTCACCAGGTTCAAACAGTCACGGCT
 ACTCCAGCTCCTGGAGTATTCGGGGCAACAGGAGTTAATTAA
->2706ea76-172a-48c1-b940-eb603996f082 (mRNA) 6 residues [Merlin:5011-6066 - strand] [cds] name=cds-not-under-exon
-CTTTAA
+>1dcb3fc3-3307-4476-9c8a-04d252f9371f (mRNA) 777 residues [Merlin:5011-6066 - strand] [cds] name=Merlin_42_mRNA-00001
+TTTAATGACGCTGGTGAATCAATAAAAGAGATGATCGGTGCAATTTATGAATCAAAACCT
+CTTATAGCACCTGCGATGAACACAATCAACACATATGTTCCTCGAGTTCCATGGACGAGT
+AACATAACTGAATACAAGAAATATGTTCGAGATGTTGCATTAGCAGTAGATAATGACCAA
+TTCGTTTTTGTATGGGAAGATATCTATGGCTTGAACATGATGGATTATGACGCAATGATT
+AACCAAGAATCAATCAAGGTTATTGTCGGTGAACCACGCACAATAGGTCAATTTGTCGGT
+GAGCTGGAATATAATCTCGCTTATGACTTCCAGTGGTTAACGAAGGCTAATGCCCATACA
+CGCGATCCTATTTTTAACGCTACAATCTATTCACACTCATTCTTGGATAATAACCTTCCT
+AGAATAGTAACAGGTGATGGACAGAATAGCATCTTCGTTTCTCGCTCGGGTGCATATTCT
+GAAATGACTTATCGAAATGGATATGAAGAAGCTATCAGGCTTCAGACTATGGCACAATAC
+GACGGTTATGCAACTTGTAAAATGGTTGGAGACTTTGAAATGACTCCTGGAGATAAGATT
+AATTTCTTTGATCCAAAGAAACAATTCAAAGCTGATTTTTACATTGATGAAGTAATTCAT
+GAAGTAAGTAATAACCAAAGCATAACTACACTTTATATGTTTACTAACTCTCGTAAGTTG
+GAAACAGTAGAACCAATAAAGGTTAAAAATGAACTTAAATCTGATACTACCACTTAA
b
diff -r 257230cd202f -r b763acecfb57 test-data/export/pep.fa
--- a/test-data/export/pep.fa Fri Apr 24 08:55:57 2020 -0400
+++ b/test-data/export/pep.fa Mon Jun 29 09:11:39 2020 -0400
[
@@ -1,20 +1,26 @@
->ff2fe902-7bab-431c-be82-30ed072915d1 (mRNA) 229 residues [Merlin:2-691 + strand] [peptide] name=Unknown
+>df4157db-1481-4120-858c-e6a4c0f78547 (mRNA) 229 residues [Merlin:2-691 + strand] [peptide] name=Merlin_1_mRNA-00001
 RLDKGTLLYRGQKLDLPTFEHNAENKLFYFRNYVSTSLKPLIFGEFGRMFMALDDDTTIY
 TAETPDDYNRFANPEDIIDIGATQKDSFDDNNNDGTSINIGKQVNLGFVISGAENVRVIV
 PGSLTEYPEEAEVILPRGTLLKINKITTQVDKRSNKFMVEGSIVPPSEQIDESVEIYDGD
 LFMETGEVVKLSGFMQFVNESAYDEEQNQMAAEILSGFLDIDDMPRKFR
->f2e1909a-1d40-4a49-a67b-5fe2afdc4957 (mRNA) 2 residues [Merlin:752-1039 + strand] [peptide] name=Unknown
-KF
->12fe0db6-c8e1-4bc9-b594-87c92c6c9669 (mRNA) 35 residues [Merlin:1067-2011 - strand] [peptide] name=Unknown
-HLNYHCRYSTAGKKVWCIEISYWSNEQSCCSVFIR
->58fc8255-95ed-4417-a373-238f826810ac (mRNA) 351 residues [Merlin:2011-3066 - strand] [peptide] name=Unknown
+>eedd9b31-f1dd-487c-a3ab-6435b2214685 (mRNA) 95 residues [Merlin:752-1039 + strand] [peptide] name=mrna-name-00001
+MKSIFRINGVEIVVEDVVPMSYEFNEVVFKELKKILGDKKLQSTPIGRFGMKENVDTYIE
+SVVTGQLEGEFSVAVQTVENDEVILTLPAFVIFRK
+>8cd6db6d-b818-4b65-b6f2-de79844a5641 (mRNA) 314 residues [Merlin:1067-2011 - strand] [peptide] name=Merlin_3_mRNA-00001
+MLTLDEFKNQAGNIDFQRTNMFSCVFATTPSAKSQQLLDQFGGMLFNNLPLNNDWLGLTQ
+GEFTSGLTSIITAGTQQLVRKSGVSKYLIGAMSNRVVQSLLGEFEVGTYLLDFFNMAYPQ
+SGLMIYSVKIPENRLSHEMDFNHNSPNIRITGRELDPLTISFRMDPEASNYRAMQDWVNS
+VQDPVTGLRALPTDVEADIQVNLHARNGLPHTVIMFTGCVPVACGAPELTYEGDNQIAVF
+DVTFAYRVMQTGAVGRQAALDWIEDRAVNSITGINSEMSLNGSLSRLSRLGGAAGGLSHV
+INSTRNSTSKILGL
+>125a44c4-44da-4854-9d3b-ae2aa0221120 (mRNA) 351 residues [Merlin:2011-3066 - strand] [peptide] name=Merlin_4_mRNA-00001
 MSIKVRELDDKTDALISGVKTSAGQSSQSAKIKSTITAQYPSERSAGNDTSGSLRVHDLY
 KNGLLFTAYDMNSRTTGDMRSMRLGEMKRTANSVVKSITGTNTNKVDKIPVVNILLPRSK
 SDVESVSHKFNDVGDSLISRGGGTATGVLSNVASTAVFGGLESLTQGLMADHNEQIYNTA
 RSMYGGADNRTKVFTWDLTPRSVQDLIAIIEIYEYFNYYSYGETGTSTYAKEVKSQLDEW
 YKSTFLDTLTPDEANKNDTVFEKITSFLSNVIVVSNPTVWFVRNFGTTSKFDGRAEVFGP
 CQIQSIRFDKTPNGNFNGLAIAPNLPSTFTLEITMREILTLNRASVYAEGF
->c009dd7a-3284-4e7f-9ee1-3b56e2598e07 (mRNA) 553 residues [Merlin:3066-4796 - strand] [peptide] name=multiexongene
+>87414073-7db0-4a60-903f-5e3593e55884 (mRNA) 553 residues [Merlin:3066-4796 - strand] [peptide] name=Merlin_5_mRNA-00001
 MKSENMSTMRRRKVIADSKGERDAASTASDQVDSLELIGLKLDDVQSANELVAEVIEEKG
 NNLIDSVDNVAEGTELAAEASERTTESIKTLTGVASTISDKLSKLASMLESKVQAVEQKV
 QESGASASTGLSVIEDKLPDPDEPFFPPVPQEPENNKKDQKKDDKKPTDMLGDLLKTTKG
@@ -25,5 +31,9 @@
 YIGDVDPENPTNMQSLEKAYNSAKKSISDSAISDQPATKKELDKRFQRVESKYQKLKEDN
 TPKPAAPATSEDNQRVQNIQKAENAKEQSKKSTGDMNVANTQVNNVNNSKTIHQVQTVTA
 TPAPGVFGATGVN
->2706ea76-172a-48c1-b940-eb603996f082 (mRNA) 1 residues [Merlin:5011-6066 - strand] [peptide] name=cds-not-under-exon
-L
+>1dcb3fc3-3307-4476-9c8a-04d252f9371f (mRNA) 258 residues [Merlin:5011-6066 - strand] [peptide] name=Merlin_42_mRNA-00001
+FNDAGESIKEMIGAIYESKPLIAPAMNTINTYVPRVPWTSNITEYKKYVRDVALAVDNDQ
+FVFVWEDIYGLNMMDYDAMINQESIKVIVGEPRTIGQFVGELEYNLAYDFQWLTKANAHT
+RDPIFNATIYSHSFLDNNLPRIVTGDGQNSIFVSRSGAYSEMTYRNGYEEAIRLQTMAQY
+DGYATCKMVGDFEMTPGDKINFFDPKKQFKADFYIDEVIHEVSNNQSITTLYMFTNSRKL
+ETVEPIKVKNELKSDTTT
b
diff -r 257230cd202f -r b763acecfb57 test-data/load_gff3/output.tsv
--- a/test-data/load_gff3/output.tsv Fri Apr 24 08:55:57 2020 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,7 +0,0 @@
-# Feature ID Apollo ID Success Messages
-Merlin_1 a036ab4f-512d-45e3-b19e-1fe83984a185 success
-Merlin_2 4a3f5c6b-03fc-43d1-8d6d-1a7075931cc6 success
-Merlin_3 de819682-eb71-4b98-a532-032d59354b95 success
-Merlin_4 423ca5cc-d570-4ae8-8527-6a52e0a6862b success
-Merlin_5 f1b5327d-79ca-40f0-b4b3-90ea03d79a56 success
-Merlin_42 3629a7fe-03bb-420d-85d3-f23e55430abd success
b
diff -r 257230cd202f -r b763acecfb57 test-data/load_gff3/output.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/load_gff3/output.txt Mon Jun 29 09:11:39 2020 -0400
[
b'@@ -0,0 +1,646 @@\n+{\n+  "Merlin_1_mRNA": {\n+    "owner": "admin@local.host",\n+    "parent_name": "Merlin_1_mRNA",\n+    "uniquename": "d33cb6e8-0809-442f-84ff-015aff163846",\n+    "type": {\n+      "cv": {\n+        "name": "sequence"\n+      },\n+      "name": "mRNA"\n+    },\n+    "parent_type": {\n+      "cv": {\n+        "name": "sequence"\n+      },\n+      "name": "gene"\n+    },\n+    "date_creation": 1593424039041,\n+    "sequence": "Merlin",\n+    "children": [\n+      {\n+        "owner": "None",\n+        "parent_name": "Merlin_1_mRNA-00001",\n+        "uniquename": "d33cb6e8-0809-442f-84ff-015aff163846-CDS",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "CDS"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039071,\n+        "sequence": "Merlin",\n+        "parent_id": "d33cb6e8-0809-442f-84ff-015aff163846",\n+        "name": "d33cb6e8-0809-442f-84ff-015aff163846-CDS",\n+        "location": {\n+          "strand": 1,\n+          "is_fmin_partial": true,\n+          "id": 459,\n+          "fmin": 1,\n+          "fmax": 691\n+        },\n+        "id": 458,\n+        "properties": [],\n+        "date_last_modified": 1593424039095\n+      },\n+      {\n+        "owner": "None",\n+        "parent_name": "Merlin_1_mRNA-00001",\n+        "uniquename": "0356ce47-8746-4557-9f45-2b08625ebc63",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "exon"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039029,\n+        "sequence": "Merlin",\n+        "parent_id": "d33cb6e8-0809-442f-84ff-015aff163846",\n+        "name": "0356ce47-8746-4557-9f45-2b08625ebc63",\n+        "location": {\n+          "strand": 1,\n+          "id": 455,\n+          "fmin": 1,\n+          "fmax": 691\n+        },\n+        "id": 454,\n+        "properties": [],\n+        "date_last_modified": 1593424039078\n+      }\n+    ],\n+    "parent_id": "436dee83-9e76-44c3-94a8-37ac15c57e8e",\n+    "name": "Merlin_1_mRNA-00001",\n+    "location": {\n+      "strand": 1,\n+      "id": 453,\n+      "fmin": 1,\n+      "fmax": 691\n+    },\n+    "id": 452,\n+    "properties": [],\n+    "date_last_modified": 1593424039249\n+  },\n+  "Merlin_2_mRNA": {\n+    "owner": "admin@local.host",\n+    "parent_name": "mrna-name",\n+    "uniquename": "d5d0e6eb-458d-4402-b2ee-c19e4c1e0666",\n+    "type": {\n+      "cv": {\n+        "name": "sequence"\n+      },\n+      "name": "mRNA"\n+    },\n+    "parent_type": {\n+      "cv": {\n+        "name": "sequence"\n+      },\n+      "name": "gene"\n+    },\n+    "date_creation": 1593424039315,\n+    "sequence": "Merlin",\n+    "children": [\n+      {\n+        "owner": "None",\n+        "parent_name": "mrna-name-00001",\n+        "uniquename": "d5d0e6eb-458d-4402-b2ee-c19e4c1e0666-CDS",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "CDS"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039321,\n+        "sequence": "Merlin",\n+        "parent_id": "d5d0e6eb-458d-4402-b2ee-c19e4c1e0666",\n+        "name": "d5d0e6eb-458d-4402-b2ee-c19e4c1e0666-CDS",\n+        "location": {\n+          "strand": 1,\n+          "id": 471,\n+          "fmin": 751,\n+          "fmax": 1039\n+        },\n+        "id": 470,\n+        "properties": [],\n+        "date_last_modified": 1593424039334\n+      },\n+      {\n+        "owner": "None",\n+        "parent_name": "mrna-name-00001",\n+        "uniquename": "46e2b6ce-5cf2-4472-b858-9535a374f535",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "exon"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "n'..b',\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039699,\n+        "sequence": "Merlin",\n+        "parent_id": "19b80336-a138-4276-96e1-116a7787afe8",\n+        "name": "31a23617-42b1-4bf1-a65d-45eccdd17e8e",\n+        "location": {\n+          "strand": -1,\n+          "id": 525,\n+          "fmin": 4365,\n+          "fmax": 4796\n+        },\n+        "id": 524,\n+        "properties": [],\n+        "date_last_modified": 1593424039716\n+      },\n+      {\n+        "owner": "None",\n+        "parent_name": "Merlin_5_mRNA-00001",\n+        "uniquename": "19b80336-a138-4276-96e1-116a7787afe8-CDS",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "CDS"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039710,\n+        "sequence": "Merlin",\n+        "parent_id": "19b80336-a138-4276-96e1-116a7787afe8",\n+        "name": "19b80336-a138-4276-96e1-116a7787afe8-CDS",\n+        "location": {\n+          "strand": -1,\n+          "id": 529,\n+          "fmin": 3065,\n+          "fmax": 4796\n+        },\n+        "id": 528,\n+        "properties": [],\n+        "date_last_modified": 1593424039722\n+      }\n+    ],\n+    "parent_id": "f380f7b1-2b7d-45cd-8d0b-2519b1b0afee",\n+    "name": "Merlin_5_mRNA-00001",\n+    "location": {\n+      "strand": -1,\n+      "id": 520,\n+      "fmin": 3065,\n+      "fmax": 4796\n+    },\n+    "id": 519,\n+    "properties": [],\n+    "date_last_modified": 1593424039810\n+  },\n+  "Merlin_42_mRNA": {\n+    "owner": "admin@local.host",\n+    "parent_name": "Merlin_42_mRNA",\n+    "uniquename": "0e34cfa5-6f64-4111-9c2f-37655f6f1b92",\n+    "type": {\n+      "cv": {\n+        "name": "sequence"\n+      },\n+      "name": "mRNA"\n+    },\n+    "parent_type": {\n+      "cv": {\n+        "name": "sequence"\n+      },\n+      "name": "gene"\n+    },\n+    "date_creation": 1593424039850,\n+    "sequence": "Merlin",\n+    "children": [\n+      {\n+        "owner": "None",\n+        "parent_name": "Merlin_42_mRNA-00001",\n+        "uniquename": "6596e6e2-a894-4c0b-98c1-298c65f0c021",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "exon"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039841,\n+        "sequence": "Merlin",\n+        "parent_id": "0e34cfa5-6f64-4111-9c2f-37655f6f1b92",\n+        "name": "6596e6e2-a894-4c0b-98c1-298c65f0c021",\n+        "location": {\n+          "strand": -1,\n+          "id": 543,\n+          "fmin": 5010,\n+          "fmax": 6066\n+        },\n+        "id": 542,\n+        "properties": [],\n+        "date_last_modified": 1593424039847\n+      },\n+      {\n+        "owner": "None",\n+        "parent_name": "Merlin_42_mRNA-00001",\n+        "uniquename": "a42c4166-5211-49b9-9110-e5fd41c9d2cb",\n+        "type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "CDS"\n+        },\n+        "parent_type": {\n+          "cv": {\n+            "name": "sequence"\n+          },\n+          "name": "mRNA"\n+        },\n+        "date_creation": 1593424039849,\n+        "sequence": "Merlin",\n+        "parent_id": "0e34cfa5-6f64-4111-9c2f-37655f6f1b92",\n+        "name": "a42c4166-5211-49b9-9110-e5fd41c9d2cb",\n+        "location": {\n+          "strand": -1,\n+          "id": 546,\n+          "fmin": 5288,\n+          "fmax": 6065,\n+          "is_fmax_partial": true\n+        },\n+        "id": 545,\n+        "properties": [],\n+        "date_last_modified": 1593424039867\n+      }\n+    ],\n+    "parent_id": "f7843db6-26da-44f9-ae05-6bb92ca573f6",\n+    "name": "Merlin_42_mRNA-00001",\n+    "location": {\n+      "strand": -1,\n+      "id": 541,\n+      "fmin": 5010,\n+      "fmax": 6066\n+    },\n+    "id": 540,\n+    "properties": [],\n+    "date_last_modified": 1593424039879\n+  }\n+}\n'