Mercurial > repos > johnheap > vapper
changeset 19:fe79425b1fa4 draft
Uploaded
author | johnheap |
---|---|
date | Mon, 03 Jun 2019 16:01:16 -0400 |
parents | e7da2274c9f6 |
children | 26ec953069b3 |
files | Tryp_V_T.py |
diffstat | 1 files changed, 425 insertions(+), 2611 deletions(-) [+] |
line wrap: on
line diff
--- a/Tryp_V_T.py Mon Jun 03 16:00:24 2019 -0400 +++ b/Tryp_V_T.py Mon Jun 03 16:01:16 2019 -0400 @@ -1,2611 +1,425 @@ - - - - - - -<!DOCTYPE html> -<html lang="en"> - <head> - <meta charset="utf-8"> - <link rel="dns-prefetch" href="https://github.githubassets.com"> - <link rel="dns-prefetch" href="https://avatars0.githubusercontent.com"> - <link rel="dns-prefetch" href="https://avatars1.githubusercontent.com"> - <link rel="dns-prefetch" href="https://avatars2.githubusercontent.com"> - <link rel="dns-prefetch" href="https://avatars3.githubusercontent.com"> - <link rel="dns-prefetch" href="https://github-cloud.s3.amazonaws.com"> - <link rel="dns-prefetch" href="https://user-images.githubusercontent.com/"> - - - - <link crossorigin="anonymous" media="all" integrity="sha512-3+HOqCwtQal5hOJQ+mdxiq5zmGOTjF6RhjDsPLxbKDYgGlLFeCwzoIanb7j5IiCuXKUqyC2q8FdkC4nmx2P2rA==" rel="stylesheet" href="https://github.githubassets.com/assets/frameworks-a2fba223d5af91496cac70d4ec3624df.css" /> - <link crossorigin="anonymous" media="all" integrity="sha512-MRlTIqIyb8caK5+o8llXVntXovciHyAM4qE3kWU2S7SIjAPDxYp4mE0jQp4kP5UYegy+lG9y1I6VlsdzEjb5Qw==" rel="stylesheet" href="https://github.githubassets.com/assets/site-294181adec18ed639e160b96b45d17ac.css" /> - <link crossorigin="anonymous" media="all" integrity="sha512-XjvAy/mMWN5aOA+pyb/FgAgcVgJkPkwTCwvFK07Ez/H44lvl55ZLGwtpyL4MaMrwDE8QYO+1VYljKFjqr4/iJA==" rel="stylesheet" href="https://github.githubassets.com/assets/github-5b066aa36cc405c9cbcbadf1bde399ed.css" /> - - - - - - <meta name="viewport" content="width=device-width"> - - <title>VAPPER-Galaxy/Tryp_V_T.py at master · johnheap/VAPPER-Galaxy · GitHub</title> - <meta name="description" content="Contribute to johnheap/VAPPER-Galaxy development by creating an account on GitHub."> - <link rel="search" type="application/opensearchdescription+xml" href="/opensearch.xml" title="GitHub"> - <link rel="fluid-icon" href="https://github.com/fluidicon.png" title="GitHub"> - <meta property="fb:app_id" 
content="1401488693436528"> - - <meta name="twitter:image:src" content="https://avatars0.githubusercontent.com/u/24318980?s=400&v=4" /><meta name="twitter:site" content="@github" /><meta name="twitter:card" content="summary" /><meta name="twitter:title" content="johnheap/VAPPER-Galaxy" /><meta name="twitter:description" content="Contribute to johnheap/VAPPER-Galaxy development by creating an account on GitHub." /> - <meta property="og:image" content="https://avatars0.githubusercontent.com/u/24318980?s=400&v=4" /><meta property="og:site_name" content="GitHub" /><meta property="og:type" content="object" /><meta property="og:title" content="johnheap/VAPPER-Galaxy" /><meta property="og:url" content="https://github.com/johnheap/VAPPER-Galaxy" /><meta property="og:description" content="Contribute to johnheap/VAPPER-Galaxy development by creating an account on GitHub." /> - - <link rel="assets" href="https://github.githubassets.com/"> - - <meta name="pjax-timeout" content="1000"> - - <meta name="request-id" content="A691:31FC:5350A:9C70E:5CF5626C" data-pjax-transient> - - - - - <meta name="selected-link" value="repo_source" data-pjax-transient> - - <meta name="google-site-verification" content="KT5gs8h0wvaagLKAVWq8bbeNwnZZK1r1XQysX3xurLU"> - <meta name="google-site-verification" content="ZzhVyEFwb7w3e0-uOTltm8Jsck2F5StVihD0exw2fsA"> - <meta name="google-site-verification" content="GXs5KoUUkNCoaAZn7wPN-t01Pywp9M3sEjnt_3_ZWPc"> - - <meta name="octolytics-host" content="collector.githubapp.com" /><meta name="octolytics-app-id" content="github" /><meta name="octolytics-event-url" content="https://collector.githubapp.com/github-external/browser_event" /><meta name="octolytics-dimension-request_id" content="A691:31FC:5350A:9C70E:5CF5626C" /><meta name="octolytics-dimension-region_edge" content="iad" /><meta name="octolytics-dimension-region_render" content="iad" /> -<meta name="analytics-location" content="/<user-name>/<repo-name>/blob/show" data-pjax-transient="true" /> - - - 
- <meta name="google-analytics" content="UA-3769691-2"> - - -<meta class="js-ga-set" name="dimension1" content="Logged Out"> - - - - - - <meta name="hostname" content="github.com"> - <meta name="user-login" content=""> - - <meta name="expected-hostname" content="github.com"> - <meta name="js-proxy-site-detection-payload" content="NzYzOGJlZTMwMzU0NWQ4MmU4MGE3MDYxZDI2MDFiZjQxMjBkYTg5NWI1NWRjYzdmZWNjMmE4MWRhZGIxMTMyN3x7InJlbW90ZV9hZGRyZXNzIjoiMTI4LjExOC4yNTAuNSIsInJlcXVlc3RfaWQiOiJBNjkxOjMxRkM6NTM1MEE6OUM3MEU6NUNGNTYyNkMiLCJ0aW1lc3RhbXAiOjE1NTk1ODUzODksImhvc3QiOiJnaXRodWIuY29tIn0="> - - <meta name="enabled-features" content="UNIVERSE_BANNER,MARKETPLACE_INVOICED_BILLING,MARKETPLACE_SOCIAL_PROOF_CUSTOMERS,MARKETPLACE_TRENDING_SOCIAL_PROOF,MARKETPLACE_RECOMMENDATIONS"> - - <meta name="html-safe-nonce" content="a37d7307800ea044bd751b0f42a3fd6deab2c7ff"> - - <meta http-equiv="x-pjax-version" content="af1499c2254d0582d0a98af1dfd7f11b"> - - - <link href="https://github.com/johnheap/VAPPER-Galaxy/commits/master.atom" rel="alternate" title="Recent Commits to VAPPER-Galaxy:master" type="application/atom+xml"> - - <meta name="go-import" content="github.com/johnheap/VAPPER-Galaxy git https://github.com/johnheap/VAPPER-Galaxy.git"> - - <meta name="octolytics-dimension-user_id" content="24318980" /><meta name="octolytics-dimension-user_login" content="johnheap" /><meta name="octolytics-dimension-repository_id" content="139730674" /><meta name="octolytics-dimension-repository_nwo" content="johnheap/VAPPER-Galaxy" /><meta name="octolytics-dimension-repository_public" content="true" /><meta name="octolytics-dimension-repository_is_fork" content="false" /><meta name="octolytics-dimension-repository_network_root_id" content="139730674" /><meta name="octolytics-dimension-repository_network_root_nwo" content="johnheap/VAPPER-Galaxy" /><meta name="octolytics-dimension-repository_explore_github_marketplace_ci_cta_shown" content="false" /> - - - <link rel="canonical" 
href="https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py" data-pjax-transient> - - - <meta name="browser-stats-url" content="https://api.github.com/_private/browser/stats"> - - <meta name="browser-errors-url" content="https://api.github.com/_private/browser/errors"> - - <link rel="mask-icon" href="https://github.githubassets.com/pinned-octocat.svg" color="#000000"> - <link rel="icon" type="image/x-icon" class="js-site-favicon" href="https://github.githubassets.com/favicon.ico"> - -<meta name="theme-color" content="#1e2327"> - - - - - - <link rel="manifest" href="/manifest.json" crossOrigin="use-credentials"> - - </head> - - <body class="logged-out env-production page-responsive page-blob"> - - - <div class="position-relative js-header-wrapper "> - <a href="#start-of-content" tabindex="1" class="px-2 py-4 bg-blue text-white show-on-focus js-skip-to-content">Skip to content</a> - <div id="js-pjax-loader-bar" class="pjax-loader-bar"><div class="progress"></div></div> - - - - - - - <header class="Header-old header-logged-out js-details-container Details position-relative f4 py-2" role="banner"> - <div class="container-lg d-lg-flex flex-items-center p-responsive"> - <div class="d-flex flex-justify-between flex-items-center"> - <a class="mr-4" href="https://github.com/" aria-label="Homepage" data-ga-click="(Logged out) Header, go to homepage, icon:logo-wordmark"> - <svg height="32" class="octicon octicon-mark-github text-white" viewBox="0 0 16 16" version="1.1" width="32" aria-hidden="true"><path fill-rule="evenodd" d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 
3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.013 8.013 0 0 0 16 8c0-4.42-3.58-8-8-8z"/></svg> - </a> - - <div class="d-lg-none css-truncate css-truncate-target width-fit p-2"> - - <svg class="octicon octicon-repo" viewBox="0 0 12 16" version="1.1" width="12" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M4 9H3V8h1v1zm0-3H3v1h1V6zm0-2H3v1h1V4zm0-2H3v1h1V2zm8-1v12c0 .55-.45 1-1 1H6v2l-1.5-1.5L3 16v-2H1c-.55 0-1-.45-1-1V1c0-.55.45-1 1-1h10c.55 0 1 .45 1 1zm-1 10H1v2h2v-1h3v1h5v-2zm0-10H2v9h9V1z"/></svg> - <a class="Header-link" href="/johnheap">johnheap</a> - / - <a class="Header-link" href="/johnheap/VAPPER-Galaxy">VAPPER-Galaxy</a> - - - </div> - - <div class="d-flex flex-items-center"> - <a class="d-inline-block d-lg-none f5 text-white no-underline border border-gray-dark rounded-2 px-2 py-1 mr-3 mr-sm-5" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"site header","repository_id":null,"auth_type":"SIGN_UP","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" data-hydro-click-hmac="dafab2b648ecc3a2244a0de6c85d4884478b192e1ed71d278d79bf55e6dcddd9" data-ga-click="(Logged out) Header, clicked Sign up, text:sign-up" href="/join?source=header-repo"> - Sign up -</a> - <button class="btn-link d-lg-none mt-1 js-details-target" type="button" aria-label="Toggle navigation" aria-expanded="false"> - <svg height="24" class="octicon octicon-three-bars text-white" viewBox="0 0 12 16" version="1.1" width="18" aria-hidden="true"><path fill-rule="evenodd" d="M11.41 9H.59C0 9 0 8.59 0 8c0-.59 0-1 .59-1H11.4c.59 0 .59.41.59 1 0 .59 0 1-.59 1h.01zm0-4H.59C0 5 0 4.59 0 4c0-.59 0-1 .59-1H11.4c.59 0 .59.41.59 1 0 .59 0 1-.59 1h.01zM.59 11H11.4c.59 0 .59.41.59 1 0 .59 0 1-.59 1H.59C0 13 0 12.59 0 12c0-.59 0-1 .59-1z"/></svg> - </button> - </div> - </div> - 
- <div class="HeaderMenu HeaderMenu--logged-out position-fixed top-0 right-0 bottom-0 height-fit position-lg-relative d-lg-flex flex-justify-between flex-items-center flex-auto"> - <div class="d-flex d-lg-none flex-justify-end border-bottom bg-gray-light p-3"> - <button class="btn-link js-details-target" type="button" aria-label="Toggle navigation" aria-expanded="false"> - <svg height="24" class="octicon octicon-x text-gray" viewBox="0 0 12 16" version="1.1" width="18" aria-hidden="true"><path fill-rule="evenodd" d="M7.48 8l3.75 3.75-1.48 1.48L6 9.48l-3.75 3.75-1.48-1.48L4.52 8 .77 4.25l1.48-1.48L6 6.52l3.75-3.75 1.48 1.48L7.48 8z"/></svg> - </button> - </div> - - <nav class="mt-0 px-3 px-lg-0 mb-5 mb-lg-0" aria-label="Global"> - <ul class="d-lg-flex list-style-none"> - <li class="d-block d-lg-flex flex-lg-nowrap flex-lg-items-center border-bottom border-lg-bottom-0 mr-0 mr-lg-3 edge-item-fix position-relative flex-wrap flex-justify-between d-flex flex-items-center "> - <details class="HeaderMenu-details details-overlay details-reset width-full"> - <summary class="HeaderMenu-summary HeaderMenu-link px-0 py-3 border-0 no-wrap d-block d-lg-inline-block"> - Why GitHub? 
- <svg x="0px" y="0px" viewBox="0 0 14 8" xml:space="preserve" fill="none" class="icon-chevon-down-mktg position-absolute position-lg-relative"> - <path d="M1,1l6.2,6L13,1"></path> - </svg> - </summary> - <div class="dropdown-menu flex-auto rounded-1 bg-white px-0 mt-0 pb-4 p-lg-4 position-relative position-lg-absolute left-0 left-lg-n4"> - <a href="/features" class="py-2 lh-condensed-ultra d-block link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Features">Features <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a> - <ul class="list-style-none f5 pb-3"> - <li class="edge-item-fix"><a href="/features/code-review/" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Code review">Code review</a></li> - <li class="edge-item-fix"><a href="/features/project-management/" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Project management">Project management</a></li> - <li class="edge-item-fix"><a href="/features/integrations" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Integrations">Integrations</a></li> - <li class="edge-item-fix"><a href="/features/actions" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Actions">Actions</a> - <li class="edge-item-fix"><a href="/features/package-registry" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Package Registry">Package registry</a> - <li class="edge-item-fix"><a href="/features#team-management" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Team management">Team management</a></li> - <li class="edge-item-fix"><a href="/features#social-coding" class="py-2 lh-condensed-ultra d-block link-gray 
no-underline f5" data-ga-click="(Logged out) Header, go to Social coding">Social coding</a></li> - <li class="edge-item-fix"><a href="/features#documentation" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Documentation">Documentation</a></li> - <li class="edge-item-fix"><a href="/features#code-hosting" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Code hosting">Code hosting</a></li> - </ul> - - <ul class="list-style-none mb-0 border-lg-top pt-lg-3"> - <li class="edge-item-fix"><a href="/customer-stories" class="py-2 lh-condensed-ultra d-block no-underline link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Customer stories">Customer stories <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a></li> - <li class="edge-item-fix"><a href="/security" class="py-2 lh-condensed-ultra d-block no-underline link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Security">Security <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a></li> - </ul> - </div> - </details> - </li> - <li class="border-bottom border-lg-bottom-0 mr-0 mr-lg-3"> - <a href="/enterprise" class="HeaderMenu-link no-underline py-3 d-block d-lg-inline-block" data-ga-click="(Logged out) Header, go to Enterprise">Enterprise</a> - </li> - - <li class="d-block d-lg-flex flex-lg-nowrap flex-lg-items-center border-bottom border-lg-bottom-0 mr-0 mr-lg-3 edge-item-fix position-relative flex-wrap flex-justify-between d-flex flex-items-center "> - <details class="HeaderMenu-details details-overlay details-reset width-full"> - <summary class="HeaderMenu-summary HeaderMenu-link px-0 py-3 border-0 no-wrap d-block d-lg-inline-block"> - Explore - <svg x="0px" y="0px" viewBox="0 0 14 8" xml:space="preserve" fill="none" class="icon-chevon-down-mktg position-absolute 
position-lg-relative"> - <path d="M1,1l6.2,6L13,1"></path> - </svg> - </summary> - - <div class="dropdown-menu flex-auto rounded-1 bg-white px-0 pt-2 pb-0 mt-0 pb-4 p-lg-4 position-relative position-lg-absolute left-0 left-lg-n4"> - <ul class="list-style-none mb-3"> - <li class="edge-item-fix"><a href="/explore" class="py-2 lh-condensed-ultra d-block link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Explore">Explore GitHub <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a></li> - </ul> - - <h4 class="text-gray-light text-normal text-mono f5 mb-2 border-lg-top pt-lg-3">Learn & contribute</h4> - <ul class="list-style-none mb-3"> - <li class="edge-item-fix"><a href="/topics" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Topics">Topics</a></li> - <li class="edge-item-fix"><a href="/collections" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Collections">Collections</a></li> - <li class="edge-item-fix"><a href="/trending" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Trending">Trending</a></li> - <li class="edge-item-fix"><a href="https://lab.github.com/" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Learning lab">Learning Lab</a></li> - <li class="edge-item-fix"><a href="https://opensource.guide" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Open source guides">Open source guides</a></li> - </ul> - - <h4 class="text-gray-light text-normal text-mono f5 mb-2 border-lg-top pt-lg-3">Connect with others</h4> - <ul class="list-style-none mb-0"> - <li class="edge-item-fix"><a href="https://github.com/events" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) 
Header, go to Events">Events</a></li> - <li class="edge-item-fix"><a href="https://github.community" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Community forum">Community forum</a></li> - <li class="edge-item-fix"><a href="https://education.github.com" class="py-2 pb-0 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to GitHub Education">GitHub Education</a></li> - </ul> - </div> - </details> - </li> - - <li class="border-bottom border-lg-bottom-0 mr-0 mr-lg-3"> - <a href="/marketplace" class="HeaderMenu-link no-underline py-3 d-block d-lg-inline-block" data-ga-click="(Logged out) Header, go to Marketplace">Marketplace</a> - </li> - - <li class="d-block d-lg-flex flex-lg-nowrap flex-lg-items-center border-bottom border-lg-bottom-0 mr-0 mr-lg-3 edge-item-fix position-relative flex-wrap flex-justify-between d-flex flex-items-center "> - <details class="HeaderMenu-details details-overlay details-reset width-full"> - <summary class="HeaderMenu-summary HeaderMenu-link px-0 py-3 border-0 no-wrap d-block d-lg-inline-block"> - Pricing - <svg x="0px" y="0px" viewBox="0 0 14 8" xml:space="preserve" fill="none" class="icon-chevon-down-mktg position-absolute position-lg-relative"> - <path d="M1,1l6.2,6L13,1"></path> - </svg> - </summary> - - <div class="dropdown-menu flex-auto rounded-1 bg-white px-0 pt-2 pb-4 mt-0 p-lg-4 position-relative position-lg-absolute left-0 left-lg-n4"> - <a href="/pricing" class="pb-2 lh-condensed-ultra d-block link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Pricing">Plans <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a> - - <ul class="list-style-none mb-3"> - <li class="edge-item-fix"><a href="/pricing#feature-comparison" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Compare plans">Compare plans</a></li> 
- <li class="edge-item-fix"><a href="https://enterprise.github.com/contact" class="py-2 lh-condensed-ultra d-block link-gray no-underline f5" data-ga-click="(Logged out) Header, go to Contact Sales">Contact Sales</a></li> - </ul> - - <ul class="list-style-none mb-0 border-lg-top pt-lg-3"> - <li class="edge-item-fix"><a href="/nonprofit" class="py-2 lh-condensed-ultra d-block no-underline link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Nonprofits">Nonprofit <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a></li> - <li class="edge-item-fix"><a href="https://education.github.com" class="py-2 pb-0 lh-condensed-ultra d-block no-underline link-gray-dark no-underline h5 Bump-link--hover" data-ga-click="(Logged out) Header, go to Education">Education <span class="Bump-link-symbol float-right text-normal text-gray-light">→</span></a></li> - </ul> - </div> - </details> - </li> - </ul> - </nav> - - <div class="d-lg-flex flex-items-center px-3 px-lg-0 text-center text-lg-left"> - <div class="d-lg-flex mb-3 mb-lg-0"> - <div class="header-search flex-self-stretch flex-lg-self-auto mr-0 mr-lg-3 mb-3 mb-lg-0 scoped-search site-scoped-search js-site-search position-relative js-jump-to" - role="combobox" - aria-owns="jump-to-results" - aria-label="Search or jump to" - aria-haspopup="listbox" - aria-expanded="false" -> - <div class="position-relative"> - <!-- '"` --><!-- </textarea></xmp> --></option></form><form class="js-site-search-form" role="search" aria-label="Site" data-scope-type="Repository" data-scope-id="139730674" data-scoped-search-url="/johnheap/VAPPER-Galaxy/search" data-unscoped-search-url="/search" action="/johnheap/VAPPER-Galaxy/search" accept-charset="UTF-8" method="get"><input name="utf8" type="hidden" value="✓" /> - <label class="form-control input-sm header-search-wrapper p-0 header-search-wrapper-jump-to position-relative d-flex flex-justify-between flex-items-center 
js-chromeless-input-container"> - <input type="text" - class="form-control input-sm header-search-input jump-to-field js-jump-to-field js-site-search-focus js-site-search-field is-clearable" - data-hotkey="s,/" - name="q" - value="" - placeholder="Search" - data-unscoped-placeholder="Search GitHub" - data-scoped-placeholder="Search" - autocapitalize="off" - aria-autocomplete="list" - aria-controls="jump-to-results" - aria-label="Search" - data-jump-to-suggestions-path="/_graphql/GetSuggestedNavigationDestinations#csrf-token=OeWfhCkNlueqmf+vlMZUOIoZL/xaxMnWSzEKmM+a3P/55zFIrfSMdNtX4Lcjm/pZKDqzddz2DGdPMz+4X5/nxg==" - spellcheck="false" - autocomplete="off" - > - <input type="hidden" class="js-site-search-type-field" name="type" > - <img src="https://github.githubassets.com/images/search-key-slash.svg" alt="" class="mr-2 header-search-key-slash"> - - <div class="Box position-absolute overflow-hidden d-none jump-to-suggestions js-jump-to-suggestions-container"> - -<ul class="d-none js-jump-to-suggestions-template-container"> - - -<li class="d-flex flex-justify-start flex-items-center p-0 f5 navigation-item js-navigation-item js-jump-to-suggestion" role="option"> - <a tabindex="-1" class="no-underline d-flex flex-auto flex-items-center jump-to-suggestions-path js-jump-to-suggestion-path js-navigation-open p-2" href=""> - <div class="jump-to-octicon js-jump-to-octicon flex-shrink-0 mr-2 text-center d-none"> - <svg height="16" width="16" class="octicon octicon-repo flex-shrink-0 js-jump-to-octicon-repo d-none" title="Repository" aria-label="Repository" viewBox="0 0 12 16" version="1.1" role="img"><path fill-rule="evenodd" d="M4 9H3V8h1v1zm0-3H3v1h1V6zm0-2H3v1h1V4zm0-2H3v1h1V2zm8-1v12c0 .55-.45 1-1 1H6v2l-1.5-1.5L3 16v-2H1c-.55 0-1-.45-1-1V1c0-.55.45-1 1-1h10c.55 0 1 .45 1 1zm-1 10H1v2h2v-1h3v1h5v-2zm0-10H2v9h9V1z"/></svg> - <svg height="16" width="16" class="octicon octicon-project flex-shrink-0 js-jump-to-octicon-project d-none" title="Project" aria-label="Project" 
viewBox="0 0 15 16" version="1.1" role="img"><path fill-rule="evenodd" d="M10 12h3V2h-3v10zm-4-2h3V2H6v8zm-4 4h3V2H2v12zm-1 1h13V1H1v14zM14 0H1a1 1 0 0 0-1 1v14a1 1 0 0 0 1 1h13a1 1 0 0 0 1-1V1a1 1 0 0 0-1-1z"/></svg> - <svg height="16" width="16" class="octicon octicon-search flex-shrink-0 js-jump-to-octicon-search d-none" title="Search" aria-label="Search" viewBox="0 0 16 16" version="1.1" role="img"><path fill-rule="evenodd" d="M15.7 13.3l-3.81-3.83A5.93 5.93 0 0 0 13 6c0-3.31-2.69-6-6-6S1 2.69 1 6s2.69 6 6 6c1.3 0 2.48-.41 3.47-1.11l3.83 3.81c.19.2.45.3.7.3.25 0 .52-.09.7-.3a.996.996 0 0 0 0-1.41v.01zM7 10.7c-2.59 0-4.7-2.11-4.7-4.7 0-2.59 2.11-4.7 4.7-4.7 2.59 0 4.7 2.11 4.7 4.7 0 2.59-2.11 4.7-4.7 4.7z"/></svg> - </div> - - <img class="avatar mr-2 flex-shrink-0 js-jump-to-suggestion-avatar d-none" alt="" aria-label="Team" src="" width="28" height="28"> - - <div class="jump-to-suggestion-name js-jump-to-suggestion-name flex-auto overflow-hidden text-left no-wrap css-truncate css-truncate-target"> - </div> - - <div class="border rounded-1 flex-shrink-0 bg-gray px-1 text-gray-light ml-1 f6 d-none js-jump-to-badge-search"> - <span class="js-jump-to-badge-search-text-default d-none" aria-label="in this repository"> - In this repository - </span> - <span class="js-jump-to-badge-search-text-global d-none" aria-label="in all of GitHub"> - All GitHub - </span> - <span aria-hidden="true" class="d-inline-block ml-1 v-align-middle">↵</span> - </div> - - <div aria-hidden="true" class="border rounded-1 flex-shrink-0 bg-gray px-1 text-gray-light ml-1 f6 d-none d-on-nav-focus js-jump-to-badge-jump"> - Jump to - <span class="d-inline-block ml-1 v-align-middle">↵</span> - </div> - </a> -</li> - -</ul> - -<ul class="d-none js-jump-to-no-results-template-container"> - <li class="d-flex flex-justify-center flex-items-center f5 d-none js-jump-to-suggestion p-2"> - <span class="text-gray">No suggested jump to results</span> - </li> -</ul> - -<ul id="jump-to-results" role="listbox" 
class="p-0 m-0 js-navigation-container jump-to-suggestions-results-container js-jump-to-suggestions-results-container"> - - -<li class="d-flex flex-justify-start flex-items-center p-0 f5 navigation-item js-navigation-item js-jump-to-scoped-search d-none" role="option"> - <a tabindex="-1" class="no-underline d-flex flex-auto flex-items-center jump-to-suggestions-path js-jump-to-suggestion-path js-navigation-open p-2" href=""> - <div class="jump-to-octicon js-jump-to-octicon flex-shrink-0 mr-2 text-center d-none"> - <svg height="16" width="16" class="octicon octicon-repo flex-shrink-0 js-jump-to-octicon-repo d-none" title="Repository" aria-label="Repository" viewBox="0 0 12 16" version="1.1" role="img"><path fill-rule="evenodd" d="M4 9H3V8h1v1zm0-3H3v1h1V6zm0-2H3v1h1V4zm0-2H3v1h1V2zm8-1v12c0 .55-.45 1-1 1H6v2l-1.5-1.5L3 16v-2H1c-.55 0-1-.45-1-1V1c0-.55.45-1 1-1h10c.55 0 1 .45 1 1zm-1 10H1v2h2v-1h3v1h5v-2zm0-10H2v9h9V1z"/></svg> - <svg height="16" width="16" class="octicon octicon-project flex-shrink-0 js-jump-to-octicon-project d-none" title="Project" aria-label="Project" viewBox="0 0 15 16" version="1.1" role="img"><path fill-rule="evenodd" d="M10 12h3V2h-3v10zm-4-2h3V2H6v8zm-4 4h3V2H2v12zm-1 1h13V1H1v14zM14 0H1a1 1 0 0 0-1 1v14a1 1 0 0 0 1 1h13a1 1 0 0 0 1-1V1a1 1 0 0 0-1-1z"/></svg> - <svg height="16" width="16" class="octicon octicon-search flex-shrink-0 js-jump-to-octicon-search d-none" title="Search" aria-label="Search" viewBox="0 0 16 16" version="1.1" role="img"><path fill-rule="evenodd" d="M15.7 13.3l-3.81-3.83A5.93 5.93 0 0 0 13 6c0-3.31-2.69-6-6-6S1 2.69 1 6s2.69 6 6 6c1.3 0 2.48-.41 3.47-1.11l3.83 3.81c.19.2.45.3.7.3.25 0 .52-.09.7-.3a.996.996 0 0 0 0-1.41v.01zM7 10.7c-2.59 0-4.7-2.11-4.7-4.7 0-2.59 2.11-4.7 4.7-4.7 2.59 0 4.7 2.11 4.7 4.7 0 2.59-2.11 4.7-4.7 4.7z"/></svg> - </div> - - <img class="avatar mr-2 flex-shrink-0 js-jump-to-suggestion-avatar d-none" alt="" aria-label="Team" src="" width="28" height="28"> - - <div class="jump-to-suggestion-name 
js-jump-to-suggestion-name flex-auto overflow-hidden text-left no-wrap css-truncate css-truncate-target"> - </div> - - <div class="border rounded-1 flex-shrink-0 bg-gray px-1 text-gray-light ml-1 f6 d-none js-jump-to-badge-search"> - <span class="js-jump-to-badge-search-text-default d-none" aria-label="in this repository"> - In this repository - </span> - <span class="js-jump-to-badge-search-text-global d-none" aria-label="in all of GitHub"> - All GitHub - </span> - <span aria-hidden="true" class="d-inline-block ml-1 v-align-middle">↵</span> - </div> - - <div aria-hidden="true" class="border rounded-1 flex-shrink-0 bg-gray px-1 text-gray-light ml-1 f6 d-none d-on-nav-focus js-jump-to-badge-jump"> - Jump to - <span class="d-inline-block ml-1 v-align-middle">↵</span> - </div> - </a> -</li> - - - -<li class="d-flex flex-justify-start flex-items-center p-0 f5 navigation-item js-navigation-item js-jump-to-global-search d-none" role="option"> - <a tabindex="-1" class="no-underline d-flex flex-auto flex-items-center jump-to-suggestions-path js-jump-to-suggestion-path js-navigation-open p-2" href=""> - <div class="jump-to-octicon js-jump-to-octicon flex-shrink-0 mr-2 text-center d-none"> - <svg height="16" width="16" class="octicon octicon-repo flex-shrink-0 js-jump-to-octicon-repo d-none" title="Repository" aria-label="Repository" viewBox="0 0 12 16" version="1.1" role="img"><path fill-rule="evenodd" d="M4 9H3V8h1v1zm0-3H3v1h1V6zm0-2H3v1h1V4zm0-2H3v1h1V2zm8-1v12c0 .55-.45 1-1 1H6v2l-1.5-1.5L3 16v-2H1c-.55 0-1-.45-1-1V1c0-.55.45-1 1-1h10c.55 0 1 .45 1 1zm-1 10H1v2h2v-1h3v1h5v-2zm0-10H2v9h9V1z"/></svg> - <svg height="16" width="16" class="octicon octicon-project flex-shrink-0 js-jump-to-octicon-project d-none" title="Project" aria-label="Project" viewBox="0 0 15 16" version="1.1" role="img"><path fill-rule="evenodd" d="M10 12h3V2h-3v10zm-4-2h3V2H6v8zm-4 4h3V2H2v12zm-1 1h13V1H1v14zM14 0H1a1 1 0 0 0-1 1v14a1 1 0 0 0 1 1h13a1 1 0 0 0 1-1V1a1 1 0 0 0-1-1z"/></svg> - <svg 
height="16" width="16" class="octicon octicon-search flex-shrink-0 js-jump-to-octicon-search d-none" title="Search" aria-label="Search" viewBox="0 0 16 16" version="1.1" role="img"><path fill-rule="evenodd" d="M15.7 13.3l-3.81-3.83A5.93 5.93 0 0 0 13 6c0-3.31-2.69-6-6-6S1 2.69 1 6s2.69 6 6 6c1.3 0 2.48-.41 3.47-1.11l3.83 3.81c.19.2.45.3.7.3.25 0 .52-.09.7-.3a.996.996 0 0 0 0-1.41v.01zM7 10.7c-2.59 0-4.7-2.11-4.7-4.7 0-2.59 2.11-4.7 4.7-4.7 2.59 0 4.7 2.11 4.7 4.7 0 2.59-2.11 4.7-4.7 4.7z"/></svg> - </div> - - <img class="avatar mr-2 flex-shrink-0 js-jump-to-suggestion-avatar d-none" alt="" aria-label="Team" src="" width="28" height="28"> - - <div class="jump-to-suggestion-name js-jump-to-suggestion-name flex-auto overflow-hidden text-left no-wrap css-truncate css-truncate-target"> - </div> - - <div class="border rounded-1 flex-shrink-0 bg-gray px-1 text-gray-light ml-1 f6 d-none js-jump-to-badge-search"> - <span class="js-jump-to-badge-search-text-default d-none" aria-label="in this repository"> - In this repository - </span> - <span class="js-jump-to-badge-search-text-global d-none" aria-label="in all of GitHub"> - All GitHub - </span> - <span aria-hidden="true" class="d-inline-block ml-1 v-align-middle">↵</span> - </div> - - <div aria-hidden="true" class="border rounded-1 flex-shrink-0 bg-gray px-1 text-gray-light ml-1 f6 d-none d-on-nav-focus js-jump-to-badge-jump"> - Jump to - <span class="d-inline-block ml-1 v-align-middle">↵</span> - </div> - </a> -</li> - - -</ul> - - </div> - </label> -</form> </div> -</div> - - </div> - - <a class="HeaderMenu-link no-underline mr-3" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"site header menu","repository_id":null,"auth_type":"LOG_IN","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" 
data-hydro-click-hmac="337eab5a1a33edba9a56afe56b6817bbe2bfb8bfab94836352641826ce53b626" data-ga-click="(Logged out) Header, clicked Sign in, text:sign-in" href="/login?return_to=%2Fjohnheap%2FVAPPER-Galaxy%2Fblob%2Fmaster%2FTryp_V_T.py"> - Sign in -</a> <a class="HeaderMenu-link d-inline-block no-underline border border-gray-dark rounded-1 px-2 py-1" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"site header menu","repository_id":null,"auth_type":"SIGN_UP","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" data-hydro-click-hmac="ae884c1f61e6facf2cb96fcd7d55fbcf227cb7989e192de2cb6c5ab5c46e53d1" data-ga-click="(Logged out) Header, clicked Sign up, text:sign-up" href="/join?source=header-repo"> - Sign up -</a> </div> - </div> - </div> -</header> - - </div> - - <div id="start-of-content" class="show-on-focus"></div> - - - <div id="js-flash-container"> - -</div> - - - - <div class="application-main " data-commit-hovercards-enabled> - <div itemscope itemtype="http://schema.org/SoftwareSourceCode" class=""> - <main > - - - - - - - - - - - <div class="pagehead repohead instapaper_ignore readability-menu experiment-repo-nav pt-0 pt-lg-4 "> - <div class="repohead-details-container clearfix container-lg p-responsive d-none d-lg-block"> - - <ul class="pagehead-actions"> - - - - - <li> - - <a class="tooltipped tooltipped-s btn btn-sm btn-with-count" aria-label="You must be signed in to watch a repository" rel="nofollow" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"notification subscription menu watch","repository_id":null,"auth_type":"LOG_IN","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" 
data-hydro-click-hmac="af7329bf60da95c08a620876666a89de6aa2bf96a8da8486f5eb50741ad8743e" href="/login?return_to=%2Fjohnheap%2FVAPPER-Galaxy"> - <svg class="octicon octicon-eye v-align-text-bottom" viewBox="0 0 16 16" version="1.1" width="16" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M8.06 2C3 2 0 8 0 8s3 6 8.06 6C13 14 16 8 16 8s-3-6-7.94-6zM8 12c-2.2 0-4-1.78-4-4 0-2.2 1.8-4 4-4 2.22 0 4 1.8 4 4 0 2.22-1.78 4-4 4zm2-4c0 1.11-.89 2-2 2-1.11 0-2-.89-2-2 0-1.11.89-2 2-2 1.11 0 2 .89 2 2z"/></svg> - Watch -</a> <a class="social-count" href="/johnheap/VAPPER-Galaxy/watchers" - aria-label="0 users are watching this repository"> - 0 - </a> - - </li> - - <li> - <a class="btn btn-sm btn-with-count tooltipped tooltipped-s" aria-label="You must be signed in to star a repository" rel="nofollow" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"star button","repository_id":139730674,"auth_type":"LOG_IN","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" data-hydro-click-hmac="0db565041ee36ff7a0a3ca6a8ab0c55e0708db9b7f32415674420a32f9615882" href="/login?return_to=%2Fjohnheap%2FVAPPER-Galaxy"> - <svg class="octicon octicon-star v-align-text-bottom" viewBox="0 0 14 16" version="1.1" width="14" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M14 6l-4.9-.64L7 1 4.9 5.36 0 6l3.6 3.26L2.67 14 7 11.67 11.33 14l-.93-4.74L14 6z"/></svg> - Star -</a> - <a class="social-count js-social-count" href="/johnheap/VAPPER-Galaxy/stargazers" - aria-label="0 users starred this repository"> - 0 - </a> - - </li> - - <li> - <a class="btn btn-sm btn-with-count tooltipped tooltipped-s" aria-label="You must be signed in to fork a repository" rel="nofollow" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"repo details fork 
button","repository_id":139730674,"auth_type":"LOG_IN","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" data-hydro-click-hmac="f1fd12af9e16afa9f9169bba4e92280efdd13b9f988453b683991c292a94ee58" href="/login?return_to=%2Fjohnheap%2FVAPPER-Galaxy"> - <svg class="octicon octicon-repo-forked v-align-text-bottom" viewBox="0 0 10 16" version="1.1" width="10" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M8 1a1.993 1.993 0 0 0-1 3.72V6L5 8 3 6V4.72A1.993 1.993 0 0 0 2 1a1.993 1.993 0 0 0-1 3.72V6.5l3 3v1.78A1.993 1.993 0 0 0 5 15a1.993 1.993 0 0 0 1-3.72V9.5l3-3V4.72A1.993 1.993 0 0 0 8 1zM2 4.2C1.34 4.2.8 3.65.8 3c0-.65.55-1.2 1.2-1.2.65 0 1.2.55 1.2 1.2 0 .65-.55 1.2-1.2 1.2zm3 10c-.66 0-1.2-.55-1.2-1.2 0-.65.55-1.2 1.2-1.2.65 0 1.2.55 1.2 1.2 0 .65-.55 1.2-1.2 1.2zm3-10c-.66 0-1.2-.55-1.2-1.2 0-.65.55-1.2 1.2-1.2.65 0 1.2.55 1.2 1.2 0 .65-.55 1.2-1.2 1.2z"/></svg> - Fork -</a> - <a href="/johnheap/VAPPER-Galaxy/network/members" class="social-count" - aria-label="0 users forked this repository"> - 0 - </a> - </li> -</ul> - - <h1 class="public "> - <svg class="octicon octicon-repo" viewBox="0 0 12 16" version="1.1" width="12" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M4 9H3V8h1v1zm0-3H3v1h1V6zm0-2H3v1h1V4zm0-2H3v1h1V2zm8-1v12c0 .55-.45 1-1 1H6v2l-1.5-1.5L3 16v-2H1c-.55 0-1-.45-1-1V1c0-.55.45-1 1-1h10c.55 0 1 .45 1 1zm-1 10H1v2h2v-1h3v1h5v-2zm0-10H2v9h9V1z"/></svg> - <span class="author" itemprop="author"><a class="url fn" rel="author" data-hovercard-type="user" data-hovercard-url="/hovercards?user_id=24318980" data-octo-click="hovercard-link-click" data-octo-dimensions="link_type:self" href="/johnheap">johnheap</a></span><!-- ---><span class="path-divider">/</span><!-- ---><strong itemprop="name"><a data-pjax="#js-repo-pjax-container" href="/johnheap/VAPPER-Galaxy">VAPPER-Galaxy</a></strong> - - 
-</h1> - - </div> - -<nav class="hx_reponav reponav js-repo-nav js-sidenav-container-pjax container-lg p-responsive d-none d-lg-block" - itemscope - itemtype="http://schema.org/BreadcrumbList" - aria-label="Repository" - data-pjax="#js-repo-pjax-container"> - - <span itemscope itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a class="js-selected-navigation-item selected reponav-item" itemprop="url" data-hotkey="g c" aria-current="page" data-selected-links="repo_source repo_downloads repo_commits repo_releases repo_tags repo_branches repo_packages /johnheap/VAPPER-Galaxy" href="/johnheap/VAPPER-Galaxy"> - <svg class="octicon octicon-code" viewBox="0 0 14 16" version="1.1" width="14" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M9.5 3L8 4.5 11.5 8 8 11.5 9.5 13 14 8 9.5 3zm-5 0L0 8l4.5 5L6 11.5 2.5 8 6 4.5 4.5 3z"/></svg> - <span itemprop="name">Code</span> - <meta itemprop="position" content="1"> -</a> </span> - - <span itemscope itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a itemprop="url" data-hotkey="g i" class="js-selected-navigation-item reponav-item" data-selected-links="repo_issues repo_labels repo_milestones /johnheap/VAPPER-Galaxy/issues" href="/johnheap/VAPPER-Galaxy/issues"> - <svg class="octicon octicon-issue-opened" viewBox="0 0 14 16" version="1.1" width="14" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M7 2.3c3.14 0 5.7 2.56 5.7 5.7s-2.56 5.7-5.7 5.7A5.71 5.71 0 0 1 1.3 8c0-3.14 2.56-5.7 5.7-5.7zM7 1C3.14 1 0 4.14 0 8s3.14 7 7 7 7-3.14 7-7-3.14-7-7-7zm1 3H6v5h2V4zm0 6H6v2h2v-2z"/></svg> - <span itemprop="name">Issues</span> - <span class="Counter">0</span> - <meta itemprop="position" content="2"> -</a> </span> - - <span itemscope itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a data-hotkey="g p" itemprop="url" class="js-selected-navigation-item reponav-item" data-selected-links="repo_pulls checks /johnheap/VAPPER-Galaxy/pulls" 
href="/johnheap/VAPPER-Galaxy/pulls"> - <svg class="octicon octicon-git-pull-request" viewBox="0 0 12 16" version="1.1" width="12" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M11 11.28V5c-.03-.78-.34-1.47-.94-2.06C9.46 2.35 8.78 2.03 8 2H7V0L4 3l3 3V4h1c.27.02.48.11.69.31.21.2.3.42.31.69v6.28A1.993 1.993 0 0 0 10 15a1.993 1.993 0 0 0 1-3.72zm-1 2.92c-.66 0-1.2-.55-1.2-1.2 0-.65.55-1.2 1.2-1.2.65 0 1.2.55 1.2 1.2 0 .65-.55 1.2-1.2 1.2zM4 3c0-1.11-.89-2-2-2a1.993 1.993 0 0 0-1 3.72v6.56A1.993 1.993 0 0 0 2 15a1.993 1.993 0 0 0 1-3.72V4.72c.59-.34 1-.98 1-1.72zm-.8 10c0 .66-.55 1.2-1.2 1.2-.65 0-1.2-.55-1.2-1.2 0-.65.55-1.2 1.2-1.2.65 0 1.2.55 1.2 1.2zM2 4.2C1.34 4.2.8 3.65.8 3c0-.65.55-1.2 1.2-1.2.65 0 1.2.55 1.2 1.2 0 .65-.55 1.2-1.2 1.2z"/></svg> - <span itemprop="name">Pull requests</span> - <span class="Counter">0</span> - <meta itemprop="position" content="3"> -</a> </span> - - - <a data-hotkey="g b" class="js-selected-navigation-item reponav-item" data-selected-links="repo_projects new_repo_project repo_project /johnheap/VAPPER-Galaxy/projects" href="/johnheap/VAPPER-Galaxy/projects"> - <svg class="octicon octicon-project" viewBox="0 0 15 16" version="1.1" width="15" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M10 12h3V2h-3v10zm-4-2h3V2H6v8zm-4 4h3V2H2v12zm-1 1h13V1H1v14zM14 0H1a1 1 0 0 0-1 1v14a1 1 0 0 0 1 1h13a1 1 0 0 0 1-1V1a1 1 0 0 0-1-1z"/></svg> - Projects - <span class="Counter" >0</span> -</a> - - - <a data-skip-pjax="true" class="js-selected-navigation-item reponav-item" data-selected-links="security alerts policy /johnheap/VAPPER-Galaxy/security/advisories" href="/johnheap/VAPPER-Galaxy/security/advisories"> - <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="octicon" height="16px" width="16px"> - <path fill-rule="evenodd" clip-rule="evenodd" d="M1 2l7-2 7 2v6.02C15 12.69 9.69 16 8 16c-1.69 0-7-3.31-7-7.98V2zm1 .75L8 1l6 1.75v5.268C14 12.104 9.45 15 8 15c-1.45 0-6-2.896-6-6.982V2.75z"></path> - <path 
d="M3 3.5L8 2v12c-1.207 0-5-2.482-5-5.985V3.5z"></path> -</svg> - - Security -</a> - <a class="js-selected-navigation-item reponav-item" data-selected-links="repo_graphs repo_contributors dependency_graph pulse people /johnheap/VAPPER-Galaxy/pulse" href="/johnheap/VAPPER-Galaxy/pulse"> - <svg class="octicon octicon-graph" viewBox="0 0 16 16" version="1.1" width="16" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M16 14v1H0V0h1v14h15zM5 13H3V8h2v5zm4 0H7V3h2v10zm4 0h-2V6h2v7z"/></svg> - Insights -</a> - -</nav> - - <div class="reponav-wrapper reponav-small d-lg-none"> - <nav class="reponav js-reponav text-center no-wrap" - itemscope - itemtype="http://schema.org/BreadcrumbList"> - - <span itemscope itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a class="js-selected-navigation-item selected reponav-item" itemprop="url" aria-current="page" data-selected-links="repo_source repo_downloads repo_commits repo_releases repo_tags repo_branches repo_packages /johnheap/VAPPER-Galaxy" href="/johnheap/VAPPER-Galaxy"> - <span itemprop="name">Code</span> - <meta itemprop="position" content="1"> -</a> </span> - - <span itemscope itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a itemprop="url" class="js-selected-navigation-item reponav-item" data-selected-links="repo_issues repo_labels repo_milestones /johnheap/VAPPER-Galaxy/issues" href="/johnheap/VAPPER-Galaxy/issues"> - <span itemprop="name">Issues</span> - <span class="Counter">0</span> - <meta itemprop="position" content="2"> -</a> </span> - - <span itemscope itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a itemprop="url" class="js-selected-navigation-item reponav-item" data-selected-links="repo_pulls checks /johnheap/VAPPER-Galaxy/pulls" href="/johnheap/VAPPER-Galaxy/pulls"> - <span itemprop="name">Pull requests</span> - <span class="Counter">0</span> - <meta itemprop="position" content="3"> -</a> </span> - - <span itemscope 
itemtype="http://schema.org/ListItem" itemprop="itemListElement"> - <a itemprop="url" class="js-selected-navigation-item reponav-item" data-selected-links="repo_projects new_repo_project repo_project /johnheap/VAPPER-Galaxy/projects" href="/johnheap/VAPPER-Galaxy/projects"> - <span itemprop="name">Projects</span> - <span class="Counter">0</span> - <meta itemprop="position" content="4"> -</a> </span> - - - <a itemprop="url" class="js-selected-navigation-item reponav-item" data-selected-links="security alerts policy /johnheap/VAPPER-Galaxy/security/advisories" href="/johnheap/VAPPER-Galaxy/security/advisories"> - <span itemprop="name">Security</span> - <meta itemprop="position" content="6"> -</a> - <a class="js-selected-navigation-item reponav-item" data-selected-links="pulse /johnheap/VAPPER-Galaxy/pulse" href="/johnheap/VAPPER-Galaxy/pulse"> - Pulse -</a> - - </nav> -</div> - - - </div> -<div class="container-lg new-discussion-timeline experiment-repo-nav p-responsive"> - <div class="repository-content "> - - - - - - - - <a class="d-none js-permalink-shortcut" data-hotkey="y" href="/johnheap/VAPPER-Galaxy/blob/a4e16d71fe985f389930c02f94354b87d3aabadb/Tryp_V_T.py">Permalink</a> - - <!-- blob contrib key: blob_contributors:v21:9b80d5431ee2c66dc8d0bd669b319131 --> - <div class="signup-prompt-bg rounded-1"> - <div class="signup-prompt p-4 text-center mb-4 rounded-1"> - <div class="position-relative"> - <!-- '"` --><!-- </textarea></xmp> --></option></form><form action="/prompt_dismissals/signup" accept-charset="UTF-8" method="post"><input name="utf8" type="hidden" value="✓" /><input type="hidden" name="_method" value="put" /><input type="hidden" name="authenticity_token" value="u8vaE+nJK1t8+Agdc/ZN/ZDEQ1zDW1rahinuGQ03qeICRZPwq5nUk+WWU12I6oJkTK1SE+lme9JaR2kcuAfQbQ==" /> - <button type="submit" class="position-absolute top-0 right-0 btn-link link-gray" data-ga-click="(Logged out) Sign up prompt, clicked Dismiss, text:dismiss"> - Dismiss - </button> -</form> <h3 
class="pt-2">Join GitHub today</h3> - <p class="col-6 mx-auto">GitHub is home to over 36 million developers working together to host and review code, manage projects, and build software together.</p> - <a class="btn btn-primary" data-hydro-click="{"event_type":"authentication.click","payload":{"location_in_page":"files signup prompt","repository_id":null,"auth_type":"SIGN_UP","client_id":null,"originating_request_id":"A691:31FC:5350A:9C70E:5CF5626C","originating_url":"https://github.com/johnheap/VAPPER-Galaxy/blob/master/Tryp_V_T.py","referrer":null,"user_id":null}}" data-hydro-click-hmac="4bf7c9cc5dabe6e4cbd6bb6269757b356cdffe6bf9214fa28ed8854e1073068e" data-ga-click="(Logged out) Sign up prompt, clicked Sign up, text:sign-up" href="/join?source=prompt-blob-show">Sign up</a> - </div> - </div> - </div> - - - <div class="d-flex flex-items-start flex-shrink-0 mb-2 flex-column flex-md-row"> - <span class="d-flex flex-justify-between width-full width-md-auto"> - -<details class="details-reset details-overlay select-menu branch-select-menu hx_rsm" id="branch-select-menu"> - <summary class="btn btn-sm select-menu-button css-truncate" - data-hotkey="w" - - title="Switch branches or tags"> - <i>Branch:</i> - <span class="css-truncate-target">master</span> - </summary> - - <details-menu class="select-menu-modal hx_rsm-modal position-absolute" style="z-index: 99;" src="/johnheap/VAPPER-Galaxy/ref-list/master/Tryp_V_T.py?source_action=show&source_controller=blob" preload> - <include-fragment class="select-menu-loading-overlay anim-pulse"> - <svg height="32" class="octicon octicon-octoface" viewBox="0 0 16 16" version="1.1" width="32" aria-hidden="true"><path fill-rule="evenodd" d="M14.7 5.34c.13-.32.55-1.59-.13-3.31 0 0-1.05-.33-3.44 1.3-1-.28-2.07-.32-3.13-.32s-2.13.04-3.13.32c-2.39-1.64-3.44-1.3-3.44-1.3-.68 1.72-.26 2.99-.13 3.31C.49 6.21 0 7.33 0 8.69 0 13.84 3.33 15 7.98 15S16 13.84 16 8.69c0-1.36-.49-2.48-1.3-3.35zM8 14.02c-3.3 0-5.98-.15-5.98-3.35 0-.76.38-1.48 
1.02-2.07 1.07-.98 2.9-.46 4.96-.46 2.07 0 3.88-.52 4.96.46.65.59 1.02 1.3 1.02 2.07 0 3.19-2.68 3.35-5.98 3.35zM5.49 9.01c-.66 0-1.2.8-1.2 1.78s.54 1.79 1.2 1.79c.66 0 1.2-.8 1.2-1.79s-.54-1.78-1.2-1.78zm5.02 0c-.66 0-1.2.79-1.2 1.78s.54 1.79 1.2 1.79c.66 0 1.2-.8 1.2-1.79s-.53-1.78-1.2-1.78z"/></svg> - </include-fragment> - </details-menu> -</details> - - <div class="BtnGroup flex-shrink-0 d-md-none"> - <a href="/johnheap/VAPPER-Galaxy/find/master" - class="js-pjax-capture-input btn btn-sm BtnGroup-item" - data-pjax - data-hotkey="t"> - Find file - </a> - <clipboard-copy value="Tryp_V_T.py" class="btn btn-sm BtnGroup-item"> - Copy path - </clipboard-copy> - </div> - </span> - <h2 id="blob-path" class="breadcrumb flex-auto min-width-0 text-normal flex-md-self-center ml-md-2 mr-md-3 my-2 my-md-0"> - <span class="js-repo-root text-bold"><span class="js-path-segment"><a data-pjax="true" href="/johnheap/VAPPER-Galaxy"><span>VAPPER-Galaxy</span></a></span></span><span class="separator">/</span><strong class="final-path">Tryp_V_T.py</strong> - </h2> - - <div class="BtnGroup flex-shrink-0 d-none d-md-inline-block"> - <a href="/johnheap/VAPPER-Galaxy/find/master" - class="js-pjax-capture-input btn btn-sm BtnGroup-item" - data-pjax - data-hotkey="t"> - Find file - </a> - <clipboard-copy value="Tryp_V_T.py" class="btn btn-sm BtnGroup-item"> - Copy path - </clipboard-copy> - </div> - </div> - - - - <include-fragment src="/johnheap/VAPPER-Galaxy/contributors/master/Tryp_V_T.py" class="Box Box--condensed commit-loader"> - <div class="Box-body bg-blue-light f6"> - Fetching contributors… - </div> - - <div class="Box-body d-flex flex-items-center" > - <img alt="" class="loader-loading mr-2" src="https://github.githubassets.com/images/spinners/octocat-spinner-32-EAF2F5.gif" width="16" height="16" /> - <span class="text-red h6 loader-error">Cannot retrieve contributors at this time</span> - </div> -</include-fragment> - - - - - - <div class="Box mt-3 position-relative"> - -<div 
class="Box-header py-2 d-flex flex-column flex-shrink-0 flex-md-row flex-md-items-center"> - - <div class="text-mono f6 flex-auto pr-3 flex-order-2 flex-md-order-1 mt-2 mt-md-0"> - 426 lines (349 sloc) - <span class="file-info-divider"></span> - 17.3 KB - </div> - - <div class="d-flex py-1 py-md-0 flex-auto flex-order-1 flex-md-order-2 flex-sm-grow-0 flex-justify-between"> - - <div class="BtnGroup"> - <a id="raw-url" class="btn btn-sm BtnGroup-item" href="/johnheap/VAPPER-Galaxy/raw/master/Tryp_V_T.py">Raw</a> - <a class="btn btn-sm js-update-url-with-hash BtnGroup-item" data-hotkey="b" href="/johnheap/VAPPER-Galaxy/blame/master/Tryp_V_T.py">Blame</a> - <a rel="nofollow" class="btn btn-sm BtnGroup-item" href="/johnheap/VAPPER-Galaxy/commits/master/Tryp_V_T.py">History</a> - </div> - - - <div> - - <button type="button" class="btn-octicon disabled tooltipped tooltipped-nw" - aria-label="You must be signed in to make or propose changes"> - <svg class="octicon octicon-pencil" viewBox="0 0 14 16" version="1.1" width="14" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M0 12v3h3l8-8-3-3-8 8zm3 2H1v-2h1v1h1v1zm10.3-9.3L12 6 9 3l1.3-1.3a.996.996 0 0 1 1.41 0l1.59 1.59c.39.39.39 1.02 0 1.41z"/></svg> - </button> - <button type="button" class="btn-octicon btn-octicon-danger disabled tooltipped tooltipped-nw" - aria-label="You must be signed in to make or propose changes"> - <svg class="octicon octicon-trashcan" viewBox="0 0 12 16" version="1.1" width="12" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M11 2H9c0-.55-.45-1-1-1H5c-.55 0-1 .45-1 1H2c-.55 0-1 .45-1 1v1c0 .55.45 1 1 1v9c0 .55.45 1 1 1h7c.55 0 1-.45 1-1V5c.55 0 1-.45 1-1V3c0-.55-.45-1-1-1zm-1 12H3V5h1v8h1V5h1v8h1V5h1v8h1V5h1v9zm1-10H2V3h9v1z"/></svg> - </button> - </div> - </div> -</div> - - - - <div itemprop="text" class="Box-body p-0 blob-wrapper data type-python "> - -<table class="highlight tab-size js-file-line-container" data-tab-size="8"> - <tr> - <td id="L1" class="blob-num 
js-line-number" data-line-number="1"></td> - <td id="LC1" class="blob-code blob-code-inner js-file-line"><span class="pl-s"><span class="pl-pds">"""</span></span></td> - </tr> - <tr> - <td id="L2" class="blob-num js-line-number" data-line-number="2"></td> - <td id="LC2" class="blob-code blob-code-inner js-file-line"><span class="pl-s">* Galaxy Version</span></td> - </tr> - <tr> - <td id="L3" class="blob-num js-line-number" data-line-number="3"></td> - <td id="LC3" class="blob-code blob-code-inner js-file-line"><span class="pl-s"></span></td> - </tr> - <tr> - <td id="L4" class="blob-num js-line-number" data-line-number="4"></td> - <td id="LC4" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * Copyright 2019 University of Liverpool</span></td> - </tr> - <tr> - <td id="L5" class="blob-num js-line-number" data-line-number="5"></td> - <td id="LC5" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * Author John Heap, Computational Biology Facility, UoL</span></td> - </tr> - <tr> - <td id="L6" class="blob-num js-line-number" data-line-number="6"></td> - <td id="LC6" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * Based on original scripts of Sara Silva Silva Pereira, Institute of Infection and Global Health, UoL</span></td> - </tr> - <tr> - <td id="L7" class="blob-num js-line-number" data-line-number="7"></td> - <td id="LC7" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> *</span></td> - </tr> - <tr> - <td id="L8" class="blob-num js-line-number" data-line-number="8"></td> - <td id="LC8" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * Licensed under the Apache License, Version 2.0 (the "License");</span></td> - </tr> - <tr> - <td id="L9" class="blob-num js-line-number" data-line-number="9"></td> - <td id="LC9" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * you may not use this file except in compliance with the License.</span></td> - </tr> - <tr> - <td 
id="L10" class="blob-num js-line-number" data-line-number="10"></td> - <td id="LC10" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * You may obtain a copy of the License at</span></td> - </tr> - <tr> - <td id="L11" class="blob-num js-line-number" data-line-number="11"></td> - <td id="LC11" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> *</span></td> - </tr> - <tr> - <td id="L12" class="blob-num js-line-number" data-line-number="12"></td> - <td id="LC12" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * http://www.apache.org/licenses/LICENSE-2.0</span></td> - </tr> - <tr> - <td id="L13" class="blob-num js-line-number" data-line-number="13"></td> - <td id="LC13" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> *</span></td> - </tr> - <tr> - <td id="L14" class="blob-num js-line-number" data-line-number="14"></td> - <td id="LC14" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * Unless required by applicable law or agreed to in writing, software</span></td> - </tr> - <tr> - <td id="L15" class="blob-num js-line-number" data-line-number="15"></td> - <td id="LC15" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * distributed under the License is distributed on an "AS IS" BASIS,</span></td> - </tr> - <tr> - <td id="L16" class="blob-num js-line-number" data-line-number="16"></td> - <td id="LC16" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span></td> - </tr> - <tr> - <td id="L17" class="blob-num js-line-number" data-line-number="17"></td> - <td id="LC17" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> * See the License for the specific language governing permissions and</span></td> - </tr> - <tr> - <td id="L18" class="blob-num js-line-number" data-line-number="18"></td> - <td id="LC18" class="blob-code blob-code-inner js-file-line"><span 
class="pl-s"> * limitations under the License.</span></td> - </tr> - <tr> - <td id="L19" class="blob-num js-line-number" data-line-number="19"></td> - <td id="LC19" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> *</span></td> - </tr> - <tr> - <td id="L20" class="blob-num js-line-number" data-line-number="20"></td> - <td id="LC20" class="blob-code blob-code-inner js-file-line"><span class="pl-s"> <span class="pl-pds">"""</span></span></td> - </tr> - <tr> - <td id="L21" class="blob-num js-line-number" data-line-number="21"></td> - <td id="LC21" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L22" class="blob-num js-line-number" data-line-number="22"></td> - <td id="LC22" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L23" class="blob-num js-line-number" data-line-number="23"></td> - <td id="LC23" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> subprocess</td> - </tr> - <tr> - <td id="L24" class="blob-num js-line-number" data-line-number="24"></td> - <td id="LC24" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> pandas <span class="pl-k">as</span> pd</td> - </tr> - <tr> - <td id="L25" class="blob-num js-line-number" data-line-number="25"></td> - <td id="LC25" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> re</td> - </tr> - <tr> - <td id="L26" class="blob-num js-line-number" data-line-number="26"></td> - <td id="LC26" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> os</td> - </tr> - <tr> - <td id="L27" class="blob-num js-line-number" data-line-number="27"></td> - <td id="LC27" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> sys</td> - </tr> - <tr> - <td id="L28" class="blob-num js-line-number" data-line-number="28"></td> - <td id="LC28" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> shutil</td> - 
</tr> - <tr> - <td id="L29" class="blob-num js-line-number" data-line-number="29"></td> - <td id="LC29" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> import matplotlib as mpl</span></td> - </tr> - <tr> - <td id="L30" class="blob-num js-line-number" data-line-number="30"></td> - <td id="LC30" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> mpl.use('Agg')</span></td> - </tr> - <tr> - <td id="L31" class="blob-num js-line-number" data-line-number="31"></td> - <td id="LC31" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> matplotlib.pyplot <span class="pl-k">as</span> plt</td> - </tr> - <tr> - <td id="L32" class="blob-num js-line-number" data-line-number="32"></td> - <td id="LC32" class="blob-code blob-code-inner js-file-line"><span class="pl-k">import</span> numpy <span class="pl-k">as</span> np</td> - </tr> - <tr> - <td id="L33" class="blob-num js-line-number" data-line-number="33"></td> - <td id="LC33" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L34" class="blob-num js-line-number" data-line-number="34"></td> - <td id="LC34" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L35" class="blob-num js-line-number" data-line-number="35"></td> - <td id="LC35" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L36" class="blob-num js-line-number" data-line-number="36"></td> - <td id="LC36" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L37" class="blob-num js-line-number" data-line-number="37"></td> - <td id="LC37" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> copies the user provided Fasta file to data/reference/file/file.fasta</span></td> - </tr> - <tr> - <td id="L38" class="blob-num js-line-number" data-line-number="38"></td> - <td id="LC38" class="blob-code blob-code-inner 
js-file-line"><span class="pl-k">def</span> <span class="pl-en">uploadUserReferenceFastq</span>(<span class="pl-smi">refFastq</span>):</td> - </tr> - <tr> - <td id="L39" class="blob-num js-line-number" data-line-number="39"></td> - <td id="LC39" class="blob-code blob-code-inner js-file-line"> refBase <span class="pl-k">=</span> os.path.basename(refFastq)</td> - </tr> - <tr> - <td id="L40" class="blob-num js-line-number" data-line-number="40"></td> - <td id="LC40" class="blob-code blob-code-inner js-file-line"> ref <span class="pl-k">=</span> os.path.splitext(refBase)[<span class="pl-c1">0</span>] <span class="pl-c"><span class="pl-c">#</span> 'mydata/test.fasta' -> 'test'</span></td> - </tr> - <tr> - <td id="L41" class="blob-num js-line-number" data-line-number="41"></td> - <td id="LC41" class="blob-code blob-code-inner js-file-line"> dir_path <span class="pl-k">=</span> os.path.dirname(os.path.realpath(<span class="pl-c1">__file__</span>)) <span class="pl-c"><span class="pl-c">#</span> directory of this file</span></td> - </tr> - <tr> - <td id="L42" class="blob-num js-line-number" data-line-number="42"></td> - <td id="LC42" class="blob-code blob-code-inner js-file-line"> refDir <span class="pl-k">=</span> dir_path <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span>/data/Reference/<span class="pl-pds">"</span></span> <span class="pl-k">+</span> ref <span class="pl-c"><span class="pl-c">#</span>propose putting file in '/data/reference/ref/</span></td> - </tr> - <tr> - <td id="L43" class="blob-num js-line-number" data-line-number="43"></td> - <td id="LC43" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">if</span> <span class="pl-k">not</span> os.path.isdir(refDir): <span class="pl-c"><span class="pl-c">#</span> if directory data/Reference/ref doesn't exist</span></td> - </tr> - <tr> - <td id="L44" class="blob-num js-line-number" data-line-number="44"></td> - <td id="LC44" class="blob-code blob-code-inner js-file-line"> 
os.mkdir(refDir)</td> - </tr> - <tr> - <td id="L45" class="blob-num js-line-number" data-line-number="45"></td> - <td id="LC45" class="blob-code blob-code-inner js-file-line"> refPath <span class="pl-k">=</span> refDir<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>/<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L46" class="blob-num js-line-number" data-line-number="46"></td> - <td id="LC46" class="blob-code blob-code-inner js-file-line"> shutil.copy(refFastq, refPath <span class="pl-k">+</span> refBase) <span class="pl-c"><span class="pl-c">#</span>copy reference file into the directory</span></td> - </tr> - <tr> - <td id="L47" class="blob-num js-line-number" data-line-number="47"></td> - <td id="LC47" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>bowtie2-build <span class="pl-pds">"</span></span> <span class="pl-k">+</span> refPath <span class="pl-k">+</span> refBase<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span> <span class="pl-pds">"</span></span><span class="pl-k">+</span>refPath<span class="pl-k">+</span>ref</td> - </tr> - <tr> - <td id="L48" class="blob-num js-line-number" data-line-number="48"></td> - <td id="LC48" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(<span class="pl-s"><span class="pl-pds">"</span>Building the bowtie2 reference files.<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L49" class="blob-num js-line-number" data-line-number="49"></td> - <td id="LC49" class="blob-code blob-code-inner js-file-line"> subprocess.call(argString, <span class="pl-v">shell</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L50" class="blob-num js-line-number" data-line-number="50"></td> - <td id="LC50" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span></td> - </tr> - <tr> - 
<td id="L51" class="blob-num js-line-number" data-line-number="51"></td> - <td id="LC51" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L52" class="blob-num js-line-number" data-line-number="52"></td> - <td id="LC52" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">transcriptMapping</span>(<span class="pl-smi">inputname</span>, <span class="pl-smi">refFastq</span>, <span class="pl-smi">forwardFN</span>, <span class="pl-smi">reverseFN</span>):</td> - </tr> - <tr> - <td id="L53" class="blob-num js-line-number" data-line-number="53"></td> - <td id="LC53" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> where is our Reference data?</span></td> - </tr> - <tr> - <td id="L54" class="blob-num js-line-number" data-line-number="54"></td> - <td id="LC54" class="blob-code blob-code-inner js-file-line"> refBase <span class="pl-k">=</span> os.path.basename(refFastq)</td> - </tr> - <tr> - <td id="L55" class="blob-num js-line-number" data-line-number="55"></td> - <td id="LC55" class="blob-code blob-code-inner js-file-line"> ref <span class="pl-k">=</span> os.path.splitext(refBase)[<span class="pl-c1">0</span>]</td> - </tr> - <tr> - <td id="L56" class="blob-num js-line-number" data-line-number="56"></td> - <td id="LC56" class="blob-code blob-code-inner js-file-line"> dir_path <span class="pl-k">=</span> os.path.dirname(os.path.realpath(<span class="pl-c1">__file__</span>))</td> - </tr> - <tr> - <td id="L57" class="blob-num js-line-number" data-line-number="57"></td> - <td id="LC57" class="blob-code blob-code-inner js-file-line"> refDir <span class="pl-k">=</span> dir_path <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span>/data/Reference/<span class="pl-pds">"</span></span> <span class="pl-k">+</span> ref <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span>/<span class="pl-pds">"</span></span></td> - </tr> - 
<tr> - <td id="L58" class="blob-num js-line-number" data-line-number="58"></td> - <td id="LC58" class="blob-code blob-code-inner js-file-line"> refName <span class="pl-k">=</span> refDir <span class="pl-k">+</span> ref</td> - </tr> - <tr> - <td id="L59" class="blob-num js-line-number" data-line-number="59"></td> - <td id="LC59" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> now have reference file so we can proceed with the transcript mapping via bowtie2</span></td> - </tr> - <tr> - <td id="L60" class="blob-num js-line-number" data-line-number="60"></td> - <td id="LC60" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>bowtie2 -x <span class="pl-pds">"</span></span><span class="pl-k">+</span>refName<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span> -1 <span class="pl-pds">"</span></span><span class="pl-k">+</span>forwardFN<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span> -2 <span class="pl-pds">"</span></span><span class="pl-k">+</span>reverseFN<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span> -S <span class="pl-pds">"</span></span><span class="pl-k">+</span>inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sam<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L61" class="blob-num js-line-number" data-line-number="61"></td> - <td id="LC61" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(argString)</td> - </tr> - <tr> - <td id="L62" class="blob-num js-line-number" data-line-number="62"></td> - <td id="LC62" class="blob-code blob-code-inner js-file-line"> subprocess.call(argString, <span class="pl-v">shell</span><span class="pl-k">=</span><span class="pl-c1">True</span>) <span class="pl-c"><span class="pl-c">#</span>outputs a name.sam file</span></td> - </tr> - <tr> - <td 
id="L63" class="blob-num js-line-number" data-line-number="63"></td> - <td id="LC63" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span></td> - </tr> - <tr> - <td id="L64" class="blob-num js-line-number" data-line-number="64"></td> - <td id="LC64" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L65" class="blob-num js-line-number" data-line-number="65"></td> - <td id="LC65" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L66" class="blob-num js-line-number" data-line-number="66"></td> - <td id="LC66" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L67" class="blob-num js-line-number" data-line-number="67"></td> - <td id="LC67" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">processSamFiles</span>(<span class="pl-smi">inputname</span>):</td> - </tr> - <tr> - <td id="L68" class="blob-num js-line-number" data-line-number="68"></td> - <td id="LC68" class="blob-code blob-code-inner js-file-line"> cur_path <span class="pl-k">=</span> os.getcwd()</td> - </tr> - <tr> - <td id="L69" class="blob-num js-line-number" data-line-number="69"></td> - <td id="LC69" class="blob-code blob-code-inner js-file-line"> samName <span class="pl-k">=</span> cur_path<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>/<span class="pl-pds">"</span></span><span class="pl-k">+</span>inputname</td> - </tr> - <tr> - <td id="L70" class="blob-num js-line-number" data-line-number="70"></td> - <td id="LC70" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>samtools view -bS <span class="pl-pds">"</span></span><span class="pl-k">+</span>inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sam > <span class="pl-pds">"</span></span><span class="pl-k">+</span>samName<span class="pl-k">+</span><span 
class="pl-s"><span class="pl-pds">"</span>.bam<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L71" class="blob-num js-line-number" data-line-number="71"></td> - <td id="LC71" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(argString)</td> - </tr> - <tr> - <td id="L72" class="blob-num js-line-number" data-line-number="72"></td> - <td id="LC72" class="blob-code blob-code-inner js-file-line"> subprocess.call(argString, <span class="pl-v">shell</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L73" class="blob-num js-line-number" data-line-number="73"></td> - <td id="LC73" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L74" class="blob-num js-line-number" data-line-number="74"></td> - <td id="LC74" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>samtools sort <span class="pl-pds">"</span></span><span class="pl-k">+</span>samName<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.bam -o <span class="pl-pds">"</span></span><span class="pl-k">+</span>samName<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sorted<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L75" class="blob-num js-line-number" data-line-number="75"></td> - <td id="LC75" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(<span class="pl-s"><span class="pl-pds">"</span>argstring = <span class="pl-pds">"</span></span><span class="pl-k">+</span>argString)</td> - </tr> - <tr> - <td id="L76" class="blob-num js-line-number" data-line-number="76"></td> - <td id="LC76" class="blob-code blob-code-inner js-file-line"> subprocess.call(argString, <span class="pl-v">shell</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L77" class="blob-num js-line-number" 
data-line-number="77"></td> - <td id="LC77" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L78" class="blob-num js-line-number" data-line-number="78"></td> - <td id="LC78" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>samtools index <span class="pl-pds">"</span></span><span class="pl-k">+</span>samName<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sorted <span class="pl-pds">"</span></span><span class="pl-k">+</span>samName<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sorted.bai<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L79" class="blob-num js-line-number" data-line-number="79"></td> - <td id="LC79" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(<span class="pl-s"><span class="pl-pds">"</span>argstring = <span class="pl-pds">"</span></span> <span class="pl-k">+</span> argString)</td> - </tr> - <tr> - <td id="L80" class="blob-num js-line-number" data-line-number="80"></td> - <td id="LC80" class="blob-code blob-code-inner js-file-line"> subprocess.call(argString, <span class="pl-v">shell</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L81" class="blob-num js-line-number" data-line-number="81"></td> - <td id="LC81" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> <span class="pl-c"><span class="pl-c">#</span>we have saved out the relevent name.bam, name.sorted and name.sorted.bai files</span></td> - </tr> - <tr> - <td id="L82" class="blob-num js-line-number" data-line-number="82"></td> - <td id="LC82" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L83" class="blob-num js-line-number" data-line-number="83"></td> - <td id="LC83" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> we 
will not have the .gtf file so call cufflinks without -G option</span></td> - </tr> - <tr> - <td id="L84" class="blob-num js-line-number" data-line-number="84"></td> - <td id="LC84" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">transcriptAbundance</span>(<span class="pl-smi">inputname</span>):</td> - </tr> - <tr> - <td id="L85" class="blob-num js-line-number" data-line-number="85"></td> - <td id="LC85" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>cufflinks -o <span class="pl-pds">"</span></span><span class="pl-k">+</span>inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.cuff -u -p 8 <span class="pl-pds">"</span></span><span class="pl-k">+</span>inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sorted<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L86" class="blob-num js-line-number" data-line-number="86"></td> - <td id="LC86" class="blob-code blob-code-inner js-file-line"> subprocess.call(argString, <span class="pl-v">shell</span> <span class="pl-k">=</span> <span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L87" class="blob-num js-line-number" data-line-number="87"></td> - <td id="LC87" class="blob-code blob-code-inner js-file-line"> os.remove(inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sorted<span class="pl-pds">"</span></span>) <span class="pl-c"><span class="pl-c">#</span>remove name.sorted</span></td> - </tr> - <tr> - <td id="L88" class="blob-num js-line-number" data-line-number="88"></td> - <td id="LC88" class="blob-code blob-code-inner js-file-line"> os.remove(inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.sorted.bai<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L89" class="blob-num js-line-number" 
data-line-number="89"></td> - <td id="LC89" class="blob-code blob-code-inner js-file-line"> os.remove(inputname<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>.bam<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L90" class="blob-num js-line-number" data-line-number="90"></td> - <td id="LC90" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span></td> - </tr> - <tr> - <td id="L91" class="blob-num js-line-number" data-line-number="91"></td> - <td id="LC91" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L92" class="blob-num js-line-number" data-line-number="92"></td> - <td id="LC92" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">transcriptsForBlast</span>(<span class="pl-smi">name</span>, <span class="pl-smi">refFastq</span>):</td> - </tr> - <tr> - <td id="L93" class="blob-num js-line-number" data-line-number="93"></td> - <td id="LC93" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> quick and dirty just to see.</span></td> - </tr> - <tr> - <td id="L94" class="blob-num js-line-number" data-line-number="94"></td> - <td id="LC94" class="blob-code blob-code-inner js-file-line"> refBase <span class="pl-k">=</span> os.path.basename(refFastq)</td> - </tr> - <tr> - <td id="L95" class="blob-num js-line-number" data-line-number="95"></td> - <td id="LC95" class="blob-code blob-code-inner js-file-line"> ref <span class="pl-k">=</span> os.path.splitext(refBase)[<span class="pl-c1">0</span>] <span class="pl-c"><span class="pl-c">#</span> 'mydata/test.fasta' -> 'test'</span></td> - </tr> - <tr> - <td id="L96" class="blob-num js-line-number" data-line-number="96"></td> - <td id="LC96" class="blob-code blob-code-inner js-file-line"> dir_path <span class="pl-k">=</span> os.path.dirname(os.path.realpath(<span class="pl-c1">__file__</span>)) <span class="pl-c"><span class="pl-c">#</span> 
directory of this file</span></td> - </tr> - <tr> - <td id="L97" class="blob-num js-line-number" data-line-number="97"></td> - <td id="LC97" class="blob-code blob-code-inner js-file-line"> refPath <span class="pl-k">=</span> dir_path <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span>/data/Reference/<span class="pl-pds">"</span></span> <span class="pl-k">+</span> ref <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span>/<span class="pl-pds">"</span></span> <span class="pl-k">+</span> refBase <span class="pl-c"><span class="pl-c">#</span> eg refPath = data/Reference/Trinity/Trinity.fasta</span></td> - </tr> - <tr> - <td id="L98" class="blob-num js-line-number" data-line-number="98"></td> - <td id="LC98" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> used for dirty # refPath = 'Trinity.fasta' # dirty one</span></td> - </tr> - <tr> - <td id="L99" class="blob-num js-line-number" data-line-number="99"></td> - <td id="LC99" class="blob-code blob-code-inner js-file-line"> track_df <span class="pl-k">=</span> pd.read_csv(name<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">'</span>.cuff/genes.fpkm_tracking<span class="pl-pds">'</span></span>, <span class="pl-v">sep</span><span class="pl-k">=</span><span class="pl-s"><span class="pl-pds">'</span><span class="pl-cce">\t</span><span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L100" class="blob-num js-line-number" data-line-number="100"></td> - <td id="LC100" class="blob-code blob-code-inner js-file-line"> names <span class="pl-k">=</span> track_df[<span class="pl-s"><span class="pl-pds">'</span>locus<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L101" class="blob-num js-line-number" data-line-number="101"></td> - <td id="LC101" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(len(names))</span></td> - </tr> - <tr> - <td 
id="L102" class="blob-num js-line-number" data-line-number="102"></td> - <td id="LC102" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(names[:5])</span></td> - </tr> - <tr> - <td id="L103" class="blob-num js-line-number" data-line-number="103"></td> - <td id="LC103" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L104" class="blob-num js-line-number" data-line-number="104"></td> - <td id="LC104" class="blob-code blob-code-inner js-file-line"> nlist <span class="pl-k">=</span> []</td> - </tr> - <tr> - <td id="L105" class="blob-num js-line-number" data-line-number="105"></td> - <td id="LC105" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> n <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">0</span>,<span class="pl-c1">len</span>(names)):</td> - </tr> - <tr> - <td id="L106" class="blob-num js-line-number" data-line-number="106"></td> - <td id="LC106" class="blob-code blob-code-inner js-file-line"> i <span class="pl-k">=</span> names[n].find(<span class="pl-s"><span class="pl-pds">'</span>:<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L107" class="blob-num js-line-number" data-line-number="107"></td> - <td id="LC107" class="blob-code blob-code-inner js-file-line"> nlist.append(names[n][:i])</td> - </tr> - <tr> - <td id="L108" class="blob-num js-line-number" data-line-number="108"></td> - <td id="LC108" class="blob-code blob-code-inner js-file-line"> nameset <span class="pl-k">=</span> <span class="pl-c1">set</span>(nlist) <span class="pl-c"><span class="pl-c">#</span>get unique.</span></td> - </tr> - <tr> - <td id="L109" class="blob-num js-line-number" data-line-number="109"></td> - <td id="LC109" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">with</span> <span class="pl-c1">open</span>(refPath, <span class="pl-s"><span class="pl-pds">'</span>r<span class="pl-pds">'</span></span>) 
<span class="pl-k">as</span> myRef:</td> - </tr> - <tr> - <td id="L110" class="blob-num js-line-number" data-line-number="110"></td> - <td id="LC110" class="blob-code blob-code-inner js-file-line"> refData <span class="pl-k">=</span> myRef.read()</td> - </tr> - <tr> - <td id="L111" class="blob-num js-line-number" data-line-number="111"></td> - <td id="LC111" class="blob-code blob-code-inner js-file-line"> refData<span class="pl-k">=</span> refData<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">'</span><span class="pl-cce">\n</span>><span class="pl-pds">'</span></span></td> - </tr> - <tr> - <td id="L112" class="blob-num js-line-number" data-line-number="112"></td> - <td id="LC112" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L113" class="blob-num js-line-number" data-line-number="113"></td> - <td id="LC113" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">with</span> <span class="pl-c1">open</span>(name <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">'</span>_for_blast.fa<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>w<span class="pl-pds">'</span></span>) <span class="pl-k">as</span> outfile:</td> - </tr> - <tr> - <td id="L114" class="blob-num js-line-number" data-line-number="114"></td> - <td id="LC114" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> trans_id <span class="pl-k">in</span> nameset:</td> - </tr> - <tr> - <td id="L115" class="blob-num js-line-number" data-line-number="115"></td> - <td id="LC115" class="blob-code blob-code-inner js-file-line"> namepos <span class="pl-k">=</span> refData.find(trans_id)</td> - </tr> - <tr> - <td id="L116" class="blob-num js-line-number" data-line-number="116"></td> - <td id="LC116" class="blob-code blob-code-inner js-file-line"> endpos <span class="pl-k">=</span> refData.find(<span class="pl-s"><span class="pl-pds">'</span>><span class="pl-pds">'</span></span>, 
namepos)</td> - </tr> - <tr> - <td id="L117" class="blob-num js-line-number" data-line-number="117"></td> - <td id="LC117" class="blob-code blob-code-inner js-file-line"> outfile.write(<span class="pl-s"><span class="pl-pds">'</span>><span class="pl-pds">'</span></span><span class="pl-k">+</span>refData[namepos:endpos])</td> - </tr> - <tr> - <td id="L118" class="blob-num js-line-number" data-line-number="118"></td> - <td id="LC118" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L119" class="blob-num js-line-number" data-line-number="119"></td> - <td id="LC119" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">pass</span></td> - </tr> - <tr> - <td id="L120" class="blob-num js-line-number" data-line-number="120"></td> - <td id="LC120" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L121" class="blob-num js-line-number" data-line-number="121"></td> - <td id="LC121" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">blastContigs</span>(<span class="pl-smi">test_name</span>,<span class="pl-smi">html_resource</span>, <span class="pl-smi">database</span>):</td> - </tr> - <tr> - <td id="L122" class="blob-num js-line-number" data-line-number="122"></td> - <td id="LC122" class="blob-code blob-code-inner js-file-line"> db_path <span class="pl-k">=</span> database</td> - </tr> - <tr> - <td id="L123" class="blob-num js-line-number" data-line-number="123"></td> - <td id="LC123" class="blob-code blob-code-inner js-file-line"> argString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>blastx -db <span class="pl-pds">"</span></span><span class="pl-k">+</span>db_path<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span> -query <span class="pl-pds">"</span></span><span class="pl-k">+</span>test_name<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_for_blast.fa -outfmt 10 -out <span 
class="pl-pds">"</span></span><span class="pl-k">+</span>test_name<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_blast.txt<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L124" class="blob-num js-line-number" data-line-number="124"></td> - <td id="LC124" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(argString)</td> - </tr> - <tr> - <td id="L125" class="blob-num js-line-number" data-line-number="125"></td> - <td id="LC125" class="blob-code blob-code-inner js-file-line"> returncode <span class="pl-k">=</span> subprocess.call(argString, <span class="pl-v">shell</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L126" class="blob-num js-line-number" data-line-number="126"></td> - <td id="LC126" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">if</span> returncode <span class="pl-k">!=</span> <span class="pl-c1">0</span>:</td> - </tr> - <tr> - <td id="L127" class="blob-num js-line-number" data-line-number="127"></td> - <td id="LC127" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> <span class="pl-s"><span class="pl-pds">"</span>Error in blastall<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L128" class="blob-num js-line-number" data-line-number="128"></td> - <td id="LC128" class="blob-code blob-code-inner js-file-line"> blast_df <span class="pl-k">=</span> pd.read_csv(<span class="pl-s"><span class="pl-pds">"</span><span class="pl-pds">"</span></span><span class="pl-k">+</span>test_name<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_blast.txt<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L129" class="blob-num js-line-number" data-line-number="129"></td> - <td id="LC129" class="blob-code blob-code-inner js-file-line"> blast_df.columns <span class="pl-k">=</span> [<span class="pl-s"><span class="pl-pds">'</span>qaccver<span 
class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>pident<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>length<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>mismatch<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>gapopen<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>qstart<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>qend<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>sstart<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>send<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>evalue<span class="pl-pds">'</span></span>,<span class="pl-s"><span class="pl-pds">'</span>bitscore<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L130" class="blob-num js-line-number" data-line-number="130"></td> - <td id="LC130" class="blob-code blob-code-inner js-file-line"> blastResult_df <span class="pl-k">=</span> blast_df[(blast_df[<span class="pl-s"><span class="pl-pds">'</span>pident<span class="pl-pds">'</span></span>]<span class="pl-k">>=</span><span class="pl-c1">70</span>) <span class="pl-k">&</span> (blast_df[<span class="pl-s"><span class="pl-pds">'</span>length<span class="pl-pds">'</span></span>] <span class="pl-k">></span> <span class="pl-c1">100</span>) <span class="pl-k">&</span> (blast_df[<span class="pl-s"><span class="pl-pds">'</span>evalue<span class="pl-pds">'</span></span>] <span class="pl-k"><=</span><span class="pl-c1">0.001</span>) ]</td> - </tr> - <tr> - <td id="L131" class="blob-num js-line-number" data-line-number="131"></td> - <td id="LC131" class="blob-code blob-code-inner js-file-line"> blastResult_df <span 
class="pl-k">=</span> blastResult_df[[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>pident<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>evalue<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>bitscore<span class="pl-pds">'</span></span>]] <span class="pl-c"><span class="pl-c">#</span>query accession.version, subject accession.version, Percentage of identical matches</span></td> - </tr> - <tr> - <td id="L132" class="blob-num js-line-number" data-line-number="132"></td> - <td id="LC132" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> need to allocate the transcripts (if allocated more than once to the phylotype with least error.</span></td> - </tr> - <tr> - <td id="L133" class="blob-num js-line-number" data-line-number="133"></td> - <td id="LC133" class="blob-code blob-code-inner js-file-line"> transcripts <span class="pl-k">=</span> blastResult_df[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L134" class="blob-num js-line-number" data-line-number="134"></td> - <td id="LC134" class="blob-code blob-code-inner js-file-line"> b_df <span class="pl-k">=</span> pd.DataFrame(<span class="pl-v">columns</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>pident<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>evalue<span class="pl-pds">'</span></span>, <span class="pl-s"><span class="pl-pds">'</span>bitscore<span 
class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L135" class="blob-num js-line-number" data-line-number="135"></td> - <td id="LC135" class="blob-code blob-code-inner js-file-line"> transSet <span class="pl-k">=</span> <span class="pl-c1">set</span>(transcripts)</td> - </tr> - <tr> - <td id="L136" class="blob-num js-line-number" data-line-number="136"></td> - <td id="LC136" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> t <span class="pl-k">in</span> transSet:</td> - </tr> - <tr> - <td id="L137" class="blob-num js-line-number" data-line-number="137"></td> - <td id="LC137" class="blob-code blob-code-inner js-file-line"> temp_df <span class="pl-k">=</span> blastResult_df[(blastResult_df[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>] <span class="pl-k">==</span> t)]</td> - </tr> - <tr> - <td id="L138" class="blob-num js-line-number" data-line-number="138"></td> - <td id="LC138" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> get one with smallest error value</span></td> - </tr> - <tr> - <td id="L139" class="blob-num js-line-number" data-line-number="139"></td> - <td id="LC139" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(t + ":")</span></td> - </tr> - <tr> - <td id="L140" class="blob-num js-line-number" data-line-number="140"></td> - <td id="LC140" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(temp_df)</span></td> - </tr> - <tr> - <td id="L141" class="blob-num js-line-number" data-line-number="141"></td> - <td id="LC141" class="blob-code blob-code-inner js-file-line"> temp_df <span class="pl-k">=</span> temp_df.sort_values(<span class="pl-v">by</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>evalue<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L142" class="blob-num 
js-line-number" data-line-number="142"></td> - <td id="LC142" class="blob-code blob-code-inner js-file-line"> b_df <span class="pl-k">=</span> b_df.append(temp_df.iloc[[<span class="pl-c1">0</span>]])</td> - </tr> - <tr> - <td id="L143" class="blob-num js-line-number" data-line-number="143"></td> - <td id="LC143" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L144" class="blob-num js-line-number" data-line-number="144"></td> - <td id="LC144" class="blob-code blob-code-inner js-file-line"> b_df.sort_values(<span class="pl-v">by</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L145" class="blob-num js-line-number" data-line-number="145"></td> - <td id="LC145" class="blob-code blob-code-inner js-file-line"> b_df.to_csv(test_name <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">'</span>_transcript.csv<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L146" class="blob-num js-line-number" data-line-number="146"></td> - <td id="LC146" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> b_df</td> - </tr> - <tr> - <td id="L147" class="blob-num js-line-number" data-line-number="147"></td> - <td id="LC147" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L148" class="blob-num js-line-number" data-line-number="148"></td> - <td id="LC148" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L149" class="blob-num js-line-number" data-line-number="149"></td> - <td id="LC149" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">createMultiHTML</span>(<span class="pl-smi">tdict</span>,<span class="pl-smi">composite_df</span>):</td> - </tr> - <tr> - <td id="L150" class="blob-num js-line-number" data-line-number="150"></td> - <td id="LC150" class="blob-code blob-code-inner 
js-file-line"> labelList <span class="pl-k">=</span> composite_df.columns.tolist()</td> - </tr> - <tr> - <td id="L151" class="blob-num js-line-number" data-line-number="151"></td> - <td id="LC151" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><html><title>T<span class="pl-c1">.</span>vivax VAP <span class="pl-c1">(</span>Transcriptomic Pathway<span class="pl-c1">(</span></title><body><div style='text-align:center'><h2><i>Trypanosoma vivax</i> Variant Antigen Profile</h2><h3><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L152" class="blob-num js-line-number" data-line-number="152"></td> - <td id="LC152" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span>Sample name: <span class="pl-pds">"</span></span><span class="pl-k">+</span>tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L153" class="blob-num js-line-number" data-line-number="153"></td> - <td id="LC153" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><br>Transcriptomic Analysis</h3></p><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L154" class="blob-num js-line-number" data-line-number="154"></td> - <td id="LC154" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span><p style = 'margin-left:20%; margin-right:20%'>Legend: <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L155" class="blob-num js-line-number" data-line-number="155"></td> - <td id="LC155" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Variant 
Antigen Profile of a <i>Trypanosoma vivax</i> transcriptomes. <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L156" class="blob-num js-line-number" data-line-number="156"></td> - <td id="LC156" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Weighted Frequency reflects Phylotype abundance and is expressed as <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L157" class="blob-num js-line-number" data-line-number="157"></td> - <td id="LC157" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>phylotype frequencies adjusted for the combined transcript abundance. <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L158" class="blob-num js-line-number" data-line-number="158"></td> - <td id="LC158" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Data was produced with VAPPER-Variant Antigen Profiler <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L159" class="blob-num js-line-number" data-line-number="159"></td> - <td id="LC159" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>(Silva Pereira et al., 2019).</p> <span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L160" class="blob-num js-line-number" data-line-number="160"></td> - <td id="LC160" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><style> table, th, tr, td {border: 1px solid black; border-collapse: collapse;}</style><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L161" class="blob-num js-line-number" data-line-number="161"></td> - <td id="LC161" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L162" class="blob-num js-line-number" data-line-number="162"></td> - <td 
id="LC162" class="blob-code blob-code-inner js-file-line"> header <span class="pl-k">=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><table style='width:50%;margin-left:25%;text-align:center'><tr><th>Phylotype</th><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L163" class="blob-num js-line-number" data-line-number="163"></td> - <td id="LC163" class="blob-code blob-code-inner js-file-line"> wLists <span class="pl-k">=</span> []</td> - </tr> - <tr> - <td id="L164" class="blob-num js-line-number" data-line-number="164"></td> - <td id="LC164" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L165" class="blob-num js-line-number" data-line-number="165"></td> - <td id="LC165" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> j <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">1</span>,<span class="pl-c1">len</span>(labelList)):</td> - </tr> - <tr> - <td id="L166" class="blob-num js-line-number" data-line-number="166"></td> - <td id="LC166" class="blob-code blob-code-inner js-file-line"> wLists.append(composite_df[labelList[j]])</td> - </tr> - <tr> - <td id="L167" class="blob-num js-line-number" data-line-number="167"></td> - <td id="LC167" class="blob-code blob-code-inner js-file-line"> header <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><th><span class="pl-pds">"</span></span> <span class="pl-k">+</span> <span class="pl-c1">str</span>(labelList[j]) <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></th><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L168" class="blob-num js-line-number" data-line-number="168"></td> - <td id="LC168" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L169" class="blob-num js-line-number" data-line-number="169"></td> - <td id="LC169" class="blob-code 
blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span></tr><span class="pl-cce">\n</span><span class="pl-pds">"</span></span> <span class="pl-k">+</span> header</td> - </tr> - <tr> - <td id="L170" class="blob-num js-line-number" data-line-number="170"></td> - <td id="LC170" class="blob-code blob-code-inner js-file-line"> tabString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L171" class="blob-num js-line-number" data-line-number="171"></td> - <td id="LC171" class="blob-code blob-code-inner js-file-line"> phyList <span class="pl-k">=</span> composite_df[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L172" class="blob-num js-line-number" data-line-number="172"></td> - <td id="LC172" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L173" class="blob-num js-line-number" data-line-number="173"></td> - <td id="LC173" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L174" class="blob-num js-line-number" data-line-number="174"></td> - <td id="LC174" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L175" class="blob-num js-line-number" data-line-number="175"></td> - <td id="LC175" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> i <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">0</span>, <span class="pl-c1">len</span>(composite_df)):</td> - </tr> - <tr> - <td id="L176" class="blob-num js-line-number" data-line-number="176"></td> - <td id="LC176" class="blob-code blob-code-inner js-file-line"> tabString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span><tr><td><span class="pl-pds">"</span></span> <span class="pl-k">+</span> <span 
class="pl-c1">str</span>(phyList[i]) <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></td><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L177" class="blob-num js-line-number" data-line-number="177"></td> - <td id="LC177" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> j <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">0</span>,<span class="pl-c1">len</span>(labelList)<span class="pl-k">-</span><span class="pl-c1">1</span>):</td> - </tr> - <tr> - <td id="L178" class="blob-num js-line-number" data-line-number="178"></td> - <td id="LC178" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(j)</span></td> - </tr> - <tr> - <td id="L179" class="blob-num js-line-number" data-line-number="179"></td> - <td id="LC179" class="blob-code blob-code-inner js-file-line"> f <span class="pl-k">=</span> <span class="pl-c1">format</span>(wLists[j][i], <span class="pl-s"><span class="pl-pds">'</span>.4f<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L180" class="blob-num js-line-number" data-line-number="180"></td> - <td id="LC180" class="blob-code blob-code-inner js-file-line"> tabString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span><td><span class="pl-pds">"</span></span> <span class="pl-k">+</span> <span class="pl-c1">str</span>(f) <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></td><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L181" class="blob-num js-line-number" data-line-number="181"></td> - <td id="LC181" class="blob-code blob-code-inner js-file-line"> tabString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span></tr><span class="pl-cce">\n</span><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L182" class="blob-num js-line-number" data-line-number="182"></td> - <td id="LC182" 
class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L183" class="blob-num js-line-number" data-line-number="183"></td> - <td id="LC183" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> tabString <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></table><br><br><br><br><br><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L184" class="blob-num js-line-number" data-line-number="184"></td> - <td id="LC184" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><h3>Weighted Relative Frequencies of Detected Phylotypes<span class="pl-c1">.</span></h3><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L185" class="blob-num js-line-number" data-line-number="185"></td> - <td id="LC185" class="blob-code blob-code-inner js-file-line"> imgString <span class="pl-k">=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><img src = '<span class="pl-pds">"</span></span><span class="pl-k">+</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_phylotypes.png' alt='Bar chart of phylotype variation' style='max-width:100%'><br><br><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L186" class="blob-num js-line-number" data-line-number="186"></td> - <td id="LC186" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> imgString</td> - </tr> - <tr> - <td id="L187" class="blob-num js-line-number" data-line-number="187"></td> - <td id="LC187" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L188" class="blob-num js-line-number" data-line-number="188"></td> - <td id="LC188" class="blob-code blob-code-inner js-file-line"> <span 
class="pl-k">with</span> <span class="pl-c1">open</span>(tdict[<span class="pl-s"><span class="pl-pds">'</span>html_file<span class="pl-pds">'</span></span>], <span class="pl-s"><span class="pl-pds">"</span>w<span class="pl-pds">"</span></span>) <span class="pl-k">as</span> htmlfile:</td> - </tr> - <tr> - <td id="L189" class="blob-num js-line-number" data-line-number="189"></td> - <td id="LC189" class="blob-code blob-code-inner js-file-line"> htmlfile.write(htmlString)</td> - </tr> - <tr> - <td id="L190" class="blob-num js-line-number" data-line-number="190"></td> - <td id="LC190" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L191" class="blob-num js-line-number" data-line-number="191"></td> - <td id="LC191" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L192" class="blob-num js-line-number" data-line-number="192"></td> - <td id="LC192" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">createHTML</span>(<span class="pl-smi">tdict</span>,<span class="pl-smi">sum_df</span>):</td> - </tr> - <tr> - <td id="L193" class="blob-num js-line-number" data-line-number="193"></td> - <td id="LC193" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>assumes imgs are heatmap.png, dheatmap.png, vapPCA.png and already in htmlresource</span></td> - </tr> - <tr> - <td id="L194" class="blob-num js-line-number" data-line-number="194"></td> - <td id="LC194" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><html><title>T<span class="pl-c1">.</span>vivax VAP <span class="pl-c1">(</span>Transcriptomic Pathway<span class="pl-c1">(</span></title><body><div style='text-align:center'><h2><i>Trypanosoma vivax</i> Variant Antigen Profile</h2><h3><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L195" 
class="blob-num js-line-number" data-line-number="195"></td> - <td id="LC195" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span>Sample name: <span class="pl-pds">"</span></span><span class="pl-k">+</span>tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L196" class="blob-num js-line-number" data-line-number="196"></td> - <td id="LC196" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><br>Transcriptomic Analysis</h3></p><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L197" class="blob-num js-line-number" data-line-number="197"></td> - <td id="LC197" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span><p style = 'margin-left:20%; margin-right:20%'>Legend: <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L198" class="blob-num js-line-number" data-line-number="198"></td> - <td id="LC198" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Variant Antigen Profile of a <i>Trypanosoma vivax</i> transcriptome. 
<span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L199" class="blob-num js-line-number" data-line-number="199"></td> - <td id="LC199" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Weighted Frequency reflects Phylotype abundance and is expressed as <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L200" class="blob-num js-line-number" data-line-number="200"></td> - <td id="LC200" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>phylotype frequencies adjusted for the combined transcript abundance. <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L201" class="blob-num js-line-number" data-line-number="201"></td> - <td id="LC201" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Data was produced with VAPPER-Variant Antigen Profiler <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L202" class="blob-num js-line-number" data-line-number="202"></td> - <td id="LC202" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>(Silva Pereira et al., 2019).</p> <span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L203" class="blob-num js-line-number" data-line-number="203"></td> - <td id="LC203" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><style> table, th, tr, td {border: 1px solid black; border-collapse: collapse;}</style><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L204" class="blob-num js-line-number" data-line-number="204"></td> - <td id="LC204" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L205" class="blob-num js-line-number" data-line-number="205"></td> - <td id="LC205" class="blob-code blob-code-inner js-file-line"> htmlString 
<span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><table style='width:50%;table-layout: auto; margin-left:25%;text-align:center'><tr><th>Phylotype</th><span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L206" class="blob-num js-line-number" data-line-number="206"></td> - <td id="LC206" class="blob-code blob-code-inner js-file-line"> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><th>Combined FPKM</th><th>Weighted Frequency</th></tr><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L207" class="blob-num js-line-number" data-line-number="207"></td> - <td id="LC207" class="blob-code blob-code-inner js-file-line"> tabString <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L208" class="blob-num js-line-number" data-line-number="208"></td> - <td id="LC208" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> flush out table with correct values</span></td> - </tr> - <tr> - <td id="L209" class="blob-num js-line-number" data-line-number="209"></td> - <td id="LC209" class="blob-code blob-code-inner js-file-line"> phySeries <span class="pl-k">=</span> sum_df[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L210" class="blob-num js-line-number" data-line-number="210"></td> - <td id="LC210" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> sacSeries = sum_df['saccver']</span></td> - </tr> - <tr> - <td id="L211" class="blob-num js-line-number" data-line-number="211"></td> - <td id="LC211" class="blob-code blob-code-inner js-file-line"> fSeries <span class="pl-k">=</span> sum_df[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L212" 
class="blob-num js-line-number" data-line-number="212"></td> - <td id="LC212" class="blob-code blob-code-inner js-file-line"> total <span class="pl-k">=</span> fSeries.sum()</td> - </tr> - <tr> - <td id="L213" class="blob-num js-line-number" data-line-number="213"></td> - <td id="LC213" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print("Total="+str(total))</span></td> - </tr> - <tr> - <td id="L214" class="blob-num js-line-number" data-line-number="214"></td> - <td id="LC214" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> i <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">0</span>, <span class="pl-c1">len</span>(sum_df)):</td> - </tr> - <tr> - <td id="L215" class="blob-num js-line-number" data-line-number="215"></td> - <td id="LC215" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(phySeries[i])</span></td> - </tr> - <tr> - <td id="L216" class="blob-num js-line-number" data-line-number="216"></td> - <td id="LC216" class="blob-code blob-code-inner js-file-line"> f <span class="pl-k">=</span> <span class="pl-c1">format</span>(fSeries[i], <span class="pl-s"><span class="pl-pds">'</span>.2f<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L217" class="blob-num js-line-number" data-line-number="217"></td> - <td id="LC217" class="blob-code blob-code-inner js-file-line"> w <span class="pl-k">=</span> <span class="pl-c1">format</span>(fSeries[i]<span class="pl-k">/</span>total, <span class="pl-s"><span class="pl-pds">'</span>.2f<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L218" class="blob-num js-line-number" data-line-number="218"></td> - <td id="LC218" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L219" class="blob-num js-line-number" data-line-number="219"></td> - <td id="LC219" class="blob-code blob-code-inner js-file-line"> <span 
class="pl-c"><span class="pl-c">#</span>w = format(weightList[i], '.4f')</span></td> - </tr> - <tr> - <td id="L220" class="blob-num js-line-number" data-line-number="220"></td> - <td id="LC220" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L221" class="blob-num js-line-number" data-line-number="221"></td> - <td id="LC221" class="blob-code blob-code-inner js-file-line"> tabString <span class="pl-k">+=</span> <span class="pl-s"><span class="pl-pds">"</span><tr><td><span class="pl-pds">"</span></span> <span class="pl-k">+</span> <span class="pl-c1">str</span>(phySeries[i]) <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></td><td><span class="pl-pds">"</span></span> <span class="pl-k">+</span> <span class="pl-c1">str</span>(f) <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></td><td><span class="pl-pds">"</span></span><span class="pl-k">+</span><span class="pl-c1">str</span>(w)<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span></tr><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L222" class="blob-num js-line-number" data-line-number="222"></td> - <td id="LC222" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> tabString <span class="pl-k">+</span> <span class="pl-s"><span class="pl-pds">"</span></table><br><br><br><br><br><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L223" class="blob-num js-line-number" data-line-number="223"></td> - <td id="LC223" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><h3>Weighted Relative Frequencies of Detected Phylotypes<span class="pl-c1">.</span></h3><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L224" class="blob-num js-line-number" data-line-number="224"></td> - <td id="LC224" class="blob-code blob-code-inner 
js-file-line"> imgString <span class="pl-k">=</span> <span class="pl-sr"><span class="pl-k">r</span><span class="pl-pds">"</span><img src = '<span class="pl-pds">"</span></span><span class="pl-k">+</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_phylotypes.png' alt='Bar chart of phylotype variation' style='max-width:100%'><br><br><span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L225" class="blob-num js-line-number" data-line-number="225"></td> - <td id="LC225" class="blob-code blob-code-inner js-file-line"> htmlString <span class="pl-k">+=</span> imgString</td> - </tr> - <tr> - <td id="L226" class="blob-num js-line-number" data-line-number="226"></td> - <td id="LC226" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L227" class="blob-num js-line-number" data-line-number="227"></td> - <td id="LC227" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">with</span> <span class="pl-c1">open</span>(tdict[<span class="pl-s"><span class="pl-pds">'</span>html_file<span class="pl-pds">'</span></span>], <span class="pl-s"><span class="pl-pds">"</span>w<span class="pl-pds">"</span></span>) <span class="pl-k">as</span> htmlfile:</td> - </tr> - <tr> - <td id="L228" class="blob-num js-line-number" data-line-number="228"></td> - <td id="LC228" class="blob-code blob-code-inner js-file-line"> htmlfile.write(htmlString)</td> - </tr> - <tr> - <td id="L229" class="blob-num js-line-number" data-line-number="229"></td> - <td id="LC229" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L230" class="blob-num js-line-number" data-line-number="230"></td> - <td id="LC230" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L231" class="blob-num js-line-number" data-line-number="231"></td> - <td id="LC231" class="blob-code blob-code-inner 
js-file-line"> -</td> - </tr> - <tr> - <td id="L232" class="blob-num js-line-number" data-line-number="232"></td> - <td id="LC232" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">getPhyloNumber</span>(<span class="pl-smi">sac</span>):</td> - </tr> - <tr> - <td id="L233" class="blob-num js-line-number" data-line-number="233"></td> - <td id="LC233" class="blob-code blob-code-inner js-file-line"> i <span class="pl-k">=</span> sac.find(<span class="pl-s"><span class="pl-pds">'</span>_<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L234" class="blob-num js-line-number" data-line-number="234"></td> - <td id="LC234" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> <span class="pl-c1">int</span>(sac[<span class="pl-c1">1</span>:i])</td> - </tr> - <tr> - <td id="L235" class="blob-num js-line-number" data-line-number="235"></td> - <td id="LC235" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L236" class="blob-num js-line-number" data-line-number="236"></td> - <td id="LC236" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">combineFPMK</span>(<span class="pl-smi">tdict</span>):</td> - </tr> - <tr> - <td id="L237" class="blob-num js-line-number" data-line-number="237"></td> - <td id="LC237" class="blob-code blob-code-inner js-file-line"> fpkm_df <span class="pl-k">=</span> pd.read_csv(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">'</span>.cuff/genes.fpkm_tracking<span class="pl-pds">'</span></span>, <span class="pl-v">sep</span><span class="pl-k">=</span><span class="pl-s"><span class="pl-pds">'</span><span class="pl-cce">\t</span><span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L238" class="blob-num js-line-number" data-line-number="238"></td> - <td id="LC238" 
class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L239" class="blob-num js-line-number" data-line-number="239"></td> - <td id="LC239" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>fpkm_df = pd.read_csv('genes.fpkm_tracking',sep='\t')</span></td> - </tr> - <tr> - <td id="L240" class="blob-num js-line-number" data-line-number="240"></td> - <td id="LC240" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(fpkm_df.head())</span></td> - </tr> - <tr> - <td id="L241" class="blob-num js-line-number" data-line-number="241"></td> - <td id="LC241" class="blob-code blob-code-inner js-file-line"> fpkm_df[<span class="pl-s"><span class="pl-pds">'</span>locus<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> fpkm_df[<span class="pl-s"><span class="pl-pds">'</span>locus<span class="pl-pds">'</span></span>].apply(<span class="pl-k">lambda</span> <span class="pl-smi">names</span>: names[:names.find(<span class="pl-s"><span class="pl-pds">'</span>:<span class="pl-pds">'</span></span>)])</td> - </tr> - <tr> - <td id="L242" class="blob-num js-line-number" data-line-number="242"></td> - <td id="LC242" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(fpkm_df.head())</span></td> - </tr> - <tr> - <td id="L243" class="blob-num js-line-number" data-line-number="243"></td> - <td id="LC243" class="blob-code blob-code-inner js-file-line"> reducedBlast_df <span class="pl-k">=</span> pd.read_csv(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">'</span>_transcript.csv<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L244" class="blob-num js-line-number" data-line-number="244"></td> - <td id="LC244" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span 
class="pl-c">#</span> reducedBlast_df = pd.read_csv('TrinityVT_transcript.csv')</span></td> - </tr> - <tr> - <td id="L245" class="blob-num js-line-number" data-line-number="245"></td> - <td id="LC245" class="blob-code blob-code-inner js-file-line"> saccverSet <span class="pl-k">=</span> <span class="pl-c1">set</span>(reducedBlast_df[<span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L246" class="blob-num js-line-number" data-line-number="246"></td> - <td id="LC246" class="blob-code blob-code-inner js-file-line"> saccverList <span class="pl-k">=</span> <span class="pl-c1">list</span>(saccverSet)</td> - </tr> - <tr> - <td id="L247" class="blob-num js-line-number" data-line-number="247"></td> - <td id="LC247" class="blob-code blob-code-inner js-file-line"> saccverList.sort()</td> - </tr> - <tr> - <td id="L248" class="blob-num js-line-number" data-line-number="248"></td> - <td id="LC248" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(saccverList[:5])</span></td> - </tr> - <tr> - <td id="L249" class="blob-num js-line-number" data-line-number="249"></td> - <td id="LC249" class="blob-code blob-code-inner js-file-line"> new_df <span class="pl-k">=</span> pd.DataFrame(<span class="pl-v">columns</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>,<span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>,<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L250" class="blob-num js-line-number" data-line-number="250"></td> - <td id="LC250" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> sv <span class="pl-k">in</span> saccverList:</td> - </tr> - <tr> - <td id="L251" class="blob-num js-line-number" data-line-number="251"></td> - <td id="LC251" 
class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(sv)</span></td> - </tr> - <tr> - <td id="L252" class="blob-num js-line-number" data-line-number="252"></td> - <td id="LC252" class="blob-code blob-code-inner js-file-line"> temp_df <span class="pl-k">=</span> reducedBlast_df[reducedBlast_df[<span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>] <span class="pl-k">==</span> sv]</td> - </tr> - <tr> - <td id="L253" class="blob-num js-line-number" data-line-number="253"></td> - <td id="LC253" class="blob-code blob-code-inner js-file-line"> qList <span class="pl-k">=</span> <span class="pl-c1">list</span>(temp_df[<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L254" class="blob-num js-line-number" data-line-number="254"></td> - <td id="LC254" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> q <span class="pl-k">in</span> qList:</td> - </tr> - <tr> - <td id="L255" class="blob-num js-line-number" data-line-number="255"></td> - <td id="LC255" class="blob-code blob-code-inner js-file-line"> f_df <span class="pl-k">=</span> fpkm_df[(fpkm_df[<span class="pl-s"><span class="pl-pds">'</span>locus<span class="pl-pds">'</span></span>] <span class="pl-k">==</span> q)]</td> - </tr> - <tr> - <td id="L256" class="blob-num js-line-number" data-line-number="256"></td> - <td id="LC256" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">if</span> <span class="pl-c1">len</span>(f_df) <span class="pl-k">></span> <span class="pl-c1">1</span>:</td> - </tr> - <tr> - <td id="L257" class="blob-num js-line-number" data-line-number="257"></td> - <td id="LC257" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">print</span>(<span class="pl-s"><span class="pl-pds">'</span>WARNING MULTIPLE FPKM<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L258" 
class="blob-num js-line-number" data-line-number="258"></td> - <td id="LC258" class="blob-code blob-code-inner js-file-line"> new_fpkm<span class="pl-k">=</span><span class="pl-c1">list</span>(f_df[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L259" class="blob-num js-line-number" data-line-number="259"></td> - <td id="LC259" class="blob-code blob-code-inner js-file-line"> f <span class="pl-k">=</span> (new_fpkm[<span class="pl-c1">0</span>])</td> - </tr> - <tr> - <td id="L260" class="blob-num js-line-number" data-line-number="260"></td> - <td id="LC260" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(f)</span></td> - </tr> - <tr> - <td id="L261" class="blob-num js-line-number" data-line-number="261"></td> - <td id="LC261" class="blob-code blob-code-inner js-file-line"> new_df <span class="pl-k">=</span> new_df.append({<span class="pl-s"><span class="pl-pds">'</span>qaccver<span class="pl-pds">'</span></span>: q, <span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>: sv, <span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>: f}, <span class="pl-v">ignore_index</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L262" class="blob-num js-line-number" data-line-number="262"></td> - <td id="LC262" class="blob-code blob-code-inner js-file-line"> FPKMsum_df <span class="pl-k">=</span> new_df.groupby(<span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>)[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>].sum().reset_index()</td> - </tr> - <tr> - <td id="L263" class="blob-num js-line-number" data-line-number="263"></td> - <td id="LC263" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L264" class="blob-num js-line-number" 
data-line-number="264"></td> - <td id="LC264" class="blob-code blob-code-inner js-file-line"> FPKMsum_df[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> FPKMsum_df.apply(<span class="pl-k">lambda</span> <span class="pl-smi">row</span>: getPhyloNumber(row[<span class="pl-s"><span class="pl-pds">'</span>saccver<span class="pl-pds">'</span></span>]), <span class="pl-v">axis</span><span class="pl-k">=</span><span class="pl-c1">1</span>)</td> - </tr> - <tr> - <td id="L265" class="blob-num js-line-number" data-line-number="265"></td> - <td id="LC265" class="blob-code blob-code-inner js-file-line"> FPKMsum_df <span class="pl-k">=</span> FPKMsum_df.sort_values(<span class="pl-v">by</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L266" class="blob-num js-line-number" data-line-number="266"></td> - <td id="LC266" class="blob-code blob-code-inner js-file-line"> FPKMsum_df <span class="pl-k">=</span> FPKMsum_df.reset_index(<span class="pl-v">drop</span><span class="pl-k">=</span><span class="pl-c1">True</span>)</td> - </tr> - <tr> - <td id="L267" class="blob-num js-line-number" data-line-number="267"></td> - <td id="LC267" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L268" class="blob-num js-line-number" data-line-number="268"></td> - <td id="LC268" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(FPKMsum_df)</span></td> - </tr> - <tr> - <td id="L269" class="blob-num js-line-number" data-line-number="269"></td> - <td id="LC269" class="blob-code blob-code-inner js-file-line"> FPKMsum_df.to_csv(<span class="pl-s"><span class="pl-pds">'</span>FPKM_sum.csv<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L270" class="blob-num js-line-number" data-line-number="270"></td> - <td id="LC270" 
class="blob-code blob-code-inner js-file-line"> FPKMsum2_df <span class="pl-k">=</span> FPKMsum_df.groupby(<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>)[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>].sum().reset_index()</td> - </tr> - <tr> - <td id="L271" class="blob-num js-line-number" data-line-number="271"></td> - <td id="LC271" class="blob-code blob-code-inner js-file-line"> FPKMsum2_df <span class="pl-k">=</span> FPKMsum2_df.sort_values(<span class="pl-v">by</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L272" class="blob-num js-line-number" data-line-number="272"></td> - <td id="LC272" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L273" class="blob-num js-line-number" data-line-number="273"></td> - <td id="LC273" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(FPKMsum2_df)</span></td> - </tr> - <tr> - <td id="L274" class="blob-num js-line-number" data-line-number="274"></td> - <td id="LC274" class="blob-code blob-code-inner js-file-line"> FPKMsum2_df.to_csv(<span class="pl-s"><span class="pl-pds">'</span>FPKM_sum2.csv<span class="pl-pds">'</span></span>) <span class="pl-c"><span class="pl-c">#</span> in case more than one entry for a particular phylotype</span></td> - </tr> - <tr> - <td id="L275" class="blob-num js-line-number" data-line-number="275"></td> - <td id="LC275" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> FPKMsum_df, FPKMsum2_df</td> - </tr> - <tr> - <td id="L276" class="blob-num js-line-number" data-line-number="276"></td> - <td id="LC276" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L277" class="blob-num js-line-number" data-line-number="277"></td> - <td id="LC277" class="blob-code 
blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L278" class="blob-num js-line-number" data-line-number="278"></td> - <td id="LC278" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L279" class="blob-num js-line-number" data-line-number="279"></td> - <td id="LC279" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">normalisef</span>(<span class="pl-smi">f</span>,<span class="pl-smi">max</span>):</td> - </tr> - <tr> - <td id="L280" class="blob-num js-line-number" data-line-number="280"></td> - <td id="LC280" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> f<span class="pl-k">/</span><span class="pl-c1">max</span></td> - </tr> - <tr> - <td id="L281" class="blob-num js-line-number" data-line-number="281"></td> - <td id="LC281" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L282" class="blob-num js-line-number" data-line-number="282"></td> - <td id="LC282" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">getComposite_sum2</span>(<span class="pl-smi">nameList</span>,<span class="pl-smi">sum2_dfs</span>):</td> - </tr> - <tr> - <td id="L283" class="blob-num js-line-number" data-line-number="283"></td> - <td id="LC283" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> lets get a composite sum2_df from all of the sum2_dfs</span></td> - </tr> - <tr> - <td id="L284" class="blob-num js-line-number" data-line-number="284"></td> - <td id="LC284" class="blob-code blob-code-inner js-file-line"> phyList <span class="pl-k">=</span> []</td> - </tr> - <tr> - <td id="L285" class="blob-num js-line-number" data-line-number="285"></td> - <td id="LC285" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L286" class="blob-num js-line-number" data-line-number="286"></td> - <td id="LC286" class="blob-code 
blob-code-inner js-file-line"> <span class="pl-k">for</span> i <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">0</span>, <span class="pl-c1">len</span>(sum2_dfs)):</td> - </tr> - <tr> - <td id="L287" class="blob-num js-line-number" data-line-number="287"></td> - <td id="LC287" class="blob-code blob-code-inner js-file-line"> total <span class="pl-k">=</span> sum2_dfs[i][<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>].sum()</td> - </tr> - <tr> - <td id="L288" class="blob-num js-line-number" data-line-number="288"></td> - <td id="LC288" class="blob-code blob-code-inner js-file-line"> sum2_dfs[i][<span class="pl-s"><span class="pl-pds">'</span>w<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> sum2_dfs[i].apply(<span class="pl-k">lambda</span> <span class="pl-smi">row</span>: normalisef(row[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>], total), <span class="pl-v">axis</span><span class="pl-k">=</span><span class="pl-c1">1</span>)</td> - </tr> - <tr> - <td id="L289" class="blob-num js-line-number" data-line-number="289"></td> - <td id="LC289" class="blob-code blob-code-inner js-file-line"> pSeries <span class="pl-k">=</span> sum2_dfs[i][<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L290" class="blob-num js-line-number" data-line-number="290"></td> - <td id="LC290" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> p <span class="pl-k">in</span> pSeries:</td> - </tr> - <tr> - <td id="L291" class="blob-num js-line-number" data-line-number="291"></td> - <td id="LC291" class="blob-code blob-code-inner js-file-line"> phyList.append(p) <span class="pl-c"><span class="pl-c">#</span> get all the phylotypes in this one</span></td> - </tr> - <tr> - <td id="L292" class="blob-num js-line-number" data-line-number="292"></td> - <td id="LC292" 
class="blob-code blob-code-inner js-file-line"> phyList <span class="pl-k">=</span> <span class="pl-c1">list</span>(<span class="pl-c1">set</span>(phyList))</td> - </tr> - <tr> - <td id="L293" class="blob-num js-line-number" data-line-number="293"></td> - <td id="LC293" class="blob-code blob-code-inner js-file-line"> phyList.sort()</td> - </tr> - <tr> - <td id="L294" class="blob-num js-line-number" data-line-number="294"></td> - <td id="LC294" class="blob-code blob-code-inner js-file-line"> composite_sum2_df <span class="pl-k">=</span> pd.DataFrame(phyList, <span class="pl-v">columns</span><span class="pl-k">=</span>[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L295" class="blob-num js-line-number" data-line-number="295"></td> - <td id="LC295" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> i <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">0</span>, <span class="pl-c1">len</span>(sum2_dfs)):</td> - </tr> - <tr> - <td id="L296" class="blob-num js-line-number" data-line-number="296"></td> - <td id="LC296" class="blob-code blob-code-inner js-file-line"> wList <span class="pl-k">=</span> []</td> - </tr> - <tr> - <td id="L297" class="blob-num js-line-number" data-line-number="297"></td> - <td id="LC297" class="blob-code blob-code-inner js-file-line"> pindf <span class="pl-k">=</span> <span class="pl-c1">list</span>(sum2_dfs[i][<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L298" class="blob-num js-line-number" data-line-number="298"></td> - <td id="LC298" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> print(pindf)</span></td> - </tr> - <tr> - <td id="L299" class="blob-num js-line-number" data-line-number="299"></td> - <td id="LC299" class="blob-code blob-code-inner js-file-line"> <span 
class="pl-k">for</span> p <span class="pl-k">in</span> phyList:</td> - </tr> - <tr> - <td id="L300" class="blob-num js-line-number" data-line-number="300"></td> - <td id="LC300" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">if</span> p <span class="pl-k">in</span> pindf:</td> - </tr> - <tr> - <td id="L301" class="blob-num js-line-number" data-line-number="301"></td> - <td id="LC301" class="blob-code blob-code-inner js-file-line"> df <span class="pl-k">=</span> sum2_dfs[i]</td> - </tr> - <tr> - <td id="L302" class="blob-num js-line-number" data-line-number="302"></td> - <td id="LC302" class="blob-code blob-code-inner js-file-line"> w <span class="pl-k">=</span> df.loc[df[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>] <span class="pl-k">==</span> p, <span class="pl-s"><span class="pl-pds">'</span>w<span class="pl-pds">'</span></span>].iloc[<span class="pl-c1">0</span>]</td> - </tr> - <tr> - <td id="L303" class="blob-num js-line-number" data-line-number="303"></td> - <td id="LC303" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">else</span>:</td> - </tr> - <tr> - <td id="L304" class="blob-num js-line-number" data-line-number="304"></td> - <td id="LC304" class="blob-code blob-code-inner js-file-line"> w <span class="pl-k">=</span> <span class="pl-c1">0</span></td> - </tr> - <tr> - <td id="L305" class="blob-num js-line-number" data-line-number="305"></td> - <td id="LC305" class="blob-code blob-code-inner js-file-line"> wList.append(w)</td> - </tr> - <tr> - <td id="L306" class="blob-num js-line-number" data-line-number="306"></td> - <td id="LC306" class="blob-code blob-code-inner js-file-line"> composite_sum2_df[nameList[i]] <span class="pl-k">=</span> wList</td> - </tr> - <tr> - <td id="L307" class="blob-num js-line-number" data-line-number="307"></td> - <td id="LC307" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span 
class="pl-c">#</span>print(composite_sum2_df)</span></td> - </tr> - <tr> - <td id="L308" class="blob-num js-line-number" data-line-number="308"></td> - <td id="LC308" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>composite_sum2_df.to_csv('composite.csv')</span></td> - </tr> - <tr> - <td id="L309" class="blob-num js-line-number" data-line-number="309"></td> - <td id="LC309" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">return</span> composite_sum2_df</td> - </tr> - <tr> - <td id="L310" class="blob-num js-line-number" data-line-number="310"></td> - <td id="LC310" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L311" class="blob-num js-line-number" data-line-number="311"></td> - <td id="LC311" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L312" class="blob-num js-line-number" data-line-number="312"></td> - <td id="LC312" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">doMultiBarChart</span>(<span class="pl-smi">tdict</span>, <span class="pl-smi">composite_df</span>): <span class="pl-c"><span class="pl-c">#</span>array of multiple sum2_dfs</span></td> - </tr> - <tr> - <td id="L313" class="blob-num js-line-number" data-line-number="313"></td> - <td id="LC313" class="blob-code blob-code-inner js-file-line"> labelList <span class="pl-k">=</span> composite_df.columns.tolist()</td> - </tr> - <tr> - <td id="L314" class="blob-num js-line-number" data-line-number="314"></td> - <td id="LC314" class="blob-code blob-code-inner js-file-line"> sampnum <span class="pl-k">=</span> <span class="pl-c1">len</span>(labelList)<span class="pl-k">-</span><span class="pl-c1">1</span></td> - </tr> - <tr> - <td id="L315" class="blob-num js-line-number" data-line-number="315"></td> - <td id="LC315" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> need to arrange 
bars</span></td> - </tr> - <tr> - <td id="L316" class="blob-num js-line-number" data-line-number="316"></td> - <td id="LC316" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> number of phylotype = len(composite_df)</span></td> - </tr> - <tr> - <td id="L317" class="blob-num js-line-number" data-line-number="317"></td> - <td id="LC317" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span>number of bars = (len(labelist)-1) +1 for space</span></td> - </tr> - <tr> - <td id="L318" class="blob-num js-line-number" data-line-number="318"></td> - <td id="LC318" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> ytick needs to ne</span></td> - </tr> - <tr> - <td id="L319" class="blob-num js-line-number" data-line-number="319"></td> - <td id="LC319" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L320" class="blob-num js-line-number" data-line-number="320"></td> - <td id="LC320" class="blob-code blob-code-inner js-file-line"> cmap <span class="pl-k">=</span> plt.cm.get_cmap(<span class="pl-s"><span class="pl-pds">'</span>tab10<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L321" class="blob-num js-line-number" data-line-number="321"></td> - <td id="LC321" class="blob-code blob-code-inner js-file-line"> palette <span class="pl-k">=</span> [cmap(i) <span class="pl-k">for</span> i <span class="pl-k">in</span> <span class="pl-c1">range</span>(cmap.N)]</td> - </tr> - <tr> - <td id="L322" class="blob-num js-line-number" data-line-number="322"></td> - <td id="LC322" class="blob-code blob-code-inner js-file-line"> title <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>Legend: Variant Antigen Profile of a $\itTrypanosoma$ $\itvivax$ transcriptomes. 
<span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L323" class="blob-num js-line-number" data-line-number="323"></td> - <td id="LC323" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Phylotype abundance is expressed as phylotype frequencies adjusted <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L324" class="blob-num js-line-number" data-line-number="324"></td> - <td id="LC324" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>for combined transcript abundance. <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L325" class="blob-num js-line-number" data-line-number="325"></td> - <td id="LC325" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Data was produced with VAPPER-Variant Antigen Profiler (Silva Pereira et al., 2019).<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L326" class="blob-num js-line-number" data-line-number="326"></td> - <td id="LC326" class="blob-code blob-code-inner js-file-line"> width <span class="pl-k">=</span> <span class="pl-c1">0.6</span></td> - </tr> - <tr> - <td id="L327" class="blob-num js-line-number" data-line-number="327"></td> - <td id="LC327" class="blob-code blob-code-inner js-file-line"> ind <span class="pl-k">=</span> np.arange(width<span class="pl-k">*</span>sampnum<span class="pl-k">/</span><span class="pl-c1">2</span>, <span class="pl-c1">len</span>(composite_df)<span class="pl-k">*</span>width<span class="pl-k">*</span>(sampnum<span class="pl-k">+</span><span class="pl-c1">1</span>), width<span class="pl-k">*</span>(sampnum<span class="pl-k">+</span><span class="pl-c1">1</span>))</td> - </tr> - <tr> - <td id="L328" class="blob-num js-line-number" data-line-number="328"></td> - <td id="LC328" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>print(ind)</span></td> - 
</tr> - <tr> - <td id="L329" class="blob-num js-line-number" data-line-number="329"></td> - <td id="LC329" class="blob-code blob-code-inner js-file-line"> ysize <span class="pl-k">=</span> <span class="pl-c1">len</span>(composite_df)<span class="pl-k">*</span><span class="pl-c1">0.4</span></td> - </tr> - <tr> - <td id="L330" class="blob-num js-line-number" data-line-number="330"></td> - <td id="LC330" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L331" class="blob-num js-line-number" data-line-number="331"></td> - <td id="LC331" class="blob-code blob-code-inner js-file-line"> fig, ax <span class="pl-k">=</span> plt.subplots(<span class="pl-v">figsize</span><span class="pl-k">=</span>(<span class="pl-c1">10</span>,ysize))</td> - </tr> - <tr> - <td id="L332" class="blob-num js-line-number" data-line-number="332"></td> - <td id="LC332" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L333" class="blob-num js-line-number" data-line-number="333"></td> - <td id="LC333" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L334" class="blob-num js-line-number" data-line-number="334"></td> - <td id="LC334" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">for</span> s <span class="pl-k">in</span> <span class="pl-c1">range</span>(<span class="pl-c1">1</span>, <span class="pl-c1">len</span>(labelList)):</td> - </tr> - <tr> - <td id="L335" class="blob-num js-line-number" data-line-number="335"></td> - <td id="LC335" class="blob-code blob-code-inner js-file-line"> ax.barh(ind, composite_df[labelList[s]], width, <span class="pl-v">color</span><span class="pl-k">=</span>palette[s], <span class="pl-v">label</span><span class="pl-k">=</span>labelList[s])</td> - </tr> - <tr> - <td id="L336" class="blob-num js-line-number" data-line-number="336"></td> - <td id="LC336" class="blob-code blob-code-inner js-file-line"> ind <span class="pl-k">=</span> ind <span 
class="pl-k">+</span> width</td> - </tr> - <tr> - <td id="L337" class="blob-num js-line-number" data-line-number="337"></td> - <td id="LC337" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L338" class="blob-num js-line-number" data-line-number="338"></td> - <td id="LC338" class="blob-code blob-code-inner js-file-line"> ax.set(<span class="pl-v">yticks</span><span class="pl-k">=</span>np.arange(width<span class="pl-k">*</span>(sampnum<span class="pl-k">+</span><span class="pl-c1">2</span>)<span class="pl-k">/</span><span class="pl-c1">2</span>, <span class="pl-c1">len</span>(composite_df)<span class="pl-k">*</span>width<span class="pl-k">*</span>(sampnum<span class="pl-k">+</span><span class="pl-c1">1</span>), width<span class="pl-k">*</span>(sampnum<span class="pl-k">+</span><span class="pl-c1">1</span>)), <span class="pl-v">yticklabels</span><span class="pl-k">=</span>composite_df[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>]) <span class="pl-c"><span class="pl-c">#</span> , ylim=[(len(labelList)-1) * width - 1, len(composite_df)])</span></td> - </tr> - <tr> - <td id="L339" class="blob-num js-line-number" data-line-number="339"></td> - <td id="LC339" class="blob-code blob-code-inner js-file-line"> ax.legend()</td> - </tr> - <tr> - <td id="L340" class="blob-num js-line-number" data-line-number="340"></td> - <td id="LC340" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L341" class="blob-num js-line-number" data-line-number="341"></td> - <td id="LC341" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L342" class="blob-num js-line-number" data-line-number="342"></td> - <td id="LC342" class="blob-code blob-code-inner js-file-line"> ax.set_ylabel(<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L343" class="blob-num js-line-number" 
data-line-number="343"></td> - <td id="LC343" class="blob-code blob-code-inner js-file-line"> ax.invert_yaxis() <span class="pl-c"><span class="pl-c">#</span> labels read top-to-bottom</span></td> - </tr> - <tr> - <td id="L344" class="blob-num js-line-number" data-line-number="344"></td> - <td id="LC344" class="blob-code blob-code-inner js-file-line"> ax.set_xlabel(<span class="pl-s"><span class="pl-pds">'</span>Weighted Phylotype Frequency<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L345" class="blob-num js-line-number" data-line-number="345"></td> - <td id="LC345" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L346" class="blob-num js-line-number" data-line-number="346"></td> - <td id="LC346" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> plt.text(-0.3, -0.15, title, va="top", wrap="True")</span></td> - </tr> - <tr> - <td id="L347" class="blob-num js-line-number" data-line-number="347"></td> - <td id="LC347" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>plt.tight_layout()</span></td> - </tr> - <tr> - <td id="L348" class="blob-num js-line-number" data-line-number="348"></td> - <td id="LC348" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L349" class="blob-num js-line-number" data-line-number="349"></td> - <td id="LC349" class="blob-code blob-code-inner js-file-line"> plt.subplots_adjust(<span class="pl-v">bottom</span><span class="pl-k">=</span><span class="pl-c1">0.1</span>, <span class="pl-v">top</span><span class="pl-k">=</span><span class="pl-c1">0.92</span>, <span class="pl-v">left</span><span class="pl-k">=</span><span class="pl-c1">0.15</span>, <span class="pl-v">right</span><span class="pl-k">=</span><span class="pl-c1">0.9</span>)</td> - </tr> - <tr> - <td id="L350" class="blob-num js-line-number" data-line-number="350"></td> - <td id="LC350" class="blob-code 
blob-code-inner js-file-line"> ax.set_title(title, <span class="pl-v">x</span><span class="pl-k">=</span><span class="pl-c1">0</span>, <span class="pl-v">wrap</span><span class="pl-k">=</span><span class="pl-s"><span class="pl-pds">'</span>True<span class="pl-pds">'</span></span>,<span class="pl-v">ha</span><span class="pl-k">=</span><span class="pl-s"><span class="pl-pds">'</span>left<span class="pl-pds">'</span></span>,)</td> - </tr> - <tr> - <td id="L351" class="blob-num js-line-number" data-line-number="351"></td> - <td id="LC351" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L352" class="blob-num js-line-number" data-line-number="352"></td> - <td id="LC352" class="blob-code blob-code-inner js-file-line"> plt.savefig(tdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>] <span class="pl-k">+</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_phylotypes.png<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L353" class="blob-num js-line-number" data-line-number="353"></td> - <td id="LC353" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">if</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>pdf<span class="pl-pds">'</span></span>] <span class="pl-k">==</span> <span class="pl-s"><span class="pl-pds">'</span>PDF_Yes<span class="pl-pds">'</span></span>:</td> - </tr> - <tr> - <td id="L354" class="blob-num js-line-number" data-line-number="354"></td> - <td id="LC354" class="blob-code blob-code-inner js-file-line"> plt.savefig(tdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>] <span class="pl-k">+</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span 
class="pl-pds">"</span>phylotypes.pdf<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L355" class="blob-num js-line-number" data-line-number="355"></td> - <td id="LC355" class="blob-code blob-code-inner js-file-line"> plt.show()</td> - </tr> - <tr> - <td id="L356" class="blob-num js-line-number" data-line-number="356"></td> - <td id="LC356" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">pass</span></td> - </tr> - <tr> - <td id="L357" class="blob-num js-line-number" data-line-number="357"></td> - <td id="LC357" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L358" class="blob-num js-line-number" data-line-number="358"></td> - <td id="LC358" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L359" class="blob-num js-line-number" data-line-number="359"></td> - <td id="LC359" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L360" class="blob-num js-line-number" data-line-number="360"></td> - <td id="LC360" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">doBarChart</span>(<span class="pl-smi">tdict</span>, <span class="pl-smi">sum2_df</span>):</td> - </tr> - <tr> - <td id="L361" class="blob-num js-line-number" data-line-number="361"></td> - <td id="LC361" class="blob-code blob-code-inner js-file-line"> cmap <span class="pl-k">=</span> plt.cm.get_cmap(<span class="pl-s"><span class="pl-pds">'</span>tab20<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L362" class="blob-num js-line-number" data-line-number="362"></td> - <td id="LC362" class="blob-code blob-code-inner js-file-line"> palette <span class="pl-k">=</span> [cmap(i) <span class="pl-k">for</span> i <span class="pl-k">in</span> <span class="pl-c1">range</span>(cmap.N)]</td> - </tr> - <tr> - <td id="L363" class="blob-num js-line-number" data-line-number="363"></td> - <td id="LC363" class="blob-code blob-code-inner 
js-file-line"> title <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">"</span>Legend: Variant Antigen Profile of a $\itTrypanosoma$ $\itvivax$ transcriptome. <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L364" class="blob-num js-line-number" data-line-number="364"></td> - <td id="LC364" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Phylotype abundance is expressed as phylotype frequencies adjusted <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L365" class="blob-num js-line-number" data-line-number="365"></td> - <td id="LC365" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>for combined transcript abundance. <span class="pl-pds">"</span></span> \</td> - </tr> - <tr> - <td id="L366" class="blob-num js-line-number" data-line-number="366"></td> - <td id="LC366" class="blob-code blob-code-inner js-file-line"> <span class="pl-s"><span class="pl-pds">"</span>Data was produced with VAPPER-Variant Antigen Profiler (Silva Pereira et al., 2019).<span class="pl-pds">"</span></span></td> - </tr> - <tr> - <td id="L367" class="blob-num js-line-number" data-line-number="367"></td> - <td id="LC367" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> get a list of phylotype, create equivalent of saccver, get a list of</span></td> - </tr> - <tr> - <td id="L368" class="blob-num js-line-number" data-line-number="368"></td> - <td id="LC368" class="blob-code blob-code-inner js-file-line"> maxFPKM <span class="pl-k">=</span> sum2_df[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>].max()</td> - </tr> - <tr> - <td id="L369" class="blob-num js-line-number" data-line-number="369"></td> - <td id="LC369" class="blob-code blob-code-inner js-file-line"> total <span class="pl-k">=</span> sum2_df[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span 
class="pl-pds">'</span></span>].sum()</td> - </tr> - <tr> - <td id="L370" class="blob-num js-line-number" data-line-number="370"></td> - <td id="LC370" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L371" class="blob-num js-line-number" data-line-number="371"></td> - <td id="LC371" class="blob-code blob-code-inner js-file-line"> sum2_df[<span class="pl-s"><span class="pl-pds">'</span>Normalised<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> sum2_df.apply(<span class="pl-k">lambda</span> <span class="pl-smi">row</span>: normalisef(row[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>], maxFPKM),<span class="pl-v">axis</span><span class="pl-k">=</span><span class="pl-c1">1</span>)</td> - </tr> - <tr> - <td id="L372" class="blob-num js-line-number" data-line-number="372"></td> - <td id="LC372" class="blob-code blob-code-inner js-file-line"> sum2_df[<span class="pl-s"><span class="pl-pds">'</span>Weighted<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> sum2_df.apply(<span class="pl-k">lambda</span> <span class="pl-smi">row</span>: normalisef(row[<span class="pl-s"><span class="pl-pds">'</span>FPKM<span class="pl-pds">'</span></span>], total),<span class="pl-v">axis</span><span class="pl-k">=</span><span class="pl-c1">1</span>)</td> - </tr> - <tr> - <td id="L373" class="blob-num js-line-number" data-line-number="373"></td> - <td id="LC373" class="blob-code blob-code-inner js-file-line"> pList <span class="pl-k">=</span> sum2_df[<span class="pl-s"><span class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L374" class="blob-num js-line-number" data-line-number="374"></td> - <td id="LC374" class="blob-code blob-code-inner js-file-line"> phList <span class="pl-k">=</span> []</td> - </tr> - <tr> - <td id="L375" class="blob-num js-line-number" data-line-number="375"></td> - <td id="LC375" class="blob-code blob-code-inner 
js-file-line"> <span class="pl-k">for</span> p <span class="pl-k">in</span> pList:</td> - </tr> - <tr> - <td id="L376" class="blob-num js-line-number" data-line-number="376"></td> - <td id="LC376" class="blob-code blob-code-inner js-file-line"> phList.append(<span class="pl-c1">str</span>(p))</td> - </tr> - <tr> - <td id="L377" class="blob-num js-line-number" data-line-number="377"></td> - <td id="LC377" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L378" class="blob-num js-line-number" data-line-number="378"></td> - <td id="LC378" class="blob-code blob-code-inner js-file-line"> fList <span class="pl-k">=</span> sum2_df[<span class="pl-s"><span class="pl-pds">'</span>Weighted<span class="pl-pds">'</span></span>]</td> - </tr> - <tr> - <td id="L379" class="blob-num js-line-number" data-line-number="379"></td> - <td id="LC379" class="blob-code blob-code-inner js-file-line"> ysize <span class="pl-k">=</span> <span class="pl-c1">len</span>(phList)<span class="pl-k">*</span><span class="pl-c1">0.3</span></td> - </tr> - <tr> - <td id="L380" class="blob-num js-line-number" data-line-number="380"></td> - <td id="LC380" class="blob-code blob-code-inner js-file-line"> fig, ax <span class="pl-k">=</span> plt.subplots(<span class="pl-v">figsize</span><span class="pl-k">=</span>(<span class="pl-c1">10</span>,ysize))</td> - </tr> - <tr> - <td id="L381" class="blob-num js-line-number" data-line-number="381"></td> - <td id="LC381" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L382" class="blob-num js-line-number" data-line-number="382"></td> - <td id="LC382" class="blob-code blob-code-inner js-file-line"> ax.barh(phList, fList, <span class="pl-v">color</span><span class="pl-k">=</span>palette)</td> - </tr> - <tr> - <td id="L383" class="blob-num js-line-number" data-line-number="383"></td> - <td id="LC383" class="blob-code blob-code-inner js-file-line"> ax.set_ylabel(<span class="pl-s"><span 
class="pl-pds">'</span>Phylotype<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L384" class="blob-num js-line-number" data-line-number="384"></td> - <td id="LC384" class="blob-code blob-code-inner js-file-line"> ax.invert_yaxis() <span class="pl-c"><span class="pl-c">#</span> labels read top-to-bottom</span></td> - </tr> - <tr> - <td id="L385" class="blob-num js-line-number" data-line-number="385"></td> - <td id="LC385" class="blob-code blob-code-inner js-file-line"> ax.set_xlabel(<span class="pl-s"><span class="pl-pds">'</span>Weighted Phylotype Frequency<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L386" class="blob-num js-line-number" data-line-number="386"></td> - <td id="LC386" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L387" class="blob-num js-line-number" data-line-number="387"></td> - <td id="LC387" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> plt.text(-0.3, -0.15, title, va="top", wrap="True")</span></td> - </tr> - <tr> - <td id="L388" class="blob-num js-line-number" data-line-number="388"></td> - <td id="LC388" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span>plt.tight_layout()</span></td> - </tr> - <tr> - <td id="L389" class="blob-num js-line-number" data-line-number="389"></td> - <td id="LC389" class="blob-code blob-code-inner js-file-line"> plt.subplots_adjust(<span class="pl-v">bottom</span><span class="pl-k">=</span><span class="pl-c1">0.1</span>, <span class="pl-v">top</span><span class="pl-k">=</span><span class="pl-c1">0.9</span>, <span class="pl-v">left</span><span class="pl-k">=</span><span class="pl-c1">0.15</span>, <span class="pl-v">right</span><span class="pl-k">=</span><span class="pl-c1">0.9</span>)</td> - </tr> - <tr> - <td id="L390" class="blob-num js-line-number" data-line-number="390"></td> - <td id="LC390" class="blob-code blob-code-inner js-file-line"> 
ax.set_title(title, <span class="pl-v">x</span><span class="pl-k">=</span><span class="pl-c1">0</span>, <span class="pl-v">wrap</span><span class="pl-k">=</span><span class="pl-s"><span class="pl-pds">'</span>True<span class="pl-pds">'</span></span>,<span class="pl-v">ha</span><span class="pl-k">=</span><span class="pl-s"><span class="pl-pds">'</span>left<span class="pl-pds">'</span></span>,)</td> - </tr> - <tr> - <td id="L391" class="blob-num js-line-number" data-line-number="391"></td> - <td id="LC391" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L392" class="blob-num js-line-number" data-line-number="392"></td> - <td id="LC392" class="blob-code blob-code-inner js-file-line"> plt.savefig(tdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>] <span class="pl-k">+</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>_phylotypes.png<span class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L393" class="blob-num js-line-number" data-line-number="393"></td> - <td id="LC393" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">if</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>pdf<span class="pl-pds">'</span></span>] <span class="pl-k">==</span> <span class="pl-s"><span class="pl-pds">'</span>PDF_Yes<span class="pl-pds">'</span></span>:</td> - </tr> - <tr> - <td id="L394" class="blob-num js-line-number" data-line-number="394"></td> - <td id="LC394" class="blob-code blob-code-inner js-file-line"> plt.savefig(tdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>] <span class="pl-k">+</span> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]<span class="pl-k">+</span><span class="pl-s"><span class="pl-pds">"</span>phylotypes.pdf<span 
class="pl-pds">"</span></span>)</td> - </tr> - <tr> - <td id="L395" class="blob-num js-line-number" data-line-number="395"></td> - <td id="LC395" class="blob-code blob-code-inner js-file-line"> <span class="pl-c"><span class="pl-c">#</span> plt.show()</span></td> - </tr> - <tr> - <td id="L396" class="blob-num js-line-number" data-line-number="396"></td> - <td id="LC396" class="blob-code blob-code-inner js-file-line"> <span class="pl-k">pass</span></td> - </tr> - <tr> - <td id="L397" class="blob-num js-line-number" data-line-number="397"></td> - <td id="LC397" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L398" class="blob-num js-line-number" data-line-number="398"></td> - <td id="LC398" class="blob-code blob-code-inner js-file-line"><span class="pl-c"><span class="pl-c">#</span> argdict = {'name':2, 'pdfexport': 3, 'refFastq': 4, 'forward': 5, 'reverse': 6, 'html_file': 7, 'html_resource': 8}</span></td> - </tr> - <tr> - <td id="L399" class="blob-num js-line-number" data-line-number="399"></td> - <td id="LC399" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L400" class="blob-num js-line-number" data-line-number="400"></td> - <td id="LC400" class="blob-code blob-code-inner js-file-line"><span class="pl-k">def</span> <span class="pl-en">transcriptomicProcess</span>(<span class="pl-smi">args</span>,<span class="pl-smi">argdict</span>):</td> - </tr> - <tr> - <td id="L401" class="blob-num js-line-number" data-line-number="401"></td> - <td id="LC401" class="blob-code blob-code-inner js-file-line"> tdict <span class="pl-k">=</span> {}</td> - </tr> - <tr> - <td id="L402" class="blob-num js-line-number" data-line-number="402"></td> - <td id="LC402" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span class="pl-pds">'</span>name<span 
class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L403" class="blob-num js-line-number" data-line-number="403"></td> - <td id="LC403" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>refFastq<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span class="pl-pds">'</span>refFastq<span class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L404" class="blob-num js-line-number" data-line-number="404"></td> - <td id="LC404" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>forward<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span class="pl-pds">'</span>forward<span class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L405" class="blob-num js-line-number" data-line-number="405"></td> - <td id="LC405" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>reverse<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span class="pl-pds">'</span>reverse<span class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L406" class="blob-num js-line-number" data-line-number="406"></td> - <td id="LC406" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>vivax_trans_database<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> <span class="pl-s"><span class="pl-pds">'</span>data/vivax/Database/Phylotype_typeseqs.fas<span class="pl-pds">'</span></span></td> - </tr> - <tr> - <td id="L407" class="blob-num js-line-number" data-line-number="407"></td> - <td id="LC407" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>pdf<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span 
class="pl-pds">'</span>pdfexport<span class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L408" class="blob-num js-line-number" data-line-number="408"></td> - <td id="LC408" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>html_file<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span class="pl-pds">'</span>html_file<span class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L409" class="blob-num js-line-number" data-line-number="409"></td> - <td id="LC409" class="blob-code blob-code-inner js-file-line"> tdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>] <span class="pl-k">=</span> args[argdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>]]</td> - </tr> - <tr> - <td id="L410" class="blob-num js-line-number" data-line-number="410"></td> - <td id="LC410" class="blob-code blob-code-inner js-file-line"> </td> - </tr> - <tr> - <td id="L411" class="blob-num js-line-number" data-line-number="411"></td> - <td id="LC411" class="blob-code blob-code-inner js-file-line"> uploadUserReferenceFastq(tdict[<span class="pl-s"><span class="pl-pds">'</span>refFastq<span class="pl-pds">'</span></span>])</td> - </tr> - <tr> - <td id="L412" class="blob-num js-line-number" data-line-number="412"></td> - <td id="LC412" class="blob-code blob-code-inner js-file-line"> transcriptMapping(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>], tdict[<span class="pl-s"><span class="pl-pds">'</span>refFastq<span class="pl-pds">'</span></span>], tdict[<span class="pl-s"><span class="pl-pds">'</span>forward<span class="pl-pds">'</span></span>], tdict[<span class="pl-s"><span class="pl-pds">'</span>reverse<span class="pl-pds">'</span></span>]) <span class="pl-c"><span class="pl-c">#</span>uses bowtie</span></td> - </tr> - <tr> - <td 
id="L413" class="blob-num js-line-number" data-line-number="413"></td> - <td id="LC413" class="blob-code blob-code-inner js-file-line"> processSamFiles(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]) <span class="pl-c"><span class="pl-c">#</span>uses samtools</span></td> - </tr> - <tr> - <td id="L414" class="blob-num js-line-number" data-line-number="414"></td> - <td id="LC414" class="blob-code blob-code-inner js-file-line"> transcriptAbundance(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>]) <span class="pl-c"><span class="pl-c">#</span>uses cufflinks -> ?.cuff/*.*</span></td> - </tr> - <tr> - <td id="L415" class="blob-num js-line-number" data-line-number="415"></td> - <td id="LC415" class="blob-code blob-code-inner js-file-line"> transcriptsForBlast(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>], tdict[<span class="pl-s"><span class="pl-pds">'</span>refFastq<span class="pl-pds">'</span></span>]) <span class="pl-c"><span class="pl-c">#</span>creates name+4blast.fa</span></td> - </tr> - <tr> - <td id="L416" class="blob-num js-line-number" data-line-number="416"></td> - <td id="LC416" class="blob-code blob-code-inner js-file-line"> blastContigs(tdict[<span class="pl-s"><span class="pl-pds">'</span>name<span class="pl-pds">'</span></span>], tdict[<span class="pl-s"><span class="pl-pds">'</span>html_resource<span class="pl-pds">'</span></span>], <span class="pl-s"><span class="pl-pds">'</span>data/vivax/Database/Phylotype_typeseqs.fas<span class="pl-pds">'</span></span>)</td> - </tr> - <tr> - <td id="L417" class="blob-num js-line-number" data-line-number="417"></td> - <td id="LC417" class="blob-code blob-code-inner js-file-line"> sum_df, sum2_df <span class="pl-k">=</span> combineFPMK(tdict)</td> - </tr> - <tr> - <td id="L418" class="blob-num js-line-number" data-line-number="418"></td> - <td id="LC418" class="blob-code 
blob-code-inner js-file-line"> doBarChart(tdict, sum2_df)</td> - </tr> - <tr> - <td id="L419" class="blob-num js-line-number" data-line-number="419"></td> - <td id="LC419" class="blob-code blob-code-inner js-file-line"> createHTML(tdict, sum_df)</td> - </tr> - <tr> - <td id="L420" class="blob-num js-line-number" data-line-number="420"></td> - <td id="LC420" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L421" class="blob-num js-line-number" data-line-number="421"></td> - <td id="LC421" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L422" class="blob-num js-line-number" data-line-number="422"></td> - <td id="LC422" class="blob-code blob-code-inner js-file-line"><span class="pl-k">if</span> <span class="pl-c1">__name__</span> <span class="pl-k">==</span> <span class="pl-s"><span class="pl-pds">"</span>__main__<span class="pl-pds">"</span></span>:</td> - </tr> - <tr> - <td id="L423" class="blob-num js-line-number" data-line-number="423"></td> - <td id="LC423" class="blob-code blob-code-inner js-file-line"> <span class="pl-c1">exit</span>()</td> - </tr> - <tr> - <td id="L424" class="blob-num js-line-number" data-line-number="424"></td> - <td id="LC424" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> - <tr> - <td id="L425" class="blob-num js-line-number" data-line-number="425"></td> - <td id="LC425" class="blob-code blob-code-inner js-file-line"> -</td> - </tr> -</table> - - <details class="details-reset details-overlay BlobToolbar position-absolute js-file-line-actions dropdown d-none" aria-hidden="true"> - <summary class="btn-octicon ml-0 px-2 p-0 bg-white border border-gray-dark rounded-1" aria-label="Inline file action toolbar"> - <svg class="octicon octicon-kebab-horizontal" viewBox="0 0 13 16" version="1.1" width="13" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M1.5 9a1.5 1.5 0 1 0 0-3 1.5 1.5 0 0 0 0 3zm5 0a1.5 1.5 0 1 0 0-3 1.5 1.5 0 0 0 0 3zM13 7.5a1.5 1.5 0 1 1-3 0 
1.5 1.5 0 0 1 3 0z"/></svg> - </summary> - <details-menu> - <ul class="BlobToolbar-dropdown dropdown-menu dropdown-menu-se mt-2" style="width:185px"> - <li><clipboard-copy role="menuitem" class="dropdown-item" id="js-copy-lines" style="cursor:pointer;" data-original-text="Copy lines">Copy lines</clipboard-copy></li> - <li><clipboard-copy role="menuitem" class="dropdown-item" id="js-copy-permalink" style="cursor:pointer;" data-original-text="Copy permalink">Copy permalink</clipboard-copy></li> - <li><a class="dropdown-item js-update-url-with-hash" id="js-view-git-blame" role="menuitem" href="/johnheap/VAPPER-Galaxy/blame/a4e16d71fe985f389930c02f94354b87d3aabadb/Tryp_V_T.py">View git blame</a></li> - <li><a class="dropdown-item" id="js-new-issue" role="menuitem" href="/johnheap/VAPPER-Galaxy/issues/new">Reference in new issue</a></li> - </ul> - </details-menu> - </details> - - </div> - - </div> - - - - <details class="details-reset details-overlay details-overlay-dark"> - <summary data-hotkey="l" aria-label="Jump to line"></summary> - <details-dialog class="Box Box--overlay d-flex flex-column anim-fade-in fast linejump" aria-label="Jump to line"> - <!-- '"` --><!-- </textarea></xmp> --></option></form><form class="js-jump-to-line-form Box-body d-flex" action="" accept-charset="UTF-8" method="get"><input name="utf8" type="hidden" value="✓" /> - <input class="form-control flex-auto mr-3 linejump-input js-jump-to-line-field" type="text" placeholder="Jump to line…" aria-label="Jump to line" autofocus> - <button type="submit" class="btn" data-close-dialog>Go</button> -</form> </details-dialog> - </details> - - - - </div> - <div class="modal-backdrop js-touch-events"></div> -</div> - - </main> - </div> - - - </div> - - -<div class="footer container-lg width-full p-responsive" role="contentinfo"> - <div class="position-relative d-flex flex-row-reverse flex-lg-row flex-wrap flex-lg-nowrap flex-justify-center flex-lg-justify-between pt-6 pb-2 mt-6 f6 text-gray border-top 
border-gray-light "> - <ul class="list-style-none d-flex flex-wrap col-12 col-lg-5 flex-justify-center flex-lg-justify-between mb-2 mb-lg-0"> - <li class="mr-3 mr-lg-0">© 2019 <span title="0.75142s from unicorn-74746df85b-zvhqz">GitHub</span>, Inc.</li> - <li class="mr-3 mr-lg-0"><a data-ga-click="Footer, go to terms, text:terms" href="https://github.com/site/terms">Terms</a></li> - <li class="mr-3 mr-lg-0"><a data-ga-click="Footer, go to privacy, text:privacy" href="https://github.com/site/privacy">Privacy</a></li> - <li class="mr-3 mr-lg-0"><a data-ga-click="Footer, go to security, text:security" href="https://github.com/security">Security</a></li> - <li class="mr-3 mr-lg-0"><a href="https://githubstatus.com/" data-ga-click="Footer, go to status, text:status">Status</a></li> - <li><a data-ga-click="Footer, go to help, text:help" href="https://help.github.com">Help</a></li> - </ul> - - <a aria-label="Homepage" title="GitHub" class="footer-octicon d-none d-lg-block mx-lg-4" href="https://github.com"> - <svg height="24" class="octicon octicon-mark-github" viewBox="0 0 16 16" version="1.1" width="24" aria-hidden="true"><path fill-rule="evenodd" d="M8 0C3.58 0 0 3.58 0 8c0 3.54 2.29 6.53 5.47 7.59.4.07.55-.17.55-.38 0-.19-.01-.82-.01-1.49-2.01.37-2.53-.49-2.69-.94-.09-.23-.48-.94-.82-1.13-.28-.15-.68-.52-.01-.53.63-.01 1.08.58 1.23.82.72 1.21 1.87.87 2.33.66.07-.52.28-.87.51-1.07-1.78-.2-3.64-.89-3.64-3.95 0-.87.31-1.59.82-2.15-.08-.2-.36-1.02.08-2.12 0 0 .67-.21 2.2.82.64-.18 1.32-.27 2-.27.68 0 1.36.09 2 .27 1.53-1.04 2.2-.82 2.2-.82.44 1.1.16 1.92.08 2.12.51.56.82 1.27.82 2.15 0 3.07-1.87 3.75-3.65 3.95.29.25.54.73.54 1.48 0 1.07-.01 1.93-.01 2.2 0 .21.15.46.55.38A8.013 8.013 0 0 0 16 8c0-4.42-3.58-8-8-8z"/></svg> -</a> - <ul class="list-style-none d-flex flex-wrap col-12 col-lg-5 flex-justify-center flex-lg-justify-between mb-2 mb-lg-0"> - <li class="mr-3 mr-lg-0"><a data-ga-click="Footer, go to contact, text:contact" href="https://github.com/contact">Contact 
GitHub</a></li> - <li class="mr-3 mr-lg-0"><a href="https://github.com/pricing" data-ga-click="Footer, go to Pricing, text:Pricing">Pricing</a></li> - <li class="mr-3 mr-lg-0"><a href="https://developer.github.com" data-ga-click="Footer, go to api, text:api">API</a></li> - <li class="mr-3 mr-lg-0"><a href="https://training.github.com" data-ga-click="Footer, go to training, text:training">Training</a></li> - <li class="mr-3 mr-lg-0"><a href="https://github.blog" data-ga-click="Footer, go to blog, text:blog">Blog</a></li> - <li><a data-ga-click="Footer, go to about, text:about" href="https://github.com/about">About</a></li> - - </ul> - </div> - <div class="d-flex flex-justify-center pb-6"> - <span class="f6 text-gray-light"></span> - </div> -</div> - - - - <div id="ajax-error-message" class="ajax-error-message flash flash-error"> - <svg class="octicon octicon-alert" viewBox="0 0 16 16" version="1.1" width="16" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M8.893 1.5c-.183-.31-.52-.5-.887-.5s-.703.19-.886.5L.138 13.499a.98.98 0 0 0 0 1.001c.193.31.53.501.886.501h13.964c.367 0 .704-.19.877-.5a1.03 1.03 0 0 0 .01-1.002L8.893 1.5zm.133 11.497H6.987v-2.003h2.039v2.003zm0-3.004H6.987V5.987h2.039v4.006z"/></svg> - <button type="button" class="flash-close js-ajax-error-dismiss" aria-label="Dismiss error"> - <svg class="octicon octicon-x" viewBox="0 0 12 16" version="1.1" width="12" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M7.48 8l3.75 3.75-1.48 1.48L6 9.48l-3.75 3.75-1.48-1.48L4.52 8 .77 4.25l1.48-1.48L6 6.52l3.75-3.75 1.48 1.48L7.48 8z"/></svg> - </button> - You can’t perform that action at this time. 
- </div> - - - <script crossorigin="anonymous" integrity="sha512-EPrD+nddbyhpiLL8l3M8VfJpZr4J2EWQLaPXZ+6A3VDJKzS5HeZ3dkMVieHSdvIPHsMbWPyVlY42SWKoS4XTfA==" type="application/javascript" src="https://github.githubassets.com/assets/compat-bootstrap-831f12d4.js"></script> - <script crossorigin="anonymous" integrity="sha512-oFBEYscCdWEyvUQehaYyaCSiKtIN4UvpfFHNpIXLUTSQ35JcacPNj86R8fgJfI1e7BOjbLZPTv1nJg3TECiMLw==" type="application/javascript" src="https://github.githubassets.com/assets/frameworks-7af24171.js"></script> - - <script crossorigin="anonymous" async="async" integrity="sha512-b9BDH7EZq1yaR2fUH08I378zVkToScLiQ//L0gdyPviliuwpWiVFkB8uW0K8zZszdeLeBpib7wGBLkPiIFgyHg==" type="application/javascript" src="https://github.githubassets.com/assets/github-bootstrap-2a8c2b54.js"></script> - - - - <div class="js-stale-session-flash stale-session-flash flash flash-warn flash-banner" hidden - > - <svg class="octicon octicon-alert" viewBox="0 0 16 16" version="1.1" width="16" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M8.893 1.5c-.183-.31-.52-.5-.887-.5s-.703.19-.886.5L.138 13.499a.98.98 0 0 0 0 1.001c.193.31.53.501.886.501h13.964c.367 0 .704-.19.877-.5a1.03 1.03 0 0 0 .01-1.002L8.893 1.5zm.133 11.497H6.987v-2.003h2.039v2.003zm0-3.004H6.987V5.987h2.039v4.006z"/></svg> - <span class="signed-in-tab-flash">You signed in with another tab or window. <a href="">Reload</a> to refresh your session.</span> - <span class="signed-out-tab-flash">You signed out in another tab or window. 
<a href="">Reload</a> to refresh your session.</span> - </div> - <template id="site-details-dialog"> - <details class="details-reset details-overlay details-overlay-dark lh-default text-gray-dark hx_rsm" open> - <summary role="button" aria-label="Close dialog"></summary> - <details-dialog class="Box Box--overlay d-flex flex-column anim-fade-in fast hx_rsm-dialog hx_rsm-modal"> - <button class="Box-btn-octicon m-0 btn-octicon position-absolute right-0 top-0" type="button" aria-label="Close dialog" data-close-dialog> - <svg class="octicon octicon-x" viewBox="0 0 12 16" version="1.1" width="12" height="16" aria-hidden="true"><path fill-rule="evenodd" d="M7.48 8l3.75 3.75-1.48 1.48L6 9.48l-3.75 3.75-1.48-1.48L4.52 8 .77 4.25l1.48-1.48L6 6.52l3.75-3.75 1.48 1.48L7.48 8z"/></svg> - </button> - <div class="octocat-spinner my-6 js-details-dialog-spinner"></div> - </details-dialog> - </details> -</template> - - <div class="Popover js-hovercard-content position-absolute" style="display: none; outline: none;" tabindex="0"> - <div class="Popover-message Popover-message--bottom-left Popover-message--large Box box-shadow-large" style="width:360px;"> - </div> -</div> - - <div aria-live="polite" class="js-global-screen-reader-notice sr-only"></div> - - </body> -</html> - +""" +* Galaxy Version + + * Copyright 2019 University of Liverpool + * Author John Heap, Computational Biology Facility, UoL + * Based on original scripts of Sara Silva Silva Pereira, Institute of Infection and Global Health, UoL + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
+ * See the License for the specific language governing permissions and + * limitations under the License. + * + """ + + +import subprocess +import pandas as pd +import re +import os +import sys +import shutil +# import matplotlib as mpl +# mpl.use('Agg') +import matplotlib.pyplot as plt +import numpy as np + + + + +# copies the user provided Fasta file to data/reference/file/file.fasta +def uploadUserReferenceFastq(refFastq): + refBase = os.path.basename(refFastq) + ref = os.path.splitext(refBase)[0] # 'mydata/test.fasta' -> 'test' + dir_path = os.path.dirname(os.path.realpath(__file__)) # directory of this file + refDir = dir_path + "/data/Reference/" + ref #propose putting file in '/data/reference/ref/ + if not os.path.isdir(refDir): # if directory data/Reference/ref doesn't exist + os.mkdir(refDir) + refPath = refDir+"/" + shutil.copy(refFastq, refPath + refBase) #copy reference file into the directory + argString = "bowtie2-build " + refPath + refBase+" "+refPath+ref + print("Building the bowtie2 reference files.") + subprocess.call(argString, shell=True) + return + +def transcriptMapping(inputname, refFastq, forwardFN, reverseFN): + # where is our Reference data? 
+ refBase = os.path.basename(refFastq) + ref = os.path.splitext(refBase)[0] + dir_path = os.path.dirname(os.path.realpath(__file__)) + refDir = dir_path + "/data/Reference/" + ref + "/" + refName = refDir + ref + # now have reference file so we can proceed with the transcript mapping via bowtie2 + argString = "bowtie2 -x "+refName+" -1 "+forwardFN+" -2 "+reverseFN+" -S "+inputname+".sam" + print(argString) + subprocess.call(argString, shell=True) #outputs a name.sam file + return + + + +def processSamFiles(inputname): + cur_path = os.getcwd() + samName = cur_path+"/"+inputname + argString = "samtools view -bS "+inputname+".sam > "+samName+".bam" + print(argString) + subprocess.call(argString, shell=True) + + argString = "samtools sort "+samName+".bam -o "+samName+".sorted" + print("argstring = "+argString) + subprocess.call(argString, shell=True) + + argString = "samtools index "+samName+".sorted "+samName+".sorted.bai" + print("argstring = " + argString) + subprocess.call(argString, shell=True) + return #we have saved out the relevent name.bam, name.sorted and name.sorted.bai files + +# we will not have the .gtf file so call cufflinks without -G option +def transcriptAbundance(inputname): + argString = "cufflinks -o "+inputname+".cuff -u -p 8 "+inputname+".sorted" + subprocess.call(argString, shell = True) + os.remove(inputname+".sorted") #remove name.sorted + os.remove(inputname+".sorted.bai") + os.remove(inputname+".bam") + return + +def transcriptsForBlast(name, refFastq): + # quick and dirty just to see. 
+ refBase = os.path.basename(refFastq) + ref = os.path.splitext(refBase)[0] # 'mydata/test.fasta' -> 'test' + dir_path = os.path.dirname(os.path.realpath(__file__)) # directory of this file + refPath = dir_path + "/data/Reference/" + ref + "/" + refBase # eg refPath = data/Reference/Trinity/Trinity.fasta + # used for dirty # refPath = 'Trinity.fasta' # dirty one + track_df = pd.read_csv(name+'.cuff/genes.fpkm_tracking', sep='\t') + names = track_df['locus'] + # print(len(names)) + # print(names[:5]) + + nlist = [] + for n in range(0,len(names)): + i = names[n].find(':') + nlist.append(names[n][:i]) + nameset = set(nlist) #get unique. + with open(refPath, 'r') as myRef: + refData = myRef.read() + refData= refData+'\n>' + + with open(name + '_for_blast.fa', 'w') as outfile: + for trans_id in nameset: + namepos = refData.find(trans_id) + endpos = refData.find('>', namepos) + outfile.write('>'+refData[namepos:endpos]) + + pass + +def blastContigs(test_name,html_resource, database): + db_path = database + argString = "blastx -db "+db_path+" -query "+test_name+"_for_blast.fa -outfmt 10 -out "+test_name+"_blast.txt" + print(argString) + returncode = subprocess.call(argString, shell=True) + if returncode != 0: + return "Error in blastall" + blast_df = pd.read_csv(""+test_name+"_blast.txt") + blast_df.columns = ['qaccver', 'saccver', 'pident', 'length', 'mismatch', 'gapopen', 'qstart', 'qend', 'sstart', 'send', 'evalue','bitscore'] + blastResult_df = blast_df[(blast_df['pident']>=70) & (blast_df['length'] > 100) & (blast_df['evalue'] <=0.001) ] + blastResult_df = blastResult_df[['qaccver', 'saccver', 'pident', 'evalue', 'bitscore']] #query accession.version, subject accession.version, Percentage of identical matches + # need to allocate the transcripts (if allocated more than once to the phylotype with least error. 
+ transcripts = blastResult_df['qaccver'] + b_df = pd.DataFrame(columns=['qaccver', 'saccver', 'pident', 'evalue', 'bitscore']) + transSet = set(transcripts) + for t in transSet: + temp_df = blastResult_df[(blastResult_df['qaccver'] == t)] + # get one with smallest error value + #print(t + ":") + #print(temp_df) + temp_df = temp_df.sort_values(by=['evalue']) + b_df = b_df.append(temp_df.iloc[[0]]) + + b_df.sort_values(by=['qaccver']) + b_df.to_csv(test_name + '_transcript.csv') + return b_df + + +def createMultiHTML(tdict,composite_df): + labelList = composite_df.columns.tolist() + htmlString = r"<html><title>T.vivax VAP (Transcriptomic Pathway(</title><body><div style='text-align:center'><h2><i>Trypanosoma vivax</i> Variant Antigen Profile</h2><h3>" + htmlString += r"Sample name: "+tdict['name'] + htmlString += r"<br>Transcriptomic Analysis</h3></p>" + htmlString += "<p style = 'margin-left:20%; margin-right:20%'>Legend: " \ + "Variant Antigen Profile of a <i>Trypanosoma vivax</i> transcriptomes. " \ + "Weighted Frequency reflects Phylotype abundance and is expressed as " \ + "phylotype frequencies adjusted for the combined transcript abundance. 
" \ + "Data was produced with VAPPER-Variant Antigen Profiler " \ + "(Silva Pereira et al., 2019).</p> " + htmlString += r"<style> table, th, tr, td {border: 1px solid black; border-collapse: collapse;}</style>" + + header = r"<table style='width:50%;margin-left:25%;text-align:center'><tr><th>Phylotype</th>" + wLists = [] + + for j in range(1,len(labelList)): + wLists.append(composite_df[labelList[j]]) + header += r"<th>" + str(labelList[j]) + "</th>" + + htmlString += "</tr>\n" + header + tabString = "" + phyList = composite_df['Phylotype'] + + + + for i in range(0, len(composite_df)): + tabString += "<tr><td>" + str(phyList[i]) + "</td>" + for j in range(0,len(labelList)-1): + #print(j) + f = format(wLists[j][i], '.4f') + tabString += "<td>" + str(f) + "</td>" + tabString += "</tr>\n" + + htmlString += tabString + "</table><br><br><br><br><br>" + htmlString += r"<h3>Weighted Relative Frequencies of Detected Phylotypes.</h3>" + imgString = r"<img src = '"+ tdict['name']+"_phylotypes.png' alt='Bar chart of phylotype variation' style='max-width:100%'><br><br>" + htmlString += imgString + + with open(tdict['html_file'], "w") as htmlfile: + htmlfile.write(htmlString) + + +def createHTML(tdict,sum_df): + #assumes imgs are heatmap.png, dheatmap.png, vapPCA.png and already in htmlresource + htmlString = r"<html><title>T.vivax VAP (Transcriptomic Pathway(</title><body><div style='text-align:center'><h2><i>Trypanosoma vivax</i> Variant Antigen Profile</h2><h3>" + htmlString += r"Sample name: "+tdict['name'] + htmlString += r"<br>Transcriptomic Analysis</h3></p>" + htmlString += "<p style = 'margin-left:20%; margin-right:20%'>Legend: " \ + "Variant Antigen Profile of a <i>Trypanosoma vivax</i> transcriptome. " \ + "Weighted Frequency reflects Phylotype abundance and is expressed as " \ + "phylotype frequencies adjusted for the combined transcript abundance. 
" \ + "Data was produced with VAPPER-Variant Antigen Profiler " \ + "(Silva Pereira et al., 2019).</p> " + htmlString += r"<style> table, th, tr, td {border: 1px solid black; border-collapse: collapse;}</style>" + + htmlString += r"<table style='width:50%;table-layout: auto; margin-left:25%;text-align:center'><tr><th>Phylotype</th>" \ + r"<th>Combined FPKM</th><th>Weighted Frequency</th></tr>" + tabString = "" + # flush out table with correct values + phySeries = sum_df['Phylotype'] + # sacSeries = sum_df['saccver'] + fSeries = sum_df['FPKM'] + total = fSeries.sum() + # print("Total="+str(total)) + for i in range(0, len(sum_df)): + # print(phySeries[i]) + f = format(fSeries[i], '.2f') + w = format(fSeries[i]/total, '.2f') + + #w = format(weightList[i], '.4f') + + tabString += "<tr><td>" + str(phySeries[i]) + "</td><td>" + str(f) + "</td><td>"+str(w)+"</tr>" + htmlString += tabString + "</table><br><br><br><br><br>" + htmlString += r"<h3>Weighted Relative Frequencies of Detected Phylotypes.</h3>" + imgString = r"<img src = '"+ tdict['name']+"_phylotypes.png' alt='Bar chart of phylotype variation' style='max-width:100%'><br><br>" + htmlString += imgString + + with open(tdict['html_file'], "w") as htmlfile: + htmlfile.write(htmlString) + + + +def getPhyloNumber(sac): + i = sac.find('_') + return int(sac[1:i]) + +def combineFPMK(tdict): + fpkm_df = pd.read_csv(tdict['name']+'.cuff/genes.fpkm_tracking', sep='\t') + + #fpkm_df = pd.read_csv('genes.fpkm_tracking',sep='\t') + #print(fpkm_df.head()) + fpkm_df['locus'] = fpkm_df['locus'].apply(lambda names: names[:names.find(':')]) + #print(fpkm_df.head()) + reducedBlast_df = pd.read_csv(tdict['name']+'_transcript.csv') + # reducedBlast_df = pd.read_csv('TrinityVT_transcript.csv') + saccverSet = set(reducedBlast_df['saccver']) + saccverList = list(saccverSet) + saccverList.sort() + # print(saccverList[:5]) + new_df = pd.DataFrame(columns=['qaccver','saccver','FPKM']) + for sv in saccverList: + #print(sv) + temp_df = 
# NOTE(review): the commented lines below are the tail of a definition whose
# header lies before this part of the file (it ends with
# `return FPKMsum_df, FPKMsum2_df`). They are kept verbatim, one original
# line per comment line; the original indentation was lost in the source and
# is deliberately not reconstructed here.
#
#   reducedBlast_df[reducedBlast_df['saccver'] == sv]
#   qList = list(temp_df['qaccver'])
#   for q in qList:
#   f_df = fpkm_df[(fpkm_df['locus'] == q)]
#   if len(f_df) > 1:
#   print('WARNING MULTIPLE FPKM')
#   new_fpkm=list(f_df['FPKM'])
#   f = (new_fpkm[0])
#   # print(f)
#   new_df = new_df.append({'qaccver': q, 'saccver': sv, 'FPKM': f}, ignore_index=True)
#   FPKMsum_df = new_df.groupby('saccver')['FPKM'].sum().reset_index()
#
#   FPKMsum_df['Phylotype'] = FPKMsum_df.apply(lambda row: getPhyloNumber(row['saccver']), axis=1)
#   FPKMsum_df = FPKMsum_df.sort_values(by=['Phylotype'])
#   FPKMsum_df = FPKMsum_df.reset_index(drop=True)
#
#   # print(FPKMsum_df)
#   FPKMsum_df.to_csv('FPKM_sum.csv')
#   FPKMsum2_df = FPKMsum_df.groupby('Phylotype')['FPKM'].sum().reset_index()
#   FPKMsum2_df = FPKMsum2_df.sort_values(by=['Phylotype'])
#
#   # print(FPKMsum2_df)
#   FPKMsum2_df.to_csv('FPKM_sum2.csv') # in case more than one entry for a particular phylotype
#   return FPKMsum_df, FPKMsum2_df


def normalisef(f, max):
    """Return ``f`` divided by ``max``.

    Works on plain numbers and, because it is a bare division, on pandas
    Series as well (element-wise).

    The second parameter shadows the builtin ``max``; the name is kept so
    that existing callers are unaffected.
    """
    return f / max


def getComposite_sum2(nameList, sum2_dfs):
    """Merge several per-sample phylotype tables into one weight table.

    Parameters
    ----------
    nameList : sequence of str
        Column name to use for each sample; ``nameList[i]`` labels
        ``sum2_dfs[i]``.
    sum2_dfs : sequence of pandas.DataFrame
        One frame per sample, each with ``'Phylotype'`` and ``'FPKM'``
        columns.

    Returns
    -------
    pandas.DataFrame
        A ``'Phylotype'`` column holding the sorted union of all phylotypes,
        followed by one column per sample containing that sample's FPKM as a
        fraction of the sample's FPKM total (``0`` where the sample lacks the
        phylotype).

    Side effects
    ------------
    Each input frame gains (or has overwritten) a ``'w'`` column holding the
    per-row weight, exactly as before.
    """
    seen = set()
    for sample_df in sum2_dfs:
        total = sample_df['FPKM'].sum()
        # Vectorised division: unlike a row-wise apply(), this also yields a
        # Series for an empty frame, so the column assignment cannot fail.
        sample_df['w'] = normalisef(sample_df['FPKM'], total)
        seen.update(sample_df['Phylotype'])

    phyList = sorted(seen)
    composite_sum2_df = pd.DataFrame(phyList, columns=['Phylotype'])

    for i, sample_df in enumerate(sum2_dfs):
        # First occurrence wins if a phylotype is listed more than once,
        # matching the previous `.loc[...].iloc[0]` lookup.
        weightOf = {}
        for phylotype, weight in zip(sample_df['Phylotype'], sample_df['w']):
            weightOf.setdefault(phylotype, weight)
        composite_sum2_df[nameList[i]] = [weightOf.get(p, 0) for p in phyList]

    return composite_sum2_df


def _qualitativePalette(cmapName):
    """Return every colour of the named matplotlib colormap as a list."""
    # pyplot.get_cmap is available across matplotlib releases, whereas
    # matplotlib.cm.get_cmap was deprecated and later removed.
    cmap = plt.get_cmap(cmapName)
    return [cmap(i) for i in range(cmap.N)]


def _savePhylotypeFigure(tdict):
    """Save the current figure as PNG and, if requested, as PDF.

    Reads ``tdict['html_resource']`` (output path prefix), ``tdict['name']``
    and ``tdict['pdf']`` (a PDF is written only when it equals
    ``'PDF_Yes'``).
    """
    plt.savefig(tdict['html_resource'] + tdict['name'] + "_phylotypes.png")
    if tdict['pdf'] == 'PDF_Yes':
        # NOTE(review): unlike the PNG, this name has no underscore before
        # "phylotypes". Left unchanged because code outside this section may
        # refer to the file by this exact name -- confirm before renaming.
        plt.savefig(tdict['html_resource'] + tdict['name'] + "phylotypes.pdf")


def doMultiBarChart(tdict, composite_df):
    """Draw a grouped horizontal bar chart comparing several samples.

    Parameters
    ----------
    tdict : dict
        Must provide ``'html_resource'``, ``'name'`` and ``'pdf'``; see
        ``_savePhylotypeFigure``.
    composite_df : pandas.DataFrame
        First column ``'Phylotype'``, then one weight column per sample (the
        layout returned by ``getComposite_sum2``).

    Layout: every phylotype gets one group of bars, one bar per sample, and
    the groups are separated by a gap one bar wide. The figure is saved and
    then shown with ``plt.show()``.
    """
    labelList = composite_df.columns.tolist()
    sampnum = len(labelList) - 1  # first column is 'Phylotype', not a sample

    palette = _qualitativePalette('tab10')
    # Raw first fragment: "\i" is not a valid escape sequence in a normal
    # string literal; the resulting text is unchanged.
    title = r"Legend: Variant Antigen Profile of a $\itTrypanosoma$ $\itvivax$ transcriptomes. " \
            "Phylotype abundance is expressed as phylotype frequencies adjusted " \
            "for combined transcript abundance. " \
            "Data was produced with VAPPER-Variant Antigen Profiler (Silva Pereira et al., 2019)."

    width = 0.6
    groupStep = width * (sampnum + 1)  # sampnum bars plus one bar of spacing
    groupStop = len(composite_df) * width * (sampnum + 1)
    ind = np.arange(width * sampnum / 2, groupStop, groupStep)
    ysize = len(composite_df) * 0.4

    fig, ax = plt.subplots(figsize=(10, ysize))

    for s in range(1, len(labelList)):
        ax.barh(ind, composite_df[labelList[s]], width,
                # Wrap around so more samples than palette entries reuse
                # colours instead of raising IndexError.
                color=palette[s % len(palette)],
                label=labelList[s])
        ind = ind + width  # next sample's bars sit one bar-width further on

    ax.set(yticks=np.arange(width * (sampnum + 2) / 2, groupStop, groupStep),
           yticklabels=composite_df['Phylotype'])
    ax.legend()

    ax.set_ylabel('Phylotype')
    ax.invert_yaxis()  # labels read top-to-bottom
    ax.set_xlabel('Weighted Phylotype Frequency')

    plt.subplots_adjust(bottom=0.1, top=0.92, left=0.15, right=0.9)
    ax.set_title(title, x=0, wrap=True, ha='left')

    _savePhylotypeFigure(tdict)
    plt.show()


def doBarChart(tdict, sum2_df):
    """Draw a horizontal bar chart of weighted phylotype frequency.

    Parameters
    ----------
    tdict : dict
        Must provide ``'html_resource'``, ``'name'`` and ``'pdf'``; see
        ``_savePhylotypeFigure``.
    sum2_df : pandas.DataFrame
        Needs ``'Phylotype'`` and ``'FPKM'`` columns.

    Side effects
    ------------
    Adds two columns to ``sum2_df``: ``'Normalised'`` (FPKM divided by the
    largest FPKM) and ``'Weighted'`` (FPKM divided by the FPKM total). The
    chart plots ``'Weighted'`` and is saved to disk; it is not shown.
    """
    palette = _qualitativePalette('tab20')
    # Raw first fragment: "\i" is not a valid escape sequence in a normal
    # string literal; the resulting text is unchanged.
    title = r"Legend: Variant Antigen Profile of a $\itTrypanosoma$ $\itvivax$ transcriptome. " \
            "Phylotype abundance is expressed as phylotype frequencies adjusted " \
            "for combined transcript abundance. " \
            "Data was produced with VAPPER-Variant Antigen Profiler (Silva Pereira et al., 2019)."

    maxFPKM = sum2_df['FPKM'].max()
    total = sum2_df['FPKM'].sum()

    sum2_df['Normalised'] = normalisef(sum2_df['FPKM'], maxFPKM)
    sum2_df['Weighted'] = normalisef(sum2_df['FPKM'], total)

    # String labels make matplotlib treat the axis as categorical.
    phList = [str(p) for p in sum2_df['Phylotype']]
    fList = sum2_df['Weighted']

    ysize = len(phList) * 0.3
    fig, ax = plt.subplots(figsize=(10, ysize))

    ax.barh(phList, fList, color=palette)
    ax.set_ylabel('Phylotype')
    ax.invert_yaxis()  # labels read top-to-bottom
    ax.set_xlabel('Weighted Phylotype Frequency')

    plt.subplots_adjust(bottom=0.1, top=0.9, left=0.15, right=0.9)
    ax.set_title(title, x=0, wrap=True, ha='left')

    _savePhylotypeFigure(tdict)


def transcriptomicProcess(args, argdict):
    """Run the transcriptomic pipeline for one sample.

    Parameters
    ----------
    args : sequence
        Positional argument values (e.g. a command-line argument list).
    argdict : dict
        Maps option names to their index in ``args``. The keys read here are
        ``'name'``, ``'refFastq'``, ``'forward'``, ``'reverse'``,
        ``'pdfexport'``, ``'html_file'`` and ``'html_resource'``, e.g.
        ``{'name': 2, 'pdfexport': 3, 'refFastq': 4, 'forward': 5,
        'reverse': 6, 'html_file': 7, 'html_resource': 8}``.

    The steps are executed strictly in the order below; the trailing
    comments are the original author's notes on each step.
    """
    tdict = {
        'name': args[argdict['name']],
        'refFastq': args[argdict['refFastq']],
        'forward': args[argdict['forward']],
        'reverse': args[argdict['reverse']],
        'vivax_trans_database': 'data/vivax/Database/Phylotype_typeseqs.fas',
        'pdf': args[argdict['pdfexport']],
        'html_file': args[argdict['html_file']],
        'html_resource': args[argdict['html_resource']],
    }

    uploadUserReferenceFastq(tdict['refFastq'])
    transcriptMapping(tdict['name'], tdict['refFastq'],
                      tdict['forward'], tdict['reverse'])   # uses bowtie
    processSamFiles(tdict['name'])                          # uses samtools
    transcriptAbundance(tdict['name'])                      # uses cufflinks -> ?.cuff/*.*
    transcriptsForBlast(tdict['name'], tdict['refFastq'])   # creates name+4blast.fa
    # Reuse the path stored in tdict rather than repeating the literal.
    blastContigs(tdict['name'], tdict['html_resource'],
                 tdict['vivax_trans_database'])
    sum_df, sum2_df = combineFPMK(tdict)
    doBarChart(tdict, sum2_df)
    createHTML(tdict, sum_df)


if __name__ == "__main__":
    # This module is not meant to be run directly. Raising SystemExit does
    # the same as the interactive-only exit() helper without relying on the
    # `site` module having installed it.
    raise SystemExit