Mercurial > repos > jay > pdaug_addclasslabel
view PDAUG_Sequence_Network/PDAUG_Sequence_Network.py @ 8:b9659a0a327d draft
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit d396d7ff89705cc0dd626ed32c45a9f4029b1b05"
author | jay |
---|---|
date | Mon, 10 Jan 2022 05:04:27 +0000 |
parents | 2df11ea23f10 |
children |
line wrap: on
line source
import Levenshtein import matplotlib.pyplot as plt import networkx as nx import os def SeqSimilarityNetwork(InFile, OutFile): f = open(InFile) lines = f.readlines() record = [] seq = [] G = nx.Graph() for line in lines: if ">" in line: record.append(line.strip('\n')) else: seq.append(line.strip('\n')) for x, i in enumerate(seq): for X, I in enumerate(seq): L = Levenshtein.ratio(i, I ) if L >= 0.4: G.add_edge(record[x], record[X], weight=float(Levenshtein.ratio(i, I ))) elarge = [(u, v) for (u, v, d) in G.edges(data=True) if d['weight'] >= 0.4] pos = nx.spring_layout(G) nx.draw_networkx_nodes(G, pos, node_size=10) nx.draw_networkx_edges(G, pos, edgelist=elarge,width=1) plt.axis('off') plt.savefig(OutFile) if __name__=="__main__": import argparse parser = argparse.ArgumentParser() parser.add_argument("-I", "--InFile", required=True, default=None, help="Path to target tsv file") parser.add_argument("-O","--OutFile", required=False, help="HTML out file", default="out.png") args = parser.parse_args() SeqSimilarityNetwork(args.InFile, args.OutFile)