Mercurial > repos > jay > pdaug_basic_plots
view PDAUG_Peptide_Core_Descriptors/PDAUG_Peptide_Core_Descriptors.py @ 9:15b6eec94c40 draft default tip
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit d396d7ff89705cc0dd626ed32c45a9f4029b1b05"
author | jay |
---|---|
date | Wed, 12 Jan 2022 19:47:58 +0000 |
parents | 7d247e27ff11 |
children |
line wrap: on
line source
from modlamp.core import BaseDescriptor from modlamp.descriptors import PeptideDescriptor import pandas as pd import argparse, os parser = argparse.ArgumentParser() parser.add_argument("-I", "--InFile", required=True, default=None, help="Input file") parser.add_argument("-O", "--OutFile", required=True, default=None, help="Output file") parser.add_argument("-N", "--Ngrams", required=True, default=None, help="ngrams") args = parser.parse_args() file = open(args.InFile) lines = file.readlines() Index = [] Pep = [] for line in lines: if '>' in line: Index.append(line.strip('\n')) else: line = line.strip('\n') line = line.strip('\r') Pep.append(line) df = pd.DataFrame() for i, l in enumerate(Pep): D = PeptideDescriptor(l) D.count_ngrams([int(args.Ngrams)]) df1 = pd.DataFrame(D.descriptor, index=["sequence"+str(i),]) df = pd.concat([df, df1], axis=0) df = df.fillna(0) df.to_csv(args.OutFile, sep='\t', index=None)