Counts n-grams in the entire sequence set and fits their distribution to a power-law distribution (Zipf’s law)
python
powerlaw
quantiprot
% PDAUG toolset source repository; the medium is recorded in howpublished because @misc has no journal field.
@misc{PDAUGGITHUB,
  author       = {Joshi, Jayadev and Blankenberg, Daniel},
  title        = {{PDAUG} - a {Galaxy} based toolset for peptide library analysis, visualization, and machine learning modeling},
  howpublished = {GitHub repository},
  publisher    = {GitHub},
  year         = {2020},
  url          = {https://github.com/jaidevjoshi83/pdaug.git},
}
% Quantiprot journal article; proper nouns in the title are brace-protected against style recasing.
@article{konopka_marciniak_dyrka_2017,
  author  = {Konopka, Bogumił M. and Marciniak, Marta and Dyrka, Witold},
  title   = {{Quantiprot} - a {Python} package for quantitative analysis of protein sequences},
  journal = {BMC Bioinformatics},
  volume  = {18},
  number  = {1},
  year    = {2017},
  doi     = {10.1186/s12859-017-1751-4},
}