Source code for sequana.misc

#
#  This file is part of Sequana software
#
#  Copyright (c) 2016-2022 - Sequana Development Team
#
#  Distributed under the terms of the 3-clause BSD license.
#  The full license is in the LICENSE file, distributed with this software.
#
#  website: https://github.com/sequana/sequana
#  documentation: http://sequana.readthedocs.io
#
##############################################################################
""".. rubric:: misc utilities"""
import glob
import os
import pathlib
import platform

import colorlog

from sequana.lazy import numpy as np

logger = colorlog.getLogger(__name__)


__all__ = ["textwrap", "wget", "findpos", "normpdf"]


[docs]def normpdf(x, mu, sigma): """Return the normal pdf evaluated at *x*; args provides *mu*, *sigma*" .. note:: same as scipy.stats.norm but implemented to avoid scipy dependency """ return 1.0 / (np.sqrt(2 * np.pi) * sigma) * np.exp(-0.5 * (1.0 / sigma * (x - mu)) ** 2)
[docs]def textwrap(text, width=80, indent=0): """Wrap a string with 80 characters :param text: input text :param width: (defaults to 80 characters) :param indent: possible indentation (0 by default) """ if indent == 0: indent = "" else: indent = " " * indent data = [indent + text[i * width : (i + 1) * width :] for i in range(len(text) // width + 1)] return "\n".join(data)
[docs]def wget(link, output): """Retrieve a file from internet. :param str link: a valid URL :param str output: the output filename .. warning:: no sanity check of any kind for now """ try: from urllib import urlretrieve except: from urllib.request import urlretrieve urlretrieve(link, filename=output)
[docs]def findpos(seq, chr): """Find position(s) of a substring into a longer string. Note that this function is a generator:: >>> list(findpos("AACCGGAAGGTT", "GG")) [4,8] """ N = len(chr) for i, dummy in enumerate(seq): if seq[i : i + N] == chr: yield i