2016-03-07 22:20:48 +00:00
|
|
|
"""Helper methods for various modules."""
|
2024-03-08 15:36:11 +00:00
|
|
|
|
2021-03-17 20:46:07 +00:00
|
|
|
from __future__ import annotations
|
|
|
|
|
2018-03-10 03:38:51 +00:00
|
|
|
import asyncio
|
2022-02-04 22:45:25 +00:00
|
|
|
from collections.abc import Callable, Coroutine, Iterable, KeysView, Mapping
|
2018-07-23 08:24:39 +00:00
|
|
|
from datetime import datetime, timedelta
|
2021-11-15 17:18:57 +00:00
|
|
|
from functools import wraps
|
2015-01-18 05:55:33 +00:00
|
|
|
import random
|
2019-12-09 15:42:10 +00:00
|
|
|
import re
|
2015-01-18 05:55:33 +00:00
|
|
|
import string
|
2019-12-09 15:42:10 +00:00
|
|
|
import threading
|
2024-05-18 09:43:32 +00:00
|
|
|
from typing import Any
|
2016-07-23 18:07:08 +00:00
|
|
|
|
2018-12-17 06:51:13 +00:00
|
|
|
import slugify as unicode_slug
|
|
|
|
|
2016-04-16 07:55:35 +00:00
|
|
|
from .dt import as_local, utcnow
|
2015-04-29 02:12:05 +00:00
|
|
|
|
2019-07-30 23:59:12 +00:00
|
|
|
# Matches any fragment that makes a filename unsafe: "~", "..", "/" or "\".
RE_SANITIZE_FILENAME = re.compile(r"(~|\.\.|/|\\)")
|
|
|
|
# Matches "~" or any run of two or more consecutive dots in a path.
RE_SANITIZE_PATH = re.compile(r"(~|\.(\.)+)")
|
2013-12-07 20:54:19 +00:00
|
|
|
|
2013-11-11 00:46:48 +00:00
|
|
|
|
2021-01-26 14:53:21 +00:00
|
|
|
def raise_if_invalid_filename(filename: str) -> None:
    """Validate that a filename contains no unsafe fragment.

    Raises a ValueError if RE_SANITIZE_FILENAME matches anywhere in the
    filename.
    """
    # Every alternative of the pattern is non-empty, so "a match exists" is
    # the same condition as "stripping the matches would alter the string".
    if RE_SANITIZE_FILENAME.search(filename) is not None:
        raise ValueError(f"{filename} is not a safe filename")
|
|
|
|
|
|
|
|
|
|
|
|
def raise_if_invalid_path(path: str) -> None:
    """Validate that a path contains no unsafe fragment.

    Raises a ValueError if RE_SANITIZE_PATH matches anywhere in the path.
    """
    # Every alternative of the pattern is non-empty, so "a match exists" is
    # the same condition as "stripping the matches would alter the string".
    if RE_SANITIZE_PATH.search(path) is not None:
        raise ValueError(f"{path} is not a safe path")
|
|
|
|
|
|
|
|
|
2021-07-28 09:50:13 +00:00
|
|
|
def slugify(text: str | None, *, separator: str = "_") -> str:
    """Turn the given text into a slug.

    None and the empty string yield an empty string. Any other text is
    handed to unicode_slug.slugify together with the separator; if that
    produces an empty slug, "unknown" is returned instead.
    """
    if text is None or text == "":
        return ""

    slugged = unicode_slug.slugify(text, separator=separator)
    if slugged == "":
        return "unknown"
    return slugged
|
2014-01-20 03:10:40 +00:00
|
|
|
|
|
|
|
|
2016-07-23 18:07:08 +00:00
|
|
|
def repr_helper(inp: Any) -> str:
    """Build a readable string representation of an object.

    Mappings become comma separated "key=value" pairs, with keys and values
    rendered recursively. Datetimes are passed through as_local and rendered
    in ISO format. Anything else is converted with str().
    """
    if isinstance(inp, Mapping):
        pairs = [
            f"{repr_helper(name)}={repr_helper(value)}"
            for name, value in inp.items()
        ]
        return ", ".join(pairs)

    if isinstance(inp, datetime):
        localized = as_local(inp)
        return localized.isoformat()

    return str(inp)
|
2014-01-27 02:44:36 +00:00
|
|
|
|
|
|
|
|
2024-05-18 09:43:32 +00:00
|
|
|
def convert[_T, _U](
|
2022-03-17 17:52:38 +00:00
|
|
|
value: _T | None, to_type: Callable[[_T], _U], default: _U | None = None
|
|
|
|
) -> _U | None:
|
2016-03-07 22:20:48 +00:00
|
|
|
"""Convert value to to_type, returns default if fails."""
|
2014-03-16 22:00:59 +00:00
|
|
|
try:
|
2014-03-26 07:08:50 +00:00
|
|
|
return default if value is None else to_type(value)
|
2016-02-21 19:23:16 +00:00
|
|
|
except (ValueError, TypeError):
|
2014-03-16 22:00:59 +00:00
|
|
|
# If value could not be converted
|
|
|
|
return default
|
|
|
|
|
|
|
|
|
2019-07-30 23:59:12 +00:00
|
|
|
def ensure_unique_string(
    preferred_string: str, current_strings: Iterable[str] | KeysView[str]
) -> str:
    """Return a string that does not occur in current_strings.

    The preferred string is returned unchanged when it is free. Otherwise
    the suffixes _2, _3, .. are tried in order until an unused one is found.
    """
    taken = set(current_strings)
    if preferred_string not in taken:
        return preferred_string

    suffix = 2
    while (candidate := f"{preferred_string}_{suffix}") in taken:
        suffix += 1

    return candidate
|
2014-03-23 19:31:24 +00:00
|
|
|
|
|
|
|
|
2015-01-18 05:55:33 +00:00
|
|
|
# Taken from http://stackoverflow.com/a/23728630
def get_random_string(length: int = 10) -> str:
    """Build a random string of ASCII letters and digits.

    Characters are drawn one at a time with random.SystemRandom; length sets
    how many characters are produced.
    """
    alphabet = string.ascii_letters + string.digits
    picker = random.SystemRandom()
    chosen = [picker.choice(alphabet) for _ in range(length)]
    return "".join(chosen)
|
2015-01-18 05:55:33 +00:00
|
|
|
|
|
|
|
|
2018-07-20 08:45:20 +00:00
|
|
|
class Throttle:
    """Method decorator that enforces a cooldown between executions.

    Once the decorated method has run, it is not run again until more than
    `min_time` has elapsed since that run. A call made during the cooldown,
    or while another call currently holds the throttle lock, returns None
    instead (for async methods: a coroutine that returns None).

    Passing the keyword argument `no_throttle=True` to the decorated method
    skips the cooldown check for that call. The keyword is consumed by the
    decorator and is never forwarded to the method.

    When the optional `limit_no_throttle` interval is given, the method is
    first wrapped in an inner Throttle using that interval, so `no_throttle`
    calls are themselves limited by it.

    Throttle state (a lock and the time of the last run) is kept in a
    `_throttle` dict on the host: the bound instance, the first positional
    argument for methods, or the wrapper itself for plain functions.
    """

    def __init__(
        self, min_time: timedelta, limit_no_throttle: timedelta | None = None
    ) -> None:
        """Store the cooldown intervals."""
        self.limit_no_throttle = limit_no_throttle
        self.min_time = min_time

    def __call__(self, method: Callable) -> Callable:
        """Wrap method so that its executions are throttled."""
        # The stand-in returned for a throttled call has to match the
        # sync/async nature of the method so async callers can still await it.
        if asyncio.iscoroutinefunction(method):

            async def throttled_value() -> None:
                """Stand-in function for when real func is being throttled."""

        else:

            def throttled_value() -> None:  # type: ignore[misc]
                """Stand-in function for when real func is being throttled."""

        if self.limit_no_throttle is not None:
            method = Throttle(self.limit_no_throttle)(method)

        # The decorated object can be a plain function, an unbound function
        # defined on a class, or a bound method. Unbound class functions look
        # like plain functions, so the qualname is used to tell them apart:
        # anything defined on a class has a '.' after the class name, while
        # an inline function only has the '.<locals>.' prefix, which is
        # stripped before looking for a '.'.
        if hasattr(method, "__self__"):
            is_func = False
        else:
            is_func = "." not in method.__qualname__.rpartition(".<locals>.")[-1]

        @wraps(method)
        def wrapper(*args: Any, **kwargs: Any) -> Callable | Coroutine:
            """Run the wrapped method at most once per min_time.

            When the lock is already held the method is running, so the
            throttled stand-in is returned.
            """
            # Pick the object that carries the throttle state.
            if hasattr(method, "__self__"):
                host = method.__self__
            elif is_func or not args:
                host = wrapper
            else:
                host = args[0]

            if not hasattr(host, "_throttle"):
                host._throttle = {}  # noqa: SLF001
            registry = host._throttle  # noqa: SLF001

            # One [lock, last run time] entry per Throttle instance and host.
            key = id(self)
            if key not in registry:
                registry[key] = [threading.Lock(), None]
            state = registry[key]
            lock = state[0]

            if not lock.acquire(blocking=False):
                return throttled_value()

            # Run unconditionally when asked to, or when there was no run yet.
            no_throttle = kwargs.pop("no_throttle", False)
            force = no_throttle or not state[1]

            try:
                if not force and utcnow() - state[1] <= self.min_time:
                    return throttled_value()

                result = method(*args, **kwargs)
                state[1] = utcnow()
                return result  # type: ignore[no-any-return]
            finally:
                lock.release()

        return wrapper
|