X-Git-Url: https://wannabe.guru.org/gitweb/?a=blobdiff_plain;f=list_utils.py;h=1141af2fe9b6bb8861dfd25c08dab735bfd4ceaf;hb=a9bdfd8fc9f84b7b2c09a57cd12ba32259e84d1c;hp=992f1ae4207228711c17573bb779cc0aaae2d0f8;hpb=5f75cf834725ac26b289cc5f157af0cb71cd5f0e;p=python_utils.git diff --git a/list_utils.py b/list_utils.py index 992f1ae..1141af2 100644 --- a/list_utils.py +++ b/list_utils.py @@ -1,8 +1,13 @@ #!/usr/bin/env python3 +# © Copyright 2021-2022, Scott Gasch + +"""Some useful(?) utilities for dealing with Lists.""" + +import random from collections import Counter -from itertools import islice -from typing import Any, Iterator, List, Mapping, Sequence, Tuple +from itertools import chain, combinations, islice +from typing import Any, Iterator, List, MutableSequence, Sequence, Tuple def shard(lst: List[Any], size: int) -> Iterator[Any]: @@ -65,7 +70,7 @@ def remove_list_if_one_element(lst: List[Any]) -> Any: return lst -def population_counts(lst: List[Any]) -> Mapping[Any, int]: +def population_counts(lst: Sequence[Any]) -> Counter: """ Return a population count mapping for the list (i.e. the keys are list items and the values are the number of occurrances of that @@ -197,12 +202,12 @@ def ngrams(lst: Sequence[Any], n): ['an', 'awesome', 'test'] """ for i in range(len(lst) - n + 1): - yield lst[i:i + n] + yield lst[i : i + n] -def permute(seq: Sequence[Any]): +def permute(seq: str): """ - Returns all permutations of a sequence; takes O(N^2) time. + Returns all permutations of a sequence; takes O(N!) time. >>> for x in permute('cat'): ... print(x) @@ -216,19 +221,45 @@ def permute(seq: Sequence[Any]): """ yield from _permute(seq, "") -def _permute(seq: Sequence[Any], path): - if len(seq) == 0: + +def _permute(seq: str, path: str): + seq_len = len(seq) + if seq_len == 0: yield path - for i in range(len(seq)): + for i in range(seq_len): car = seq[i] left = seq[0:i] - right = seq[i + 1:] + right = seq[i + 1 :] cdr = left + right yield from _permute(cdr, path + car) -def binary_search(lst: Sequence[Any], target:Any) -> Tuple[bool, int]: +def shuffle(seq: MutableSequence[Any]) -> MutableSequence[Any]: + """Shuffles a sequence into a random order. + + >>> random.seed(22) + >>> shuffle([1, 2, 3, 4, 5]) + [3, 4, 1, 5, 2] + + >>> shuffle('example') + 'empaelx' + + """ + if isinstance(seq, str): + import string_utils + + return string_utils.shuffle(seq) + else: + random.shuffle(seq) + return seq + + +def scramble(seq: MutableSequence[Any]) -> MutableSequence[Any]: + return shuffle(seq) + + +def binary_search(lst: Sequence[Any], target: Any, *, sanity_check=False) -> Tuple[bool, int]: """Performs a binary search on lst (which must already be sorted). Returns a Tuple composed of a bool which indicates whether the target was found and an int which indicates the index closest to @@ -247,7 +278,19 @@ def binary_search(lst: Sequence[Any], target:Any) -> Tuple[bool, int]: >>> binary_search(a, 2) (False, 1) + >>> a.append(9) + >>> binary_search(a, 4, sanity_check=True) + Traceback (most recent call last): + ... + AssertionError + """ + if sanity_check: + last = None + for x in lst: + if last is not None: + assert x >= last # This asserts iff the list isn't sorted + last = x # in ascending order. return _binary_search(lst, target, 0, len(lst) - 1) @@ -264,6 +307,24 @@ def _binary_search(lst: Sequence[Any], target: Any, low: int, high: int) -> Tupl return (False, low) +def powerset(lst: Sequence[Any]) -> Iterator[Sequence[Any]]: + """Returns the powerset of the items in the input sequence. + + >>> for x in powerset([1, 2, 3]): + ... print(x) + () + (1,) + (2,) + (3,) + (1, 2) + (1, 3) + (2, 3) + (1, 2, 3) + """ + return chain.from_iterable(combinations(lst, r) for r in range(len(lst) + 1)) + + if __name__ == '__main__': import doctest + doctest.testmod()