#!/usr/bin/env python
# cardinal_pythonlib/maths_numpy.py

"""
===============================================================================

    Original code copyright (C) 2009-2022 Rudolf Cardinal (rudolf@pobox.com).

    This file is part of cardinal_pythonlib.

    Licensed under the Apache License, Version 2.0 (the "License");
    you may not use this file except in compliance with the License.
    You may obtain a copy of the License at

        https://www.apache.org/licenses/LICENSE-2.0

    Unless required by applicable law or agreed to in writing, software
    distributed under the License is distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    See the License for the specific language governing permissions and
    limitations under the License.

===============================================================================

**Miscellaneous mathematical functions that use NumPy** (which can be slow to
load).

"""

# =============================================================================
# Imports
# =============================================================================

from collections import Counter
import random
import sys
from typing import List, Optional, Union

import numpy as np  # pip install numpy

from cardinal_pythonlib.logs import get_brace_style_log_with_null_handler

log = get_brace_style_log_with_null_handler(__name__)


# =============================================================================
# Constants
# =============================================================================

# sys.float_info.max_10_exp:
#       largest integer x such that 10 ** x is representable as a float
# sys.float_info.max_exp:
#       largest integer x such that float(sys.float_info.radix) ** x is
#       representable as a float... and that's 2.0 ** x
# But what we want is the largest integer x such that e ** x = math.exp(x)
# is representable as a float, and that is:

MAX_E_EXPONENT = int(np.log(sys.float_info.max))  # typically, 709
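

# As a quick illustrative check (the helper below is an addition for
# demonstration, not part of the original module): np.exp() at MAX_E_EXPONENT
# is still finite, but one more unit overflows to inf (numpy emits a
# RuntimeWarning rather than raising, unlike math.exp).


def _demo_max_e_exponent() -> None:
    """
    Illustrative sketch only: the largest usable exponent for e ** x.
    """
    print(np.exp(MAX_E_EXPONENT))  # ~8.2e307, finite
    with np.errstate(over="ignore"):  # silence the overflow warning
        print(np.exp(MAX_E_EXPONENT + 1))  # inf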


# =============================================================================
# Softmax
# =============================================================================


def softmax(x: np.ndarray, b: float = 1.0) -> np.ndarray:
    r"""
    Standard softmax function:

    .. math::

        P_i = \frac {e ^ {\beta \cdot x_i}} {\sum_j {e ^ {\beta \cdot x_j}}}

    Args:
        x: vector (``numpy.array``) of values
        b: exploration parameter :math:`\beta`, or inverse temperature
           [Daw2009], or :math:`1/t`; see below

    Returns:
        vector of probabilities corresponding to the input values

    where:

    - :math:`t` is temperature (towards infinity: all actions equally likely;
      towards zero: probability of action with highest value tends to 1)
    - Temperature is not used directly as optimizers may take it to zero,
      giving an infinity; use inverse temperature instead.
    - [Daw2009] Daw ND, "Trial-by-trial data analysis using computational
      methods", 2009/2011; in "Decision Making, Affect, and Learning:
      Attention and Performance XXIII"; Delgado MR, Phelps EA, Robbins TW
      (eds), Oxford University Press.
    """
    n = len(x)
    if b == 0.0:
        # e^0 / sum(a bunch of e^0) = 1 / n
        return np.full(n, 1 / n)
    constant = np.mean(x)
    products = x * b - constant
    # ... softmax is invariant to addition of a constant: Daw article and
    # http://www.faqs.org/faqs/ai-faq/neural-nets/part2/section-12.html#b
    # noinspection PyUnresolvedReferences
    if products.max() > MAX_E_EXPONENT:
        log.warning(
            f"OVERFLOW in softmax(): x = {x}, b = {b}, constant = "
            f"{constant}, x*b - constant = {products}"
        )
        # map the maximum to 1, other things to zero
        index_of_max = np.argmax(products)
        answer = np.zeros(n)
        answer[index_of_max] = 1.0
        return answer
    # noinspection PyUnresolvedReferences
    exponented = np.exp(products)
    sum_exponented = np.sum(exponented)
    if sum_exponented == 0.0:
        # ... avoid division by zero
        return np.full(n, 1 / n)
    return exponented / sum_exponented
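

# A minimal usage sketch (this helper is an illustrative addition, not part
# of the original API): b = 0 yields a uniform distribution, and larger b
# concentrates probability on the largest value.


def _example_softmax() -> None:
    """
    Illustrative sketch only: the effect of the inverse temperature b.
    """
    x = np.array([1.0, 2.0, 3.0])
    print(softmax(x, b=0.0))  # [1/3, 1/3, 1/3]: uniform
    print(softmax(x, b=1.0))  # ~[0.090, 0.245, 0.665]
    print(softmax(x, b=10.0))  # ~[0, 0, 1]: near-deterministic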


def pick_from_probabilities(
    probabilities: Union[List[float], np.ndarray]
) -> int:
    """
    Given a list of probabilities like ``[0.1, 0.3, 0.6]``, returns the index
    of the probabilistically chosen item. In this example, we would return
    ``0`` with probability 0.1; ``1`` with probability 0.3; and ``2`` with
    probability 0.6.

    Args:
        probabilities: list of probabilities, which should sum to 1

    Returns:
        the index of the chosen option

    Raises:
        :exc:`ValueError` if a random number in the range [0, 1) is greater
        than or equal to the cumulative sum of the supplied probabilities
        (i.e. if you've specified probabilities adding up to less than 1)

    Does not object if you supply e.g. ``[1, 1, 1]``; it'll always pick the
    first in this example.
    """
    r = random.random()  # range [0.0, 1.0), i.e. 0 <= r < 1
    cs = np.cumsum(probabilities)  # e.g. [0.1, 0.4, 1] in this example
    for idx in range(len(cs)):
        if r < cs[idx]:
            return idx
    raise ValueError(
        f"Probabilities sum to <1: probabilities = {probabilities!r}, "
        f"cumulative sum = {cs!r}"
    )
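

# A sampling sketch (illustrative helper, not part of the original API): for
# large n, the empirical choice frequencies should approximate the supplied
# probabilities.


def _example_pick_from_probabilities(n: int = 10000) -> None:
    """
    Illustrative sketch only: tallies choices over n draws.
    """
    counts = Counter(
        pick_from_probabilities([0.1, 0.3, 0.6]) for _ in range(n)
    )
    for idx in sorted(counts):
        print(f"index {idx}: chosen {counts[idx] / n:.3f} of the time")
    # expected roughly: 0.100, 0.300, 0.600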


# =============================================================================
# Logistic
# =============================================================================


def logistic(
    x: Union[float, np.ndarray], k: float, theta: float
) -> Optional[Union[float, np.ndarray]]:
    r"""
    Standard logistic function.

    .. math::

        y = \frac {1} {1 + e^{-k (x - \theta)}}

    Args:
        x: :math:`x`
        k: :math:`k`
        theta: :math:`\theta`

    Returns:
        :math:`y`
    """
    # https://www.sharelatex.com/learn/List_of_Greek_letters_and_math_symbols
    if x is None or k is None or theta is None:
        return None
    # noinspection PyUnresolvedReferences
    return 1 / (1 + np.exp(-k * (x - theta)))
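

# Spot-value sketch (illustrative helper, not part of the original module):
# the logistic is 0.5 at x = theta, and k sets the steepness of the curve.


def _example_logistic() -> None:
    """
    Illustrative sketch only: a few spot values of the logistic function.
    """
    print(logistic(0.0, k=1.0, theta=0.0))  # 0.5: midpoint at x = theta
    print(logistic(2.0, k=1.0, theta=0.0))  # ~0.881
    print(logistic(2.0, k=5.0, theta=0.0))  # ~0.99995: steeper with larger k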


def inv_logistic(
    y: Union[float, np.ndarray], k: float, theta: float
) -> Optional[Union[float, np.ndarray]]:
    r"""
    Inverse standard logistic function:

    .. math::

        x = \frac {\ln \left( \frac {1} {y} - 1 \right)} {-k} + \theta

    Args:
        y: :math:`y`
        k: :math:`k`
        theta: :math:`\theta`

    Returns:
        :math:`x`
    """
    if y is None or k is None or theta is None:
        return None
    # noinspection PyUnresolvedReferences
    return (np.log((1 / y) - 1) / -k) + theta
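

# Round-trip sketch (illustrative helper, not part of the original module):
# for 0 < y < 1, inv_logistic inverts logistic given the same k and theta.


def _example_logistic_round_trip() -> None:
    """
    Illustrative sketch only: logistic then inv_logistic recovers x.
    """
    x = 1.5
    y = logistic(x, k=2.0, theta=0.5)  # ~0.881
    x_recovered = inv_logistic(y, k=2.0, theta=0.5)  # ~1.5
    print(x, y, x_recovered)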


# =============================================================================
# Testing
# =============================================================================


def _test_softmax() -> None:
    """
    Tests the :func:`softmax` function.
    """
    arrays = [
        [1, 1],
        [1, 1, 2],
        [1, 1, 1, 1, 1.01],
        [1, 2, 3, 4, 5],
        [1, 2, 3, 4, 1000],
        [1, 2, 3, 4, 5.0**400],
    ]
    betas = [0, 0.5, 1, 2, 10, 100]
    for x in arrays:
        for b in betas:
            y = softmax(np.array(x), b=b)
            print(f"softmax({x!r}, b={b}) -> {y}")


def _test_pick_from_probabilities() -> None:
    """
    Tests the :func:`pick_from_probabilities` function.
    """
    probabilities = [
        [0.0, 1.0],
        [0.1, 0.3, 0.6],
        [0.25, 0.25, 5],
        # [0.25],  # crashes (appropriately)
        [1, 1, 1],  # silly, but doesn't crash
    ]
    n_values = [10, 1000, 100000]
    for p in probabilities:
        for n in n_values:
            c = Counter()
            c.update(pick_from_probabilities(p) for _ in range(n))
            sc = sorted(c.items(), key=lambda kv: kv[0])
            print(f"_test_pick_from_probabilities: p = {p}, n = {n} -> {sc}")


if __name__ == "__main__":
    _test_softmax()
    _test_pick_from_probabilities()