Source code for multivar_horner.classes.horner_poly

import ctypes
import pickle
from pathlib import Path
from typing import Callable, Tuple, Type, TypeVar

import numpy as np

from multivar_horner import c_evaluation
from multivar_horner.c_evaluation import (
    COMPILED_C_ENDING,
    compile_c_file,
    get_compiler,
    write_c_file,
)
from multivar_horner.classes.abstract_poly import AbstractPolynomial
from multivar_horner.classes.factorisation import (
    BasePolynomialNode,
    HeuristicFactorisationRoot,
    OptimalFactorisationRoot,
)
from multivar_horner.classes.helpers import FactorContainer
from multivar_horner.global_settings import (
    BOOL_DTYPE,
    COMPLEX_DTYPE,
    FLOAT_DTYPE,
    PATH2CACHE,
    TYPE_1D_FLOAT,
    UINT_DTYPE,
)
from multivar_horner.helper_fcts import rectify_query_point, validate_query_point
from multivar_horner.helpers_fcts_numba import eval_recipe

T = TypeVar("T")


class HornerMultivarPolynomial(AbstractPolynomial):
    """a representation of a multivariate polynomial using Horner factorisation

    after computing the factorised representation of the polynomial,
    the instructions required for evaluation are being compiled and stored.
    The default format is C instructions.
    When there is no C compiler installed, the fallback option is encoding the required instructions
    in numpy arrays (here referred to as "recipes"),
    which can be processed by (``numba``) just in time compiled functions.

    Args:
        coefficients: ndarray of floats with shape (N,1) representing the coefficients of the monomials
            NOTE: coefficients with value 0 and 1 are allowed and will not affect the internal representation,
            because coefficients must be replaceable
        exponents: ndarray of unsigned integers with shape (N,m) representing the exponents of the monomials,
            where m is the number of dimensions (self.dim).
            the ordering corresponds to the ordering of the coefficients, every exponent row has to be unique!
        rectify_input: bool, default=False
            whether to convert coefficients and exponents into compatible numpy arrays.
            with this set to True, coefficients and exponents can be given in standard python arrays
        compute_representation: bool, default=False
            whether to compute a string representation of the polynomial
        verbose: bool, default=False
            whether to print status statements
        keep_tree: whether the factorisation tree object should be kept in memory after finishing factorisation
        store_c_instr: whether a C file with all required evaluation instructions should be created
            under any circumstances. By default the class will use C based evaluation,
            but skip it if no compiler (``gcc``/``cc``) is installed.
        store_numpy_recipe: whether a pickle file with all required evaluation instructions
            in the custom ``numpy+numba`` format should be created under any circumstances.
            By default the class will use C based evaluation and only use this evaluation format as a fallback.

    Attributes:
        num_monomials: the amount of coefficients/monomials N of the polynomial
        dim: the dimensionality m of the polynomial
            NOTE: the polynomial does not need to actually depend on all m dimensions
        unused_variables: the dimensions the polynomial does not depend on
        num_ops: the amount of mathematical operations required to evaluate the polynomial in this representation
        representation: a human readable string visualising the polynomial representation
        total_degree: the usual notion of degree for a polynomial.
            = the maximum sum of exponents in any of its monomials
            = the maximum l_1-norm of the exponent vectors of all monomials
            in contrast to 1D polynomials, different concepts of degrees exist for polynomials in multiple dimensions.
            following the naming in [1] L. Trefethen, "Multivariate polynomial approximation in the hypercube",
            Proceedings of the American Mathematical Society, vol. 145, no. 11, pp. 4837-4844, 2017.
        euclidean_degree: the maximum l_2-norm of the exponent vectors of all monomials.
            NOTE: this is not in general an integer
        maximal_degree: the largest exponent in any of its monomials
            = the maximum l_infinity-norm of the exponent vectors of all monomials
        factorisation: a tuple of factorisation_tree and factor_container, see below
        factorisation_tree: the object oriented, recursive data structure representing the factorisation
            (only if keep_tree=True)
        factor_container: the object containing all (unique) factors of the factorisation (only if keep_tree=True)
        root_value_idx: the index in the value array where the value of this polynomial
            (= root of the factorisation_tree) will be stored
        value_array_length: the amount of addresses (storage) required to evaluate the polynomial.
            for evaluating the polynomial in tree form intermediary results have to be stored in a value array.
            the value array begins with the coefficients of the polynomial.
            (without further optimisation) every factor requires its own address.
        copy_recipe: ndarray encoding the operations required to evaluate all scalar factors with exponent 1
        scalar_recipe: ndarray encoding the operations required to evaluate all remaining scalar factors
        monomial_recipe: ndarray encoding the operations required to evaluate all monomial factors
        tree_recipe: ndarray encoding the addresses required to evaluate the polynomial values
            of the factorisation_tree.
        tree_ops: ndarray encoding the type of operation required to evaluate the polynomial values
            of the factorisation_tree. encoded as a boolean ndarray separate from tree_recipe,
            since only the two operations ADD & MUL need to be encoded.

    Raises:
        TypeError: if coefficients or exponents are not given as ndarrays of the required dtype
        ValueError: if coefficients or exponents do not have the required shape
            or do not fulfill the other requirements
    """

    # __slots__ declared in parents are available in child classes. However, child subclasses will get a __dict__
    # and __weakref__ unless they also define __slots__ (which should only contain names of any additional slots).
    __slots__ = [
        "factorisation",
        "root_value_idx",
        "value_array_length",
        "keep_tree",
        "use_c_eval",
        "recipe",
        "_c_eval_fct",
        "ctype_x",
        "ctype_coeff",
        "root_class",
    ]
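
    # Usage sketch (illustrative, not part of the original module): constructing and evaluating
    # a polynomial as described in the argument documentation above. The concrete numbers are made up;
    # without rectify_input=True the arrays must already use the dtypes from global_settings
    # (FLOAT_DTYPE / UINT_DTYPE, imported at the top of this module).
    #
    #   import numpy as np
    #   from multivar_horner import HornerMultivarPolynomial
    #
    #   # p(x) = 5.0 + 1.0 x_1^3 x_2 + 2.0 x_1^2 x_3 + 3.0 x_1 x_2 x_3
    #   coefficients = [[5.0], [1.0], [2.0], [3.0]]              # shape (N, 1)
    #   exponents = [[0, 0, 0], [3, 1, 0], [2, 0, 1], [1, 1, 1]]  # shape (N, m)
    #   p = HornerMultivarPolynomial(
    #       coefficients, exponents, rectify_input=True, compute_representation=True
    #   )
    #   p_x = p.eval(np.array([-2.0, 3.0, 1.0]))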

    # FIXME: creates duplicate entries in Sphinx autodoc
    def __init__(
        self,
        coefficients,
        exponents,
        rectify_input: bool = False,
        compute_representation: bool = False,
        verbose: bool = False,
        keep_tree: bool = False,
        store_c_instr: bool = False,
        store_numpy_recipe: bool = False,
        *args,
        **kwargs,
    ):
        super().__init__(coefficients, exponents, rectify_input, compute_representation, verbose)

        self.root_class: Type = HeuristicFactorisationRoot
        self.keep_tree: bool = keep_tree
        self.value_array_length: int
        self.recipe: Tuple
        self._c_eval_fct: Callable

        double = c_evaluation.C_TYPE_DOUBLE
        self.ctype_x = double * self.dim
        self.ctype_coeff = double * self.num_monomials

        self._configure_evaluation(store_c_instr, store_numpy_recipe)
        self.compute_string_representation(*args, **kwargs)

        if not self.keep_tree:
            try:
                del self.factorisation
            except AttributeError:
                pass

    def _configure_evaluation(
        self,
        store_c_instr: bool = False,
        store_numpy_recipe: bool = False,
    ):
        self.use_c_eval: bool = True
        if store_c_instr:
            # force storing a C file
            self._compile_c_file()
        if store_numpy_recipe:
            # force storing the numpy+Numba recipe
            self._compile_recipes()
        if not (store_c_instr or store_numpy_recipe):
            # by default use the faster C evaluation -> compile a C file
            # if no compiler is installed this will raise a `ValueError`
            try:
                self._compile_c_file()
            except ValueError as exc:
                self.print(exc)
                # if C compilation does not work, use recipe (numpy+Numba based) evaluation as a fallback
                self.use_c_eval = False
                self._compile_recipes()

    def _compute_factorisation(self):
        # do not compute the factorisation when it is already present
        try:
            self.factorisation
            self.print("factorisation already exists.")
            return
        except AttributeError:
            pass
        self.print("computing factorisation...")
        # NOTE: do NOT automatically create all scalar factors with exponent 1
        # (they might be unused, since the polynomial might not actually depend on all variables)
        factor_container = FactorContainer()
        factorisation_tree: BasePolynomialNode = self.root_class(self.exponents, factor_container)
        self.root_value_idx = factorisation_tree.value_idx
        self.value_array_length = self.num_monomials + len(factor_container)
        self.factorisation: Tuple[BasePolynomialNode, FactorContainer] = (
            factorisation_tree,
            factor_container,
        )

    @property
    def factorisation_tree(self) -> BasePolynomialNode:
        return self.factorisation[0]

    @property
    def factor_container(self) -> FactorContainer:
        return self.factorisation[1]
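
    # Illustrative example (values made up): for
    #   p(x) = 5.0 + 1.0 x_1^3 x_2 + 2.0 x_1^2 x_3 + 3.0 x_1 x_2 x_3
    # a Horner factorisation found by recursively factoring out scalar factors could be
    #   p(x) = x_1 (x_1 (x_1 (1.0 x_2) + 2.0 x_3) + 3.0 x_2 x_3) + 5.0
    # The FactorContainer then holds the unique scalar and monomial factors (e.g. x_1, x_2, x_3, x_2 x_3)
    # appearing in this factorisation, and value_array_length = num_monomials + len(factor_container)
    # reserves one value array slot per coefficient and one per factor for intermediate results.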

    def compute_string_representation(
        self,
        coeff_fmt_str: str = "{:.2}",
        factor_fmt_str: str = "x_{dim}^{exp}",
        *args,
        **kwargs,
    ) -> str:
        repre = ""
        if not self.compute_representation:
            self.representation = repre
            return repre

        repre = f"[#ops={self.num_ops}] p(x)"
        try:
            tree = self.factorisation_tree
            repre += " = " + tree.get_string_representation(self.coefficients, coeff_fmt_str, factor_fmt_str)
            # exponentiations with exponent 1 do not cause an operation in this representation,
            # but appear in the string representation due to string formatting restrictions
            # -> they should not be displayed (misleading)
            repre = repre.replace("^1", "")  # <- workaround for the default string format
        except AttributeError:
            pass  # self.factorisation_tree does not exist
        self.representation = repre
        return self.representation
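
    # Illustrative output for the example polynomial sketched above (the exact operation count and
    # grouping depend on the factorisation found):
    #   "[#ops=10] p(x) = x_1 (x_1 (x_1 (1.0 x_2) + 2.0 x_3) + 3.0 x_2 x_3) + 5.0"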

    def _compile_recipes(self):
        """encode all instructions needed for evaluating the polynomial in 'recipes'

        recipes are represented as numpy ndarrays (cf. assembler instructions)
        -> acquire a data structure representing the factorisation tree
        -> avoid recursion and function call overhead during evaluation
        -> enables the use of jit compiled functions

        the factor container must now contain all unique factors used in the chosen factorisation

        during evaluation of a polynomial the values of all the factors are needed at least once
        -> compute the values of all factors once and store them
        -> store a pointer to the computed value for every factor ('value index' = address in the value array)
        this is required for compiling evaluation instructions depending on the factor values

        monomial factors exist only if their value is required during the evaluation of the parent polynomial
        scalar factors exist only if their value is required during the evaluation of existing monomial factors
        (scalar factors can be 'standalone' factors as well)
        -> values must not be overwritten (reusing addresses), because they might be needed again by another factor
        -> (without further optimisation) each factor requires its own space in the value array
        """
        # reuse pickled recipe if present
        try:
            self._load_recipe()
            return
        except ValueError:
            self.print("recipe does not exist yet.")

        # for compiling the recipes the factorisation must be computed first
        self._compute_factorisation()

        # the values of the factors are being stored after the coefficients
        # start the address assignment with the correct offset
        value_idx = self.num_monomials

        # compile the recipes for computing the value of all factors
        copy_recipe = []  # skip computing factors with exponent 1, just copy the x value
        scalar_recipe = []
        monomial_recipe = []

        self.num_ops = 0  # count the amount of multiplications encoded by the recipes
        # NOTE: count exponentiations as exponent-1 multiplications, e.g. x^3 <-> 2 operations

        # IMPORTANT: the value idx assignment must happen first for the scalar factors
        for scalar_factor in self.factor_container.scalar_factors:
            scalar_factor.value_idx = value_idx
            value_idx += 1
            copy_instr, scalar_instr = scalar_factor.get_recipe()
            copy_recipe += copy_instr
            scalar_recipe += scalar_instr
            if len(scalar_instr) > 0:
                exponent = scalar_instr[0][2]
                self.num_ops += exponent - 1

        for monomial_factor in self.factor_container.monomial_factors:
            monomial_factor.value_idx = value_idx
            value_idx += 1
            monomial_factor.factorisation_idxs = [f.value_idx for f in monomial_factor.scalar_factors]
            monomial_instr = monomial_factor.get_recipe()
            monomial_recipe += monomial_instr
            self.num_ops += 1  # every monomial instruction encodes one multiplication

        # compile the recipe for evaluating the Horner factorisation tree
        tree_recipe, tree_ops = self.factorisation_tree.get_recipe()

        # convert the recipes into the data types expected by the jit compiled functions and store them
        tree_ops = np.array(tree_ops, dtype=BOOL_DTYPE)
        self.num_ops += len(tree_ops) - np.count_nonzero(tree_ops)  # every 0/False encodes a multiplication
        copy_recipe = np.array(copy_recipe, dtype=UINT_DTYPE).reshape((-1, 2))
        scalar_recipe = np.array(scalar_recipe, dtype=UINT_DTYPE).reshape((-1, 3))
        monomial_recipe = np.array(monomial_recipe, dtype=UINT_DTYPE).reshape((-1, 3))
        tree_recipe = np.array(tree_recipe, dtype=UINT_DTYPE).reshape((-1, 2))
        # IMPORTANT: strict ordering required!
        self.recipe = (
            copy_recipe,
            scalar_recipe,
            monomial_recipe,
            tree_recipe,
            tree_ops,
        )
        self._pickle_recipe()

    def _pickle_recipe(self):
        path = self.recipe_file
        self.print(f'storing recipe in file "{path}"')
        pickle_obj = (
            self.recipe,
            self.num_ops,
            self.value_array_length,
            self.root_value_idx,
        )
        with open(path, "wb") as f:
            pickle.dump(pickle_obj, f)

    def _load_recipe(self):
        path = self.recipe_file
        if not path.exists():
            raise ValueError("recipe pickle file does not exist.")
        self.print(f'loading recipe from file "{path}"')
        with open(path, "rb") as f:
            pickle_obj = pickle.load(f)
        self.recipe, self.num_ops, self.value_array_length, self.root_value_idx = pickle_obj
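
    # Summary of the recipe data stored and pickled above (in this strict order):
    #   copy_recipe:     uint ndarray of shape (-1, 2), copy instructions for scalar factors with exponent 1
    #   scalar_recipe:   uint ndarray of shape (-1, 3), exponentiation instructions for the remaining scalar factors
    #   monomial_recipe: uint ndarray of shape (-1, 3), multiplication instructions for the monomial factors
    #   tree_recipe:     uint ndarray of shape (-1, 2), value array addresses for evaluating the factorisation tree
    #   tree_ops:        boolean ndarray; a False entry encodes a multiplication, a True entry an addition
    # the pickle additionally stores num_ops, value_array_length and root_value_idx,
    # so a reused recipe does not require recomputing the factorisation.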

    def eval(self, x: TYPE_1D_FLOAT, rectify_input: bool = False) -> float:
        """computes the value of the polynomial at query point x

        uses either C based or numpy+Numba based evaluation

        Args:
            x: ndarray of floats with shape = [self.dim] representing the query point
            rectify_input: whether to convert the query point x into a compatible numpy array.
                with this set to True, the query point x can be given in standard python arrays

        Returns:
            the value of the polynomial at point x

        Raises:
            TypeError: if x is not given as ndarray of dtype float
            ValueError: if x does not have the shape ``[self.dim]``
        """
        if rectify_input:
            x = rectify_query_point(x)
        # the input type and shape should always be validated,
        # otherwise the numba jit compiled functions may fail with cryptic error messages
        validate_query_point(x, self.dim)
        if self.use_c_eval:
            return self._eval_c(x)
        # use numpy+Numba recipe evaluation as a fallback
        return self._eval_recipe(x, dtype=FLOAT_DTYPE)
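
    # usage sketch (illustrative values):
    #   x = np.array([-2.0, 3.0, 1.0])          # shape (self.dim,), dtype float
    #   p_x = polynomial.eval(x)
    #   # plain python sequences are accepted when rectify_input=True:
    #   p_x = polynomial.eval([-2.0, 3.0, 1.0], rectify_input=True)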

    def eval_complex(self, x: np.ndarray) -> COMPLEX_DTYPE:
        """computes the value of the polynomial at a complex query point x

        Args:
            x: the query point given as a numpy array of complex dtype

        Returns:
            the complex value of the polynomial at point x

        Raises:
            TypeError: if x is not given as ndarray of dtype complex
            ValueError: if x does not have the shape ``[self.dim]``
        """
        validate_query_point(x, self.dim, dtype=COMPLEX_DTYPE)
        return self._eval_recipe(x, dtype=COMPLEX_DTYPE)

    def _eval_recipe(self, x: TYPE_1D_FLOAT, dtype: Type[T]) -> T:
        """computes the value of the polynomial at query point x

        makes use of fast ``Numba`` just in time compiled functions
        """
        try:
            recipe = self.recipe
        except AttributeError:
            # the recipe has not been compiled yet
            self._compile_recipes()
            recipe = self.recipe

        value_array = np.empty(self.value_array_length, dtype=dtype)
        # the coefficients are being stored at the beginning of the value array
        # TODO remove flatten, always store coefficients as a 1D array (also for horner fact.)?!
        #   also in MultivarPolynomial.eval()
        value_array[: self.num_monomials] = self.coefficients.flatten()
        return eval_recipe(
            x,
            value_array,
            *recipe,
            self.root_value_idx,
        )

    @property
    def c_eval_fct(self):
        try:
            return self._c_eval_fct
        except AttributeError:
            compiled_file = self.c_file_compiled
            cdll = ctypes.CDLL(str(compiled_file))
            fct = getattr(cdll, c_evaluation.EVAL_FCT)
            fct.argtypes = (self.ctype_x, self.ctype_coeff)
            fct.restype = c_evaluation.C_TYPE_DOUBLE
            self._c_eval_fct = fct
            return self._c_eval_fct

    def _eval_c(self, x: TYPE_1D_FLOAT) -> float:
        compiled_file = self.c_file_compiled
        if not compiled_file.exists():
            raise ValueError(f"missing compiled C file: {compiled_file}")
        x_typed = self.ctype_x(*x)
        coeffs = self.coefficients.flatten()
        coeffs_typed = self.ctype_coeff(*coeffs)
        p_x = self.c_eval_fct(x_typed, coeffs_typed)
        return p_x
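
    # C based evaluation: the compiled shared library (see c_file_compiled below) is loaded via ctypes
    # and exposes a single function (its name is given by c_evaluation.EVAL_FCT) that takes the query
    # point and the coefficients as C double arrays of length dim and num_monomials respectively and
    # returns the polynomial value as a double.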

    def get_c_file_name(self, ending: str = ".c") -> str:
        return f"eval_poly_{hash(self)}{ending}"

    @property
    def c_file(self) -> Path:
        return PATH2CACHE / self.get_c_file_name()

    @property
    def c_file_compiled(self):
        return PATH2CACHE / self.get_c_file_name(ending=COMPILED_C_ENDING)

    @property
    def recipe_file(self) -> Path:
        return PATH2CACHE / f"numpy_recipe_{hash(self)}.pickle"

    def _write_c_file(self):
        path_out = self.c_file
        if path_out.exists():
            return
        # for compiling the instructions the factorisation must be computed first
        self._compute_factorisation()
        self.print("compiling C instructions ...")
        try:
            factorisation = self.factorisation
        except AttributeError:
            raise ValueError(
                "need a stored factorisation tree, but the reference to it has already been deleted. "
                "initialise the class with `keep_tree=True`"
            )
        self.num_ops = write_c_file(self.num_monomials, self.dim, path_out, factorisation, self.verbose)
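
    # Caching: the generated C file, the compiled shared library and the numpy recipe pickle are all
    # stored in PATH2CACHE under names derived from hash(self), so polynomials hashing to the same value
    # reuse previously written instructions instead of recomputing and recompiling them.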

    def get_c_instructions(self) -> str:
        path = self.c_file
        self.print(f"reading C instructions from file {path}")
        with open(path) as c_file:
            instr = c_file.read()
        return instr

    def _compile_c_file(self):
        path_out = self.c_file_compiled
        if path_out.exists():
            self.print(f"using existing compiled C file {path_out}")
            return
        # NOTE: skip compiling C instructions if no compiler is available
        compiler = get_compiler()
        self._write_c_file()
        path_in = self.c_file
        self.print(f"compiling to file {path_out}")
        compile_c_file(compiler, path_in, path_out)


class HornerMultivarPolynomialOpt(HornerMultivarPolynomial):
    """a Horner factorised polynomial with an optimal factorisation found by searching all possible factorisations

    Optimality in this context refers to the minimal amount of operations needed for evaluation
    in comparison to other Horner factorisations (not other factorisation/optimisation techniques).

    NOTES:

    * this requires MUCH more computational resources than just trying one factorisation
      (the number of possible factorisations grows exponentially with the size of the polynomial!).
    * for the small polynomial examples in the current tests, the found factorisations were not superior
    """

    root_class = OptimalFactorisationRoot
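

# Usage sketch for the optimal search variant (illustrative, not part of the original module;
# the interface is identical to HornerMultivarPolynomial, only the factorisation root class differs):
#
#   from multivar_horner.classes.horner_poly import HornerMultivarPolynomialOpt
#
#   p_opt = HornerMultivarPolynomialOpt(
#       [[5.0], [1.0], [2.0], [3.0]],
#       [[0, 0, 0], [3, 1, 0], [2, 0, 1], [1, 1, 1]],
#       rectify_input=True,
#       compute_representation=True,
#   )
#   p_opt.eval([-2.0, 3.0, 1.0], rectify_input=True)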