Source code for zfit.models.tobinned

#  Copyright (c) 2024 zfit
from __future__ import annotations

from typing import TYPE_CHECKING

if TYPE_CHECKING:
    import zfit

import tensorflow as tf

import zfit
import zfit.z.numpy as znp
from zfit import z

from ..core.interfaces import ZfitPDF, ZfitSpace
from ..util import ztyping
from ..util.warnings import warn_advanced_feature
from .binned_functor import BaseBinnedFunctorPDF


class MapNotVectorized(Exception):
    pass


[docs] class BinnedFromUnbinnedPDF(BaseBinnedFunctorPDF): def __init__( self, pdf: ZfitPDF, space: ZfitSpace, *, extended: ztyping.ExtendedInputType = None, norm: ztyping.NormInputType = None, name: str | None = None, label: str | None = None, ) -> None: """Create a binned pdf from an unbinned pdf binning in *space*. Args: pdf: The unbinned pdf to be binned. space: |@doc:pdf.init.obs| Observables of the model. This will be used as the default space of the PDF and, if not given explicitly, as the normalization range. The default space is used for example in the sample method: if no sampling limits are given, the default space is used. If the observables are binned and the model is unbinned, the model will be a binned model, by wrapping the model in a :py:class:`~zfit.pdf.BinnedFromUnbinnedPDF`, equivalent to calling :py:meth:`~zfit.pdf.BasePDF.to_binned`. The observables are not equal to the domain as it does not restrict or truncate the model outside this range. |@docend:pdf.init.obs| extended: |@doc:pdf.init.extended| The overall yield of the PDF. If this is parameter-like, it will be used as the yield, the expected number of events, and the PDF will be extended. An extended PDF has additional functionality, such as the ``ext_*`` methods and the ``counts`` (for binned PDFs). |@docend:pdf.init.extended| norm: |@doc:pdf.init.norm| Normalization of the PDF. By default, this is the same as the default space of the PDF. |@docend:pdf.init.norm| name: |@doc:pdf.init.name| Name of the PDF. Maybe has implications on the serialization and deserialization of the PDF. For a human-readable name, use the label. |@docend:pdf.init.name| label: |@doc:pdf.init.label| Human-readable name or label of the PDF for a better description, to be used with plots etc. Has no programmatical functional purpose as identification. |@docend:pdf.init.label| """ if pdf.is_extended: if extended is not None: warn_advanced_feature( f"PDF {pdf} is already extended, but extended also given {extended}. Will" f" use the given yield.", identifier="extend_wrapped_extended", ) else: extended = pdf.get_yield() if not isinstance(space, ZfitSpace): try: space = pdf.space.with_binning(space) except Exception as error: msg = f"Could not create space {space} from pdf {pdf} with binning {space}" raise ValueError(msg) from error if label is None: label = f"Binned_{pdf.name}" super().__init__( obs=space, extended=extended, norm=norm, models=pdf, params={}, name=name, label=label, ) self.pdfs = self.models # def _get_params(self, floating: bool | None = True, is_yield: bool | None = None, # extract_independent: bool | None = True) -> set[ZfitParameter]: # params = super()._get_params(floating=floating, is_yield=is_yield, extract_independent=extract_independent) # daughter_params = self.pdfs[0].get_params(floating=floating, is_yield=is_yield, # extract_independent=extract_independent) # return daughter_params | params @z.function def _rel_counts(self, x, norm): del x # not used, we just return the full histogram pdf = self.pdfs[0] edges = [znp.array(edge) for edge in self.axes.edges] edges_flat = [znp.reshape(edge, [-1]) for edge in edges] lowers = [edge[:-1] for edge in edges_flat] uppers = [edge[1:] for edge in edges_flat] lowers_meshed = znp.meshgrid(*lowers, indexing="ij") uppers_meshed = znp.meshgrid(*uppers, indexing="ij") shape = tf.shape(lowers_meshed[0]) lowers_meshed_flat = [znp.reshape(lower_mesh, [-1]) for lower_mesh in lowers_meshed] uppers_meshed_flat = [znp.reshape(upper_mesh, [-1]) for upper_mesh in uppers_meshed] lower_flat = znp.stack(lowers_meshed_flat, axis=-1) upper_flat = znp.stack(uppers_meshed_flat, axis=-1) options = {"type": "bins"} @z.function def integrate_one(limits): low, up = tf.unstack(limits) limits_space = zfit.Space(obs=self.obs, limits=[low, up]) return pdf.integrate(limits_space, norm=False, options=options) limits = znp.stack([lower_flat, upper_flat], axis=1) from zfit import run try: if run.get_graph_mode() is False: msg = "Just stearing the eager execution" raise MapNotVectorized(msg) values = tf.vectorized_map(integrate_one, limits)[:, 0] except (ValueError, MapNotVectorized): values = znp.asarray(tuple(map(integrate_one, limits))) values = znp.reshape(values, shape) if norm: values /= pdf.normalization(norm) return values @z.function(wraps="model_binned") def _counts(self, x, norm): del x # not used, we just return the full histogram pdf = self.pdfs[0] edges = [znp.array(edge) for edge in self.axes.edges] edges_flat = [znp.reshape(edge, [-1]) for edge in edges] lowers = [edge[:-1] for edge in edges_flat] uppers = [edge[1:] for edge in edges_flat] lowers_meshed = znp.meshgrid(*lowers, indexing="ij") uppers_meshed = znp.meshgrid(*uppers, indexing="ij") shape = tf.shape(lowers_meshed[0]) lowers_meshed_flat = [znp.reshape(lower_mesh, [-1]) for lower_mesh in lowers_meshed] uppers_meshed_flat = [znp.reshape(upper_mesh, [-1]) for upper_mesh in uppers_meshed] lower_flat = znp.stack(lowers_meshed_flat, axis=-1) upper_flat = znp.stack(uppers_meshed_flat, axis=-1) options = {"type": "bins"} if pdf.is_extended: @z.function def integrate_one(limits): low, up = tf.unstack(limits) limits_space = zfit.Space(obs=self.obs, limits=[low, up]) return pdf.ext_integrate(limits_space, norm=False, options=options) missing_yield = False else: @z.function def integrate_one(limits): low, up = tf.unstack(limits) limits_space = zfit.Space(obs=self.obs, limits=[low, up]) return pdf.integrate(limits_space, norm=False, options=options) missing_yield = True limits = znp.stack([lower_flat, upper_flat], axis=1) from zfit import run try: if run.get_graph_mode() is False: msg = "Just stearing the eager execution" raise MapNotVectorized(msg) values = tf.vectorized_map(integrate_one, limits)[:, 0] except (ValueError, MapNotVectorized): values = znp.asarray(tuple(map(integrate_one, limits))) values = znp.reshape(values, shape) if missing_yield: values *= self.get_yield() if norm: values /= pdf.normalization(norm) return values def __str__(self): return f"<BinnedFromUnbinnedPDF model={self.pdfs[0]} binning={self.space.binning}>"