§
    z”j,<  ã                  óx   — d dl mZ d dlmZ d dlmZ d dlZd dlmZ erd dlm	Z	m
Z
  G d„ dej        ¦  «        ZdS )	é    )Úannotations)ÚSequence)ÚTYPE_CHECKINGN)Údistribution)ÚTensorÚdtypec                  óè   ‡ — e Zd ZU dZded<   ded<   ded<   	 dd ˆ fd„Zd!d„Zd"d„Zd"d„Zd#d„Z	d"d„Z
ed"d„¦   «         Zed"d„¦   «         Zg fd$d„Zg fd$d„Zd#d„Zd#d„Zd"d„Zd#d„Zd#d„Zd%d„Zˆ xZS )&ÚContinuousBernoullia   The Continuous Bernoulli distribution with parameter: `probs` characterizing the shape of the density function.
    The Continuous Bernoulli distribution is defined on [0, 1], and it can be viewed as a continuous version of the Bernoulli distribution.

    `The continuous Bernoulli: fixing a pervasive error in variational autoencoders. <https://arxiv.org/abs/1907.06845>`_

    Mathematical details

    The probability density function (pdf) is

    .. math::

        p(x;\lambda) = C(\lambda)\lambda^x (1-\lambda)^{1-x}

    In the above equation:

    * :math:`x`: is continuous between 0 and 1
    * :math:`probs = \lambda`: is the probability.
    * :math:`C(\lambda)`: is the normalizing constant factor

    .. math::

        C(\lambda) =
        \left\{
        \begin{aligned}
        &2 & \text{ if $\lambda = \frac{1}{2}$} \\
        &\frac{2\tanh^{-1}(1-2\lambda)}{1 - 2\lambda} & \text{ otherwise}
        \end{aligned}
        \right.

    Args:
        probs(int|float|Tensor): The probability of Continuous Bernoulli distribution between [0, 1],
            which characterize the shape of the pdf. If the input data type is int or float, the data type of
            `probs` will be convert to a 1-D Tensor the paddle global default dtype.
        lims(tuple): Specify the unstable calculation region near 0.5, where the calculation is approximated
            by talyor expansion. The default value is (0.499, 0.501).

    Examples:
        .. code-block:: python

            >>> import paddle
            >>> from paddle.distribution import ContinuousBernoulli
            >>> paddle.set_device("cpu")
            >>> paddle.seed(100)

            >>> rv = ContinuousBernoulli(paddle.to_tensor([0.2, 0.5]))

            >>> print(rv.sample([2]))
            Tensor(shape=[2, 2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [[0.38694882, 0.20714243],
             [0.00631948, 0.51577556]])

            >>> print(rv.mean)
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.38801414, 0.50000000])

            >>> print(rv.variance)
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.07589778, 0.08333334])

            >>> print(rv.entropy())
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [-0.07641457,  0.        ])

            >>> print(rv.cdf(paddle.to_tensor(0.1)))
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.17259926, 0.10000000])

            >>> print(rv.icdf(paddle.to_tensor(0.1)))
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.05623737, 0.10000000])

            >>> rv1 = ContinuousBernoulli(paddle.to_tensor([0.2, 0.8]))
            >>> rv2 = ContinuousBernoulli(paddle.to_tensor([0.7, 0.5]))
            >>> print(rv1.kl_divergence(rv2))
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.20103608, 0.07641447])
    r   ÚprobsÚlimsr   ©gV-²ïß?gÕxé&1à?úfloat | Tensorútuple[float]ÚreturnÚNonec                ó”  •— t          j        ¦   «         | _        |                      |¦  «        | _        t          j        || j        ¬¦  «        | _        t          j        | j        j        ¦  «        j        }t          j	        | j        |d|z
  ¬¦  «        | _        | j        j
        }t          ¦   «                              |¦  «         d S )N©r   é   )ÚminÚmax)ÚpaddleÚget_default_dtyper   Ú
_to_tensorr   Ú	to_tensorr   ÚfinfoÚepsÚclipÚshapeÚsuperÚ__init__)Úselfr   r   Úeps_probÚbatch_shapeÚ	__class__s        €úx/lsinfo/ai/hellotax_ai/data_center/backend/venv/lib/python3.11/site-packages/paddle/distribution/continuous_bernoulli.pyr    zContinuousBernoulli.__init__n   s    ø€ õ Ô-Ñ/Ô/ˆŒ
Ø—_’_ UÑ+Ô+ˆŒ
ÝÔ$ T°´Ð<Ñ<Ô<ˆŒ	õ ”< ¤
Ô 0Ñ1Ô1Ô5ˆÝ”[ ¤°¸qÀ8¹|ÐLÑLÔLˆŒ
à”jÔ&ˆÝ‰Œ×Ò˜Ñ%Ô%Ð%Ð%Ð%ó    c                ó   — t          |t          t          f¦  «        rt          j        |g| j        ¬¦  «        }n|j        | _        |S )zoConvert the input parameters into tensors

        Returns:
            Tensor: converted probability.
        r   )Ú
isinstanceÚfloatÚintr   r   r   )r!   r   s     r%   r   zContinuousBernoulli._to_tensor|   sC   € õ ee¥S˜\Ñ*Ô*ð 	%ÝÔ$ e W°D´JÐ?Ñ?Ô?ˆEˆEàœˆDŒJØˆr&   c                ó¸   — t          j        t          j        | j        | j        d         ¦  «        t          j        | j        | j        d         ¦  «        ¦  «        S )zïGenerate stable support region indicator (prob < self.lims[0] && prob >= self.lims[1] )

        Returns:
            Tensor: the element of the returned indicator tensor corresponding to stable region is True, and False otherwise
        r   r   )r   Ú
logical_orÚ
less_equalr   r   Úgreater_than©r!   s    r%   Ú_cut_support_regionz'ContinuousBernoulli._cut_support_region‰   sI   € õ Ô ÝÔ˜dœj¨$¬)°A¬,Ñ7Ô7ÝÔ ¤
¨D¬I°a¬LÑ9Ô9ñ
ô 
ð 	
r&   c                ó¦   — t          j        |                      ¦   «         | j        | j        d         t          j        | j        ¦  «        z  ¦  «        S )zêCut the probability parameter with stable support region

        Returns:
            Tensor: the element of the returned probability tensor corresponding to unstable region is set to be self.lims[0], and unchanged otherwise
        r   )r   Úwherer0   r   r   Ú	ones_liker/   s    r%   Ú
_cut_probszContinuousBernoulli._cut_probs”   sG   € õ Œ|Ø×$Ò$Ñ&Ô&ØŒJØŒIaŒL6Ô+¨D¬JÑ7Ô7Ñ7ñ
ô 
ð 	
r&   Úvaluec                ó\   — dt          j        |¦  «        t          j        | ¦  «        z
  z  S )z’Calculate the tanh inverse of value

        Args:
            value (Tensor)

        Returns:
            Tensor: tanh inverse of value
        ç      à?)r   Úlog1p©r!   r5   s     r%   Ú_tanh_inversez!ContinuousBernoulli._tanh_inverse    s*   € ð •f”l 5Ñ)Ô)­F¬L¸%¸Ñ,@Ô,@Ñ@ÑAÐAr&   c           
     óx  — |                       ¦   «         }t          j        d| j        ¬¦  «        }t          j        t          j        ||¦  «        |t          j        |¦  «        ¦  «        }t          j        t          j        ||¦  «        |t          j        |¦  «        ¦  «        }t          j	        dt          j
        |                      dd|z  z
  ¦  «        ¦  «        z  ¦  «        t          j        t          j        ||¦  «        t          j        d|z  ¦  «        t          j	        d|z  dz
  ¦  «        ¦  «        z
  }t          j        | j        dz
  ¦  «        }t          j	        t          j        d| j        ¬¦  «        ¦  «        dd|z  z   |z  z   }t          j        |                      ¦   «         ||¦  «        S )zÄCalculate the logarithm of the constant factor :math:`C(lambda)` in the pdf of the Continuous Bernoulli distribution

        Returns:
            Tensor: logarithm of the constant factor
        r7   r   ç       @ç      ð?g       ÀgUUUUUUõ?gÒ'}Ò'}@)r4   r   r   r   r2   r-   Ú
zeros_likeÚgreater_equalr3   ÚlogÚabsr:   r8   Úsquarer   r0   )r!   Ú	cut_probsÚhalfÚcut_probs_below_halfÚcut_probs_above_halfÚlog_constant_proposeÚxÚtaylor_expansions           r%   Ú_log_constantz!ContinuousBernoulli._log_constant«   sœ  € ð —O’OÑ%Ô%ˆ	ÝÔ ¨4¬:Ð6Ñ6Ô6ˆÝ%œ|ÝÔ˜i¨Ñ.Ô.ØÝÔ˜iÑ(Ô(ñ 
ô  
Ðõ
  &œ|ÝÔ  ¨DÑ1Ô1ØÝÔ˜YÑ'Ô'ñ 
ô  
Ðõ
  &œzØ•&”*˜T×/Ò/°°c¸I±oÑ0EÑFÔFÑGÔGÑGñ 
ô  
åŒLÝÔ˜i¨Ñ.Ô.ÝŒL˜Ð 4Ñ4Ñ5Ô5ÝŒJsÐ1Ñ1°CÑ7Ñ8Ô8ñ
ô 
ñ 
Ðõ ŒM˜$œ* sÑ*Ñ+Ô+ˆåŒJ•vÔ'¨°4´:Ð>Ñ>Ô>Ñ?Ô?Ø˜<¨!Ñ+Ñ+¨qÑ0ñ1ð 	õ Œ|Ø×$Ò$Ñ&Ô&Ð(<Ð>Nñ
ô 
ð 	
r&   c           
     óž  — |                       ¦   «         }t          j        |d|z  dz
  ¦  «        }|t          j        t          j        d| j        ¬¦  «        d|                      dd|z  z
  ¦  «        z  ¦  «        z   }| j        dz
  }dddt          j        |¦  «        z  z   |z  z   }t          j        |  	                    ¦   «         ||¦  «        S )zeMean of Continuous Bernoulli distribution.

        Returns:
            Tensor: mean value.
        r<   r=   r   r7   gUUUUUUÕ?glÁlÁÖ?)
r4   r   Údivider   r   r:   r   rB   r2   r0   ©r!   rC   ÚtmpÚproposerH   rI   s         r%   ÚmeanzContinuousBernoulli.meanÍ   s×   € ð —O’OÑ%Ô%ˆ	ÝŒm˜I s¨Y¡¸Ñ'<Ñ=Ô=ˆØœÝÔ˜S¨¬
Ð3Ñ3Ô3Ø$×$Ò$ S¨3°©?Ñ%:Ñ;Ô;Ñ;ñ
ô 
ñ 
ˆð ŒJ˜Ñˆà9˜{­V¬]¸1Ñ-=Ô-=Ñ=Ñ=ÀÑBÑBð 	õ Œ|Ø×$Ò$Ñ&Ô&¨Ð1Añ
ô 
ð 	
r&   c           
     ó
  — |                       ¦   «         }t          j        ||dz
  z  t          j        dd|z  z
  ¦  «        ¦  «        }|t          j        t          j        d| j        ¬¦  «        t          j        t          j        | ¦  «        t          j        |¦  «        z
  ¦  «        ¦  «        z   }t          j        | j        dz
  ¦  «        }ddd|z  z
  |z  z
  }t          j	        |  
                    ¦   «         ||¦  «        S )zmVariance of Continuous Bernoulli distribution.

        Returns:
            Tensor: variance value.
        r=   r<   r   r7   gUUUUUUµ?g±?gg¼jVÁ?)r4   r   rL   rB   r   r   r8   r@   r   r2   r0   rM   s         r%   ÚvariancezContinuousBernoulli.varianceâ   s÷   € ð —O’OÑ%Ô%ˆ	ÝŒmØ˜ S™Ñ)ÝŒM˜#  i¡Ñ/Ñ0Ô0ñ
ô 
ˆð œÝÔ˜S¨¬
Ð3Ñ3Ô3ÝŒM&œ,¨	 zÑ2Ô2µV´ZÀ	Ñ5JÔ5JÑJÑKÔKñ
ô 
ñ 
ˆõ ŒM˜$œ* sÑ*Ñ+Ô+ˆØ%¨°mÀaÑ6GÑ)GÈ1Ñ(LÑLÐÝŒ|Ø×$Ò$Ñ&Ô&¨Ð1Añ
ô 
ð 	
r&   r   úSequence[int]c                ó†   — t          j        ¦   «         5  |                      |¦  «        cddd¦  «         S # 1 swxY w Y   dS )áC  Generate Continuous Bernoulli samples of the specified shape. The final shape would be ``sample_shape + batch_shape``.

        Args:
            shape (Sequence[int], optional): Prepended shape of the generated samples.

        Returns:
            Tensor, Sampled data with shape `sample_shape` + `batch_shape`.
        N)r   Úno_gradÚrsample)r!   r   s     r%   ÚsamplezContinuousBernoulli.sampleø   s…   € õ Œ^ÑÔð 	'ð 	'Ø—<’< Ñ&Ô&ð	'ð 	'ð 	'ð 	'ñ 	'ô 	'ð 	'ð 	'ð 	'ð 	'ð 	'ð 	'øøøð 	'ð 	'ð 	'ð 	'ð 	'ð 	's   ”6¶:½:c                ó  — t          |t          ¦  «        st          d¦  «        ‚t          |¦  «        }t          | j        ¦  «        }t          ||z   ¦  «        }t          j        || j        dd¬¦  «        }|                      |¦  «        S )rU   z%sample shape must be Sequence object.r   r   )r   r   r   r   )	r(   r   Ú	TypeErrorÚtupler#   r   Úuniformr   Úicdf)r!   r   r#   Úoutput_shapeÚus        r%   rW   zContinuousBernoulli.rsample  s}   € õ ˜%¥Ñ*Ô*ð 	EÝÐCÑDÔDÐDÝe‘”ˆÝ˜DÔ,Ñ-Ô-ˆÝ˜U [Ñ0Ñ1Ô1ˆÝŒN °T´ZÀQÈAÐNÑNÔNˆØyŠy˜‰|Œ|Ðr&   c                óT  — t          j        || j        ¬¦  «        }t          j        | j        j        ¦  «        j        }t          j        |t          j        | j        ¦  «        z  d|z
  t          j        d| j        z
  ¦  «        z  z   | ¬¦  «        }|                      ¦   «         |z   S )zÅLog probability density function.

        Args:
          value (Tensor): The input tensor.

        Returns:
          Tensor: log probability. The data type is the same as `self.probs`.
        r   r=   r   )Úneginf)	r   Úcastr   r   r   r   Ú
nan_to_numr@   rJ   )r!   r5   r   Úcross_entropys       r%   Úlog_probzContinuousBernoulli.log_prob  s›   € õ ”˜E¨¬Ð4Ñ4Ô4ˆÝŒl˜4œ:Ô+Ñ,Ô,Ô0ˆÝÔ)Ø•F”J˜tœzÑ*Ô*Ñ*ØU‰{fœj¨¨T¬Z©Ñ8Ô8Ñ8ñ9à4ð
ñ 
ô 
ˆð
 ×!Ò!Ñ#Ô# mÑ3Ð3r&   c                óP   — t          j        |                      |¦  «        ¦  «        S )zÁProbability density function.

        Args:
            value (Tensor): The input tensor.

        Returns:
            Tensor: probability. The data type is the same as `self.probs`.
        )r   Úexpre   r9   s     r%   ÚprobzContinuousBernoulli.prob'  s    € õ Œz˜$Ÿ-š-¨Ñ.Ô.Ñ/Ô/Ð/r&   c           	     ón  — t          j        | j        ¦  «        }t          j        | j         ¦  «        }t          j        t          j        | j        t          j        d| j        ¬¦  «        ¦  «        t          j        | j        d¦  «        |  	                    ¦   «          | j
        ||z
  z  z   |z
  ¦  «        S )a‚  Shannon entropy in nats.

        The entropy is

        .. math::

            \mathcal{H}(X) = -\log C + \left[ \log (1 - \lambda) -\log \lambda \right] \mathbb{E}(X)  - \log(1 - \lambda)

        In the above equation:

        * :math:`\Omega`: is the support of the distribution.

        Returns:
            Tensor, Shannon entropy of Continuous Bernoulli distribution.
        r7   r   ç        )r   r@   r   r8   r2   Úequalr   r   Ú	full_likerJ   rP   )r!   Úlog_pÚlog_1_minus_ps      r%   ÚentropyzContinuousBernoulli.entropy2  sŸ   € õ  ”
˜4œ:Ñ&Ô&ˆÝœ d¤j [Ñ1Ô1ˆåŒ|ÝŒL˜œ¥VÔ%5°cÀÄÐ%LÑ%LÔ%LÑMÔMÝÔ˜TœZ¨Ñ-Ô-à×#Ò#Ñ%Ô%Ð%Ø”)˜}¨uÑ4Ñ5ñ6àñ ñ	
ô 
ð 	
r&   c                ó|  — t          j        || j        ¬¦  «        }|                      ¦   «         }t          j        ||¦  «        t          j        d|z
  d|z
  ¦  «        z  |z   dz
  d|z  dz
  z  }t          j        |                      ¦   «         ||¦  «        }t          j        t          j        |t          j        d| j        ¬¦  «        ¦  «        t          j	        |¦  «        t          j        t          j
        |t          j        d| j        ¬¦  «        ¦  «        t          j        |¦  «        |¦  «        ¦  «        S )a>  Cumulative distribution function

        .. math::

            {   P(X \le t; \lambda) =
                F(t;\lambda) =
                \left\{
                \begin{aligned}
                &t & \text{ if $\lambda = \frac{1}{2}$} \\
                &\frac{\lambda^t (1 - \lambda)^{1 - t} + \lambda - 1}{2\lambda - 1} & \text{ otherwise}
                \end{aligned}
                \right. }

        Args:
            value (Tensor): The input tensor.

        Returns:
            Tensor: quantile of :attr:`value`. The data type is the same as `self.probs`.
        r   r=   r<   rj   )r   rb   r   r4   Úpowr2   r0   r-   r   r>   r?   r3   )r!   r5   rC   ÚcdfsÚunbounded_cdfss        r%   ÚcdfzContinuousBernoulli.cdfO  s)  € õ( ”˜E¨¬Ð4Ñ4Ô4ˆØ—O’OÑ%Ô%ˆ	åŒJy %Ñ(Ô(ÝŒj˜˜y™¨#°©+Ñ6Ô6ñ7àñð ñð 9‰_˜sÑ"ñ$ˆõ  œ d×&>Ò&>Ñ&@Ô&@À$ÈÑNÔNˆÝŒ|ÝÔ˜e¥VÔ%5°cÀÄÐ%LÑ%LÔ%LÑMÔMÝÔ˜eÑ$Ô$ÝŒLÝÔ$Ø6Ô+¨C°t´zÐBÑBÔBñô õ Ô  Ñ'Ô'Øñô ñ

ô 

ð 
	
r&   c           	     óp  — t          j        || j        ¬¦  «        }|                      ¦   «         }t          j        |                      ¦   «         t          j        | |d|z  dz
  z  z   ¦  «        t          j        | ¦  «        z
  t          j        |¦  «        t          j        | ¦  «        z
  z  |¦  «        S )af  Inverse cumulative distribution function

        .. math::

            {   F^{-1}(x;\lambda) =
                \left\{
                \begin{aligned}
                &x & \text{ if $\lambda = \frac{1}{2}$} \\
                &\frac{\log(1+(\frac{2\lambda - 1}{1 - \lambda})x)}{\log(\frac{\lambda}{1-\lambda})} & \text{ otherwise}
                \end{aligned}
                \right. }

        Args:
            value (Tensor): The input tensor, meaning the quantile.

        Returns:
            Tensor: the value of the r.v. corresponding to the quantile. The data type is the same as `self.probs`.
        r   r<   r=   )r   rb   r   r4   r2   r0   r8   r@   )r!   r5   rC   s      r%   r]   zContinuousBernoulli.icdfx  s­   € õ& ”˜E¨¬Ð4Ñ4Ô4ˆØ—O’OÑ%Ô%ˆ	ÝŒ|Ø×$Ò$Ñ&Ô&å”˜i˜Z¨%°3¸±?ÀSÑ3HÑ*IÑIÑJÔJÝ”, 	˜zÑ*Ô*ñ+õ Œz˜)Ñ$Ô$¥v¤|°Y°JÑ'?Ô'?Ñ?ñ	Að
 ñ
ô 
ð 	
r&   Úotherc                ó&  — | j         |j         k    rt          d¦  «        ‚|                      ¦   «          }t          j        |j        ¦  «        }t          j        |j         ¦  «        }|                     ¦   «         | j        ||z
  z  z   |z    }||z   S )a  The KL-divergence between two Continuous Bernoulli distributions with the same `batch_shape`.

        The probability density function (pdf) is

        .. math::

            KL\_divergence(\lambda_1, \lambda_2) = - H - \{\log C_2 + [\log \lambda_2 -  \log (1-\lambda_2)]  \mathbb{E}_1(X) +  \log (1-\lambda_2)  \}

        Args:
            other (ContinuousBernoulli): instance of Continuous Bernoulli.

        Returns:
            Tensor, kl-divergence between two Continuous Bernoulli distributions.

        z\KL divergence of two Continuous Bernoulli distributions should share the same `batch_shape`.)	r#   Ú
ValueErrorro   r   r@   r   r8   rJ   rP   )r!   rv   Úpart1Úlog_qÚlog_1_minus_qÚpart2s         r%   Úkl_divergencez!ContinuousBernoulli.kl_divergence—  s   € ð" Ô˜uÔ0Ò0Ð0ÝØnñô ð ð —’‘”ˆÝ”
˜5œ;Ñ'Ô'ˆÝœ e¤k \Ñ2Ô2ˆà×ÒÑ!Ô!ØŒi˜5 =Ñ0Ñ1ñ2àñð
ˆð
 u‰}Ðr&   )r   )r   r   r   r   r   r   )r   r   r   r   )r   r   )r5   r   r   r   )r   rS   r   r   )rv   r
   r   r   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__Ú__annotations__r    r   r0   r4   r:   rJ   ÚpropertyrP   rR   rX   rW   re   rh   ro   rt   r]   r}   Ú__classcell__)r$   s   @r%   r
   r
      sÒ  ø€ € € € € € ðLð Lð\ €M€MMØ€L€LLØ€L€LLð ;Ið&ð &ð &ð &ð &ð &ð &ðð ð ð ð	
ð 	
ð 	
ð 	
ð

ð 

ð 

ð 

ð	Bð 	Bð 	Bð 	Bð 
ð  
ð  
ð  
ðD ð
ð 
ð 
ñ „Xð
ð( ð
ð 
ð 
ñ „Xð
ð* -/ð 
'ð 
'ð 
'ð 
'ð 
'ð .0ð ð ð ð ð ð"4ð 4ð 4ð 4ð$	0ð 	0ð 	0ð 	0ð
ð 
ð 
ð 
ð:'
ð '
ð '
ð '
ðR
ð 
ð 
ð 
ð>ð ð ð ð ð ð ð r&   r
   )Ú
__future__r   Úcollections.abcr   Útypingr   r   Úpaddle.distributionr   r   r   ÚDistributionr
   © r&   r%   ú<module>r‹      s¹   ðð #Ð "Ð "Ð "Ð "Ð "à $Ð $Ð $Ð $Ð $Ð $Ø  Ð  Ð  Ð  Ð  Ð  à €€€Ø ,Ð ,Ð ,Ð ,Ð ,Ð ,àð %Ø$Ð$Ð$Ð$Ð$Ð$Ð$Ð$ðYð Yð Yð Yð Y˜,Ô3ñ Yô Yð Yð Yð Yr&   