o
    ñpi,<  ã                   @  sb   d dl mZ d dlmZ d dlmZ d dlZd dlmZ er&d dlm	Z	m
Z
 G dd„ dejƒZdS )	é    )Úannotations)ÚSequence)ÚTYPE_CHECKINGN)Údistribution)ÚTensorÚdtypec                      sæ   e Zd ZU dZded< ded< ded< 	d/d0‡ fdd„Zd1dd„Zd2dd„Zd2dd„Zd3dd„Z	d2dd„Z
ed2dd„ƒZed2dd„ƒZg fd4dd„Zg fd4d d!„Zd3d"d#„Zd3d$d%„Zd2d&d'„Zd3d(d)„Zd3d*d+„Zd5d-d.„Z‡  ZS )6ÚContinuousBernoullia   The Continuous Bernoulli distribution with parameter: `probs` characterizing the shape of the density function.
    The Continuous Bernoulli distribution is defined on [0, 1], and it can be viewed as a continuous version of the Bernoulli distribution.

    `The continuous Bernoulli: fixing a pervasive error in variational autoencoders. <https://arxiv.org/abs/1907.06845>`_

    Mathematical details

    The probability density function (pdf) is

    .. math::

        p(x;\lambda) = C(\lambda)\lambda^x (1-\lambda)^{1-x}

    In the above equation:

    * :math:`x`: is continuous between 0 and 1
    * :math:`probs = \lambda`: is the probability.
    * :math:`C(\lambda)`: is the normalizing constant factor

    .. math::

        C(\lambda) =
        \left\{
        \begin{aligned}
        &2 & \text{ if $\lambda = \frac{1}{2}$} \\
        &\frac{2\tanh^{-1}(1-2\lambda)}{1 - 2\lambda} & \text{ otherwise}
        \end{aligned}
        \right.

    Args:
        probs(int|float|Tensor): The probability of Continuous Bernoulli distribution between [0, 1],
            which characterize the shape of the pdf. If the input data type is int or float, the data type of
            `probs` will be convert to a 1-D Tensor the paddle global default dtype.
        lims(tuple): Specify the unstable calculation region near 0.5, where the calculation is approximated
            by talyor expansion. The default value is (0.499, 0.501).

    Examples:
        .. code-block:: python

            >>> import paddle
            >>> from paddle.distribution import ContinuousBernoulli
            >>> paddle.set_device("cpu")
            >>> paddle.seed(100)

            >>> rv = ContinuousBernoulli(paddle.to_tensor([0.2, 0.5]))

            >>> print(rv.sample([2]))
            Tensor(shape=[2, 2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [[0.38694882, 0.20714243],
             [0.00631948, 0.51577556]])

            >>> print(rv.mean)
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.38801414, 0.50000000])

            >>> print(rv.variance)
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.07589778, 0.08333334])

            >>> print(rv.entropy())
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [-0.07641457,  0.        ])

            >>> print(rv.cdf(paddle.to_tensor(0.1)))
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.17259926, 0.10000000])

            >>> print(rv.icdf(paddle.to_tensor(0.1)))
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.05623737, 0.10000000])

            >>> rv1 = ContinuousBernoulli(paddle.to_tensor([0.2, 0.8]))
            >>> rv2 = ContinuousBernoulli(paddle.to_tensor([0.7, 0.5]))
            >>> print(rv1.kl_divergence(rv2))
            Tensor(shape=[2], dtype=float32, place=Place(cpu), stop_gradient=True,
            [0.20103608, 0.07641447])
    r   ÚprobsÚlimsr   ©gV-²ïß?gÕxé&1à?úfloat | Tensorútuple[float]ÚreturnÚNonec                   sh   t  ¡ | _|  |¡| _t j|| jd| _t  | jj¡j}t j	| j|d| d| _| jj
}tƒ  |¡ d S )N©r   é   )ÚminÚmax)ÚpaddleZget_default_dtyper   Ú
_to_tensorr	   Ú	to_tensorr
   ÚfinfoÚepsZclipÚshapeÚsuperÚ__init__)Úselfr	   r
   Zeps_probÚbatch_shape©Ú	__class__© úo/home/app/PaddleOCR-VL/.venv_paddleocr/lib/python3.10/site-packages/paddle/distribution/continuous_bernoulli.pyr   n   s   
zContinuousBernoulli.__init__c                 C  s0   t |ttfƒrtj|g| jd}|S |j| _|S )zoConvert the input parameters into tensors

        Returns:
            Tensor: converted probability.
        r   )Ú
isinstanceÚfloatÚintr   r   r   )r   r	   r    r    r!   r   |   s
   ÿzContinuousBernoulli._to_tensorc                 C  s,   t  t  | j| jd ¡t  | j| jd ¡¡S )zïGenerate stable support region indicator (prob < self.lims[0] && prob >= self.lims[1] )

        Returns:
            Tensor: the element of the returned indicator tensor corresponding to stable region is True, and False otherwise
        r   r   )r   Ú
logical_orÚ
less_equalr	   r
   Úgreater_than©r   r    r    r!   Ú_cut_support_region‰   s   þz'ContinuousBernoulli._cut_support_regionc                 C  s&   t  |  ¡ | j| jd t  | j¡ ¡S )zêCut the probability parameter with stable support region

        Returns:
            Tensor: the element of the returned probability tensor corresponding to unstable region is set to be self.lims[0], and unchanged otherwise
        r   )r   Úwherer)   r	   r
   Ú	ones_liker(   r    r    r!   Ú
_cut_probs”   s
   ýzContinuousBernoulli._cut_probsÚvaluec                 C  s   dt  |¡t  | ¡  S )z’Calculate the tanh inverse of value

        Args:
            value (Tensor)

        Returns:
            Tensor: tanh inverse of value
        ç      à?)r   Úlog1p©r   r-   r    r    r!   Ú_tanh_inverse    s   	z!ContinuousBernoulli._tanh_inversec              
   C  sè   |   ¡ }tjd| jd}t t ||¡|t |¡¡}t t ||¡|t |¡¡}t 	dt 
|  dd|  ¡¡ ¡t t ||¡t d| ¡t 	d| d ¡¡ }t | jd ¡}t 	tjd| jd¡dd|  |  }t |  ¡ ||¡S )zÄCalculate the logarithm of the constant factor :math:`C(lambda)` in the pdf of the Continuous Bernoulli distribution

        Returns:
            Tensor: logarithm of the constant factor
        r.   r   ç       @ç      ð?g       ÀgUUUUUUõ?gÒ'}Ò'}@)r,   r   r   r   r*   r&   Ú
zeros_likeÚgreater_equalr+   ÚlogÚabsr1   r/   Úsquarer	   r)   )r   Ú	cut_probsZhalfZcut_probs_below_halfZcut_probs_above_halfZlog_constant_proposeÚxÚtaylor_expansionr    r    r!   Ú_log_constant«   s:   
ý
ýÿ
ýþÿÿ
ÿz!ContinuousBernoulli._log_constantc              
   C  s€   |   ¡ }t |d| d ¡}|t tjd| jdd|  dd|  ¡ ¡ }| jd }dddt |¡  |  }t |  	¡ ||¡S )zeMean of Continuous Bernoulli distribution.

        Returns:
            Tensor: mean value.
        r2   r3   r   r.   gUUUUUUÕ?glÁlÁÖ?)
r,   r   Údivider   r   r1   r	   r8   r*   r)   ©r   r9   ÚtmpZproposer:   r;   r    r    r!   ÚmeanÍ   s   þ
ÿ
ÿzContinuousBernoulli.meanc              
   C  s”   |   ¡ }t ||d  t dd|  ¡¡}|t tjd| jdt t | ¡t |¡ ¡¡ }t | jd ¡}ddd|  |  }t 	|  
¡ ||¡S )zmVariance of Continuous Bernoulli distribution.

        Returns:
            Tensor: variance value.
        r3   r2   r   r.   gUUUUUUµ?g±?gg¼jVÁ?)r,   r   r=   r8   r   r   r/   r6   r	   r*   r)   r>   r    r    r!   Úvarianceâ   s   
þþ
ÿzContinuousBernoulli.variancer   úSequence[int]c                 C  s6   t  ¡  |  |¡W  d  ƒ S 1 sw   Y  dS )áC  Generate Continuous Bernoulli samples of the specified shape. The final shape would be ``sample_shape + batch_shape``.

        Args:
            shape (Sequence[int], optional): Prepended shape of the generated samples.

        Returns:
            Tensor, Sampled data with shape `sample_shape` + `batch_shape`.
        N)r   Zno_gradÚrsample)r   r   r    r    r!   Úsampleø   s   
	$ÿzContinuousBernoulli.samplec                 C  sN   t |tƒs	tdƒ‚t|ƒ}t| jƒ}t|| ƒ}tj|| jddd}|  |¡S )rC   z%sample shape must be Sequence object.r   r   )r   r   r   r   )	r"   r   Ú	TypeErrorÚtupler   r   Úuniformr   Úicdf)r   r   r   Zoutput_shapeÚur    r    r!   rD     s   
	

zContinuousBernoulli.rsamplec                 C  s`   t j|| jd}t  | jj¡j}t j|t  | j¡ d| t  d| j ¡  | d}|  ¡ | S )zÅLog probability density function.

        Args:
          value (Tensor): The input tensor.

        Returns:
          Tensor: log probability. The data type is the same as `self.probs`.
        r   r3   r   )Zneginf)	r   Úcastr   r   r	   r   Z
nan_to_numr6   r<   )r   r-   r   Zcross_entropyr    r    r!   Úlog_prob  s   	ÿýzContinuousBernoulli.log_probc                 C  s   t  |  |¡¡S )zÁProbability density function.

        Args:
            value (Tensor): The input tensor.

        Returns:
            Tensor: probability. The data type is the same as `self.probs`.
        )r   ÚexprL   r0   r    r    r!   Úprob'  s   	zContinuousBernoulli.probc              	   C  s`   t  | j¡}t  | j ¡}t  t  | jt jd| jd¡t  | jd¡|  	¡  | j
||   | ¡S )a‚  Shannon entropy in nats.

        The entropy is

        .. math::

            \mathcal{H}(X) = -\log C + \left[ \log (1 - \lambda) -\log \lambda \right] \mathbb{E}(X)  - \log(1 - \lambda)

        In the above equation:

        * :math:`\Omega`: is the support of the distribution.

        Returns:
            Tensor, Shannon entropy of Continuous Bernoulli distribution.
        r.   r   ç        )r   r6   r	   r/   r*   Úequalr   r   Z	full_liker<   r@   )r   Zlog_pZlog_1_minus_pr    r    r!   Úentropy2  s   ÿþüzContinuousBernoulli.entropyc                 C  sª   t j|| jd}|  ¡ }t  ||¡t  d| d| ¡ | d d| d  }t  |  ¡ ||¡}t  t  |t jd| jd¡t  	|¡t  t  
|t jd| jd¡t  |¡|¡¡S )a>  Cumulative distribution function

        .. math::

            {   P(X \le t; \lambda) =
                F(t;\lambda) =
                \left\{
                \begin{aligned}
                &t & \text{ if $\lambda = \frac{1}{2}$} \\
                &\frac{\lambda^t (1 - \lambda)^{1 - t} + \lambda - 1}{2\lambda - 1} & \text{ otherwise}
                \end{aligned}
                \right. }

        Args:
            value (Tensor): The input tensor.

        Returns:
            Tensor: quantile of :attr:`value`. The data type is the same as `self.probs`.
        r   r3   r2   rO   )r   rK   r   r,   Úpowr*   r)   r&   r   r4   r5   r+   )r   r-   r9   ZcdfsZunbounded_cdfsr    r    r!   ÚcdfO  s.   
ÿþý
ûÿûýzContinuousBernoulli.cdfc              	   C  sd   t j|| jd}|  ¡ }t  |  ¡ t  | |d| d   ¡t  | ¡ t  |¡t  | ¡  |¡S )af  Inverse cumulative distribution function

        .. math::

            {   F^{-1}(x;\lambda) =
                \left\{
                \begin{aligned}
                &x & \text{ if $\lambda = \frac{1}{2}$} \\
                &\frac{\log(1+(\frac{2\lambda - 1}{1 - \lambda})x)}{\log(\frac{\lambda}{1-\lambda})} & \text{ otherwise}
                \end{aligned}
                \right. }

        Args:
            value (Tensor): The input tensor, meaning the quantile.

        Returns:
            Tensor: the value of the r.v. corresponding to the quantile. The data type is the same as `self.probs`.
        r   r2   r3   )r   rK   r   r,   r*   r)   r/   r6   )r   r-   r9   r    r    r!   rI   x  s   
ÿüùzContinuousBernoulli.icdfÚotherc                 C  s\   | j |j kr
tdƒ‚|  ¡  }t |j¡}t |j ¡}| ¡ | j||   |  }|| S )a  The KL-divergence between two Continuous Bernoulli distributions with the same `batch_shape`.

        The probability density function (pdf) is

        .. math::

            KL\_divergence(\lambda_1, \lambda_2) = - H - \{\log C_2 + [\log \lambda_2 -  \log (1-\lambda_2)]  \mathbb{E}_1(X) +  \log (1-\lambda_2)  \}

        Args:
            other (ContinuousBernoulli): instance of Continuous Bernoulli.

        Returns:
            Tensor, kl-divergence between two Continuous Bernoulli distributions.

        z\KL divergence of two Continuous Bernoulli distributions should share the same `batch_shape`.)	r   Ú
ValueErrorrQ   r   r6   r	   r/   r<   r@   )r   rT   Zpart1Zlog_qZlog_1_minus_qZpart2r    r    r!   Úkl_divergence—  s   ÿ
ÿþÿz!ContinuousBernoulli.kl_divergence)r   )r	   r   r
   r   r   r   )r	   r   r   r   )r   r   )r-   r   r   r   )r   rB   r   r   )rT   r   r   r   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__Ú__annotations__r   r   r)   r,   r1   r<   Úpropertyr@   rA   rE   rD   rL   rN   rQ   rS   rI   rV   Ú__classcell__r    r    r   r!   r      s0   
 Nÿ




"




)r   )Ú
__future__r   Úcollections.abcr   Útypingr   r   Zpaddle.distributionr   r   r   ÚDistributionr   r    r    r    r!   Ú<module>   s   