o
    + iï  ã                   @  sh   d dl mZ d dlZd dlmZ d dlmZ ddlmZ er*d dl	m
Z
 ddlmZ G d	d
„ d
eƒZdS )é    )ÚannotationsN)ÚTYPE_CHECKING)Úfleeté   )ÚQuantization)ÚLayer)ÚQuantConfigc                      s6   e Zd ZdZd‡ fdd„Zdd	„ Zdddd„Z‡  ZS )ÚPTQz;
    Applying post training quantization to the model.
    Úconfigr   ÚreturnÚNonec                   s   t ƒ  |¡ d S )N)ÚsuperÚ__init__)Úselfr
   ©Ú	__class__© úc/home/app/PaddleOCR-VL-test/.venv_paddleocr/lib/python3.10/site-packages/paddle/quantization/ptq.pyr   "   s   zPTQ.__init__c                 C  s.   zt  ¡ dkr
W dS W dS  ty   Y dS w )Né   TF)r   Z
worker_numÚ	Exception)r   r   r   r   Ú_is_parallel_training%   s   ÿzPTQ._is_parallel_trainingFÚmodelr   ÚinplaceÚboolc                 C  sd   |}|s|   ¡ rJ dƒ‚t |¡}| ¡  |jrJ dƒ‚| j |¡ |  || j¡ |  || j¡ |S )a9  
        Create a model for post-training quantization.

        The quantization configuration will be propagated in the model.
        And it will insert observers into the model to collect and compute
        quantization parameters.

        Args:
            model(Layer): The model to be quantized.
            inplace(bool): Whether to modify the model in-place.

        Return: The prepared model for post-training quantization.

        Examples:
            .. code-block:: python

                >>> from paddle.quantization import PTQ, QuantConfig
                >>> from paddle.quantization.observers import AbsmaxObserver
                >>> from paddle.vision.models import LeNet

                >>> observer = AbsmaxObserver()
                >>> q_config = QuantConfig(activation=observer, weight=observer)
                >>> ptq = PTQ(q_config)
                >>> model = LeNet()
                >>> model.eval()
                >>> quant_model = ptq.quantize(model)
                >>> print(quant_model)
                LeNet(
                  (features): Sequential(
                    (0): QuantedConv2D(
                      (weight_quanter): AbsmaxObserverLayer()
                      (activation_quanter): AbsmaxObserverLayer()
                    )
                    (1): ObserveWrapper(
                      (_observer): AbsmaxObserverLayer()
                      (_observed): ReLU()
                    )
                    (2): ObserveWrapper(
                      (_observer): AbsmaxObserverLayer()
                      (_observed): MaxPool2D(kernel_size=2, stride=2, padding=0)
                    )
                    (3): QuantedConv2D(
                      (weight_quanter): AbsmaxObserverLayer()
                      (activation_quanter): AbsmaxObserverLayer()
                    )
                    (4): ObserveWrapper(
                      (_observer): AbsmaxObserverLayer()
                      (_observed): ReLU()
                    )
                    (5): ObserveWrapper(
                      (_observer): AbsmaxObserverLayer()
                      (_observed): MaxPool2D(kernel_size=2, stride=2, padding=0)
                    )
                  )
                  (fc): Sequential(
                    (0): QuantedLinear(
                      (weight_quanter): AbsmaxObserverLayer()
                      (activation_quanter): AbsmaxObserverLayer()
                    )
                    (1): QuantedLinear(
                      (weight_quanter): AbsmaxObserverLayer()
                      (activation_quanter): AbsmaxObserverLayer()
                    )
                    (2): QuantedLinear(
                      (weight_quanter): AbsmaxObserverLayer()
                      (activation_quanter): AbsmaxObserverLayer()
                    )
                  )
                )
        z3'inplace' is not compatible with parallel training.zjPost-Training Quantization should not work on training models. Please set evaluation mode by model.eval().)	r   ÚcopyÚdeepcopyÚevalZtrainingÚ_configZ_specifyZ_convert_to_quant_layersZ_insert_activation_observers)r   r   r   Ú_modelr   r   r   Úquantize.   s   G
ÿ
ÿzPTQ.quantize)r
   r   r   r   )F)r   r   r   r   r   r   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   r   r   Ú__classcell__r   r   r   r   r	      s
    	r	   )Ú
__future__r   r   Útypingr   Zpaddle.distributedr   r   r   Z	paddle.nnr   r
   r   r	   r   r   r   r   Ú<module>   s   