£Á°èZ¨Ä…–K§‚«“ô4“ÒÙ´dîfUÙÃÅ WKbyÊ¦•êŽ…È®FÒ¿ÊÎóCozá¬S@6{Í:›œêZÌ:Š•_%:¢¾¾~;‘Ã~èŠ©ÊÇí`ÔÑ©úë™µ'5I¿fš×WO%ø9¾«¾DK|€ùÍD”Ýs]nHÕ¶ê×Ó¼ãžªéUWŸÈË%DÒÕ¬ï‘]/Åcx  ‰ï2ß]ä6G[]S£ÔÏ¯rs{úëóµmÒï#UQxo·õÞCe]"±/aÙ&Eã4ú9Jé_ÞåëdãöKë)AÞ                  ¯¹ægƒÛowÐø^d™ý½ßB7áyMä9ÜÖUã
!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
<html>

Re                 @   sB   d  d l  Z  d  d l Z d d l m Z Gd d   d e  Z d S)    N   )ProbingStatec               @   s   e  Z d  Z d Z d d d  Z d d   Z e d d    Z d	 d
   Z e d d    Z	 d d   Z
 e d d    Z e d d    Z e d d    Z d S)CharSetProbergffffff?Nc             C   s(   d  |  _  | |  _ t j t  |  _ d  S)N)_statelang_filterlogging	getLogger__name__logger)selfr    r   /builddir/build/BUILDROOT/alt-python35-pip-20.2.4-5.el8.x86_64/opt/alt/python35/lib/python3.5/site-packages/pip/_vendor/chardet/charsetprober.py__init__'   s    		zCharSetProber.__init__c             C   s   t  j |  _ d  S)N)r   	DETECTINGr   )r   r   r   r   reset,   s    zCharSetProber.resetc             C   s   d  S)Nr   )r   r   r   r   charset_name/   s    zCharSetProber.charset_namec             C   s   d  S)Nr   )r   bufr   r   r   feed3   s    zCharSetProber.feedc             C   s   |  j  S)N)r   )r   r   r   r   state6   s    zCharSetProber.statec             C   s   d S)Ng        r   )r   r   r   r   get_confidence:   s    zCharSetProber.get_confidencec             C   s   t  j d d |   }  |  S)Ns   ([ -])+    )resub)r   r   r   r   filter_high_byte_only=   s    z#CharSetProber.filter_high_byte_onlyc             C   s   t    } t j d |   } xa | D]Y } | j | d d   | d d  } | j   rn | d k  rn d } | j |  q" W| S)u9  
        We define three types of bytes:
        alphabet: english alphabets [a-zA-Z]
        international: international characters [-ÿ]
        marker: everything else [^a-zA-Z-ÿ]

        The input buffer can be thought to contain a series of words delimited
        by markers. This function works to filter all words that contain at
        least one international character. All contiguous sequences of markers
        are replaced by a single space ascii character.

        This filter applies to all scripts which do not use English characters.
        s%   [a-zA-Z]*[-]+[a-zA-Z]*[^a-zA-Z-]?Nr   s   r   r   )	bytearrayr   findallextendisalpha)r   filteredwordsword	last_charr   r   r   filter_international_wordsB   s    			z(CharSetProber.filter_international_wordsc             C   s   t    } d } d } x t t |    D] } |  | | d  } | d k rW d } n | d k ri d } | d k  r( | j   r( | | k r | r | j |  | |   | j d  | d } q( W| s | j |  | d	   | S)
a  
        Returns a copy of ``buf`` that retains only the sequences of English
        alphabet and high byte characters that are not between <> characters.
        Also retains English alphabet and high byte characters immediately
        before occurrences of >.

        This filter can be applied to all scripts which contain both English
        characters and extended ASCII characters, but is currently only used by
        ``Latin1Prober``.
        Fr   r      >   <Ts   r   N)r   rangelenr   r   )r   r   in_tagprevcurrbuf_charr   r   r   filter_with_english_lettersg   s"    		z)CharSetProber.filter_with_english_letters)r	   
__module____qualname__SHORTCUT_THRESHOLDr   r   propertyr   r   r   r   staticmethodr   r#   r,   r   r   r   r   r   #   s   %r   )r   r   enumsr   objectr   r   r   r   r   <module>   s   