U
    yc                      @   s`   d dl mZmZmZmZmZ ddlmZ ddlm	Z	m
Z
mZ G dd deZG dd deZd	S )
    )DictList
NamedTupleOptionalUnion   )CharSetProber)CharacterCategoryProbingStateSequenceLikelihoodc                   @   s^   e Zd ZU eed< eed< eeef ed< eeeeef f ed< eed< eed< eed< dS )	SingleByteCharSetModelcharset_namelanguagechar_to_order_maplanguage_modeltypical_positive_ratiokeep_ascii_lettersZalphabetN)	__name__
__module____qualname__str__annotations__r   intfloatbool r   r   B/tmp/pip-build-0we0fmvo/pip/pip/_vendor/chardet/sbcharsetprober.pyr   #   s   
r   c                       s   e Zd ZdZdZdZdZdeee	e
 dd fdd	Zdd
 fddZee	e d
ddZee	e d
ddZeeef edddZed
ddZ  ZS )SingleByteCharSetProber@   i   gffffff?g?FN)modelis_reversedname_proberreturnc                    sL   t    || _|| _|| _d| _g | _d| _d| _d| _	d| _
|   d S N   r   )super__init___model	_reversed_name_prober_last_order_seq_counters_total_seqs_total_char_control_char
_freq_charreset)selfr   r    r!   	__class__r   r   r&   3   s    
z SingleByteCharSetProber.__init__)r"   c                    s<   t    d| _dgt  | _d| _d| _d| _d| _	d S r#   )
r%   r0   r*   r   get_num_categoriesr+   r,   r-   r.   r/   r1   r2   r   r   r0   G   s    
zSingleByteCharSetProber.resetc                 C   s   | j r| j jS | jjS N)r)   r   r'   r5   r   r   r   r   R   s    z$SingleByteCharSetProber.charset_namec                 C   s   | j r| j jS | jjS r6   )r)   r   r'   r5   r   r   r   r   X   s    z SingleByteCharSetProber.language)byte_strr"   c           	      C   sV  | j js| |}n
| |}|s(| jS | j j}| j j}|D ]}||tj	}|tj
k rf|  jd7  _|| jk r|  jd7  _| j| jk r|  jd7  _| js|| j | }n|| | j }| j|  d7  < || _q<| j j}| jtjkrP| j| jkrP|  }|| jkr(| jd|| tj| _n(|| jk rP| jd||| j tj| _| jS )Nr   z$%s confidence = %s, we have a winnerz8%s confidence = %s, below negative shortcut threshold %s)r'   r   filter_international_wordsZremove_xml_tagsstater   r   getr	   	UNDEFINEDCONTROLr-   SAMPLE_SIZEr/   r*   r,   r(   r+   r   r
   	DETECTINGSB_ENOUGH_REL_THRESHOLDget_confidencePOSITIVE_SHORTCUT_THRESHOLDloggerdebugFOUND_IT_stateNEGATIVE_SHORTCUT_THRESHOLDNOT_ME)	r1   r7   r   r   charorderZlm_catr   
confidencer   r   r   feed^   sP    


  
zSingleByteCharSetProber.feedc                 C   sn   d}| j dkrj| jtj d| jtj   | j  | jj }|| j| j  | j }|| j	 | j }|dkrjd}|S )Ng{Gz?r   g      ?g      ?gGz?)
r,   r+   r   POSITIVELIKELYr'   r   r-   r.   r/   )r1   rr   r   r   r@      s    

z&SingleByteCharSetProber.get_confidence)FN)r   r   r   r=   r?   rA   rF   r   r   r   r   r&   r0   propertyr   r   r   r   bytes	bytearrayr
   rK   r   r@   __classcell__r   r   r2   r   r   -   s&     2r   N)typingr   r   r   r   r   charsetproberr   enumsr	   r
   r   r   r   r   r   r   r   <module>   s   
