U
    yc}                     @   s  d Z ddlZddlZddlZddlmZmZ ddlmZ ddl	m
Z
mZmZmZ ddlmZmZmZmZmZmZ ddlmZ dd	d
dddddddddgZdddddgZedd ZG dd deZG dd dedZG dd deZG d d deZ G d!d" d"Z!e! Z"G d#d$ d$e#Z$G d%d& d&Z%d'd Z&G d(d) d)Z'e' Z(d*d Z)G d+d dZ*G d,d deZ+G d-d. d.eZ,G d/d	 d	ee,dZ-G d0d dZ.G d1d
 d
e-Z/d2d3 Z0G d4d5 d5e,Z1G d6d7 d7e-e1dZ2dS )8z
    pygments.lexer
    ~~~~~~~~~~~~~~

    Base lexer classes.

    :copyright: Copyright 2006-2022 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details.
    N)apply_filtersFilter)get_filter_by_name)ErrorTextOther
_TokenType)get_bool_optget_int_optget_list_optmake_analysatorFutureguess_decode)	regex_optLexer
RegexLexerExtendedRegexLexerDelegatingLexerLexerContextincludeinheritbygroupsusingthisdefaultwords)s   ﻿utf-8)s     zutf-32)s     zutf-32be)s   zutf-16)s   zutf-16bec                 C   s   dS )N         xr   r   9/tmp/pip-build-0we0fmvo/pip/pip/_vendor/pygments/lexer.py<lambda>!       r"   c                   @   s   e Zd ZdZdd ZdS )	LexerMetaz
    This metaclass automagically converts ``analyse_text`` methods into
    static methods which always return float values.
    c                 C   s(   d|krt |d |d< t| |||S )Nanalyse_text)r   type__new__)Zmcsnamebasesdr   r   r!   r'   *   s    zLexerMeta.__new__N)__name__
__module____qualname____doc__r'   r   r   r   r!   r$   $   s   r$   c                   @   s^   e Zd ZdZdZdZg Zg Zg Zg Z	dZ
dd Zdd Zdd	 Zd
d ZdddZdd ZdS )r   a  
    Lexer for a specific language.

    Basic options recognized:
    ``stripnl``
        Strip leading and trailing newlines from the input (default: True).
    ``stripall``
        Strip all leading and trailing whitespace from the input
        (default: False).
    ``ensurenl``
        Make sure that the input ends with a newline (default: True).  This
        is required for some lexers that consume input linewise.

        .. versionadded:: 1.3

    ``tabsize``
        If given and greater than 0, expand tabs in the input (default: 0).
    ``encoding``
        If given, must be an encoding name. This encoding will be used to
        convert the input string to Unicode, if it is not already a Unicode
        string (default: ``'guess'``, which uses a simple UTF-8 / Locale /
        Latin1 detection.  Can also be ``'chardet'`` to use the chardet
        library, if it is installed.
    ``inencoding``
        Overrides the ``encoding`` if given.
    Nr   c                 K   s   || _ t|dd| _t|dd| _t|dd| _t|dd| _|dd	| _|d
pZ| j| _g | _	t
|ddD ]}| | qpd S )NstripnlTstripallFensurenltabsizer   encodingguessZ
inencodingfiltersr   )optionsr	   r/   r0   r1   r
   r2   getr3   r5   r   
add_filter)selfr6   filter_r   r   r!   __init__a   s    zLexer.__init__c                 C   s(   | j rd| jj| j f S d| jj S d S )Nz<pygments.lexers.%s with %r>z<pygments.lexers.%s>)r6   	__class__r+   r9   r   r   r!   __repr__m   s
    zLexer.__repr__c                 K   s&   t |tst|f|}| j| dS )z8
        Add a new stream filter to this lexer.
        N)
isinstancer   r   r5   append)r9   r:   r6   r   r   r!   r8   t   s    
zLexer.add_filterc                 C   s   dS )a~  
        Has to return a float between ``0`` and ``1`` that indicates
        if a lexer wants to highlight this text. Used by ``guess_lexer``.
        If this method returns ``0`` it won't highlight it in any case, if
        it returns ``1`` highlighting with this lexer is guaranteed.

        The `LexerMeta` metaclass automatically wraps this function so
        that it works like a static method (no ``self`` or ``cls``
        parameter) and the return value is automatically converted to
        `float`. If the return value is an object that is boolean `False`
        it's the same as if the return values was ``0.0``.
        Nr   )textr   r   r!   r%   |   s    zLexer.analyse_textFc              
      s  t ts jdkr$t\}nވ jdkrzddlm} W n, tk
rj } ztd|W 5 d}~X Y nX d}tD ].\}}|rtt	|d 
|d} qqt|dkr|dd }	
|	d	pd
d}|n(
 jdr t	dd ndr t	dd dddd jrJ n jr\d jdkrt j jrdsd7  fdd}
|
 }|st| j }|S )a=  
        Return an iterable of (tokentype, value) pairs generated from
        `text`. If `unfiltered` is set to `True`, the filtering mechanism
        is bypassed even if filters are defined.

        Also preprocess the text, i.e. expand tabs and strip it if
        wanted and applies registered filters.
        r4   chardetr   )rB   zkTo enable chardet encoding guessing, please install the chardet library from http://chardet.feedparser.org/Nreplacei   r3   r   u   ﻿z

c                  3   s$     D ]\} }}||fV  q
d S N)get_tokens_unprocessed)_tvr9   rA   r   r!   streamer   s    z"Lexer.get_tokens.<locals>.streamer)r?   strr3   r   pip._vendorrB   ImportError_encoding_map
startswithlendecodedetectr7   rC   r0   stripr/   r2   
expandtabsr1   endswithr   r5   )r9   rA   Z
unfilteredrH   rB   edecodedbomr3   encrL   streamr   rK   r!   
get_tokens   sR    	




zLexer.get_tokensc                 C   s   t dS )z
        Return an iterable of (index, tokentype, value) pairs where "index"
        is the starting position of the token within the input text.

        In subclasses, implement this method as a generator to
        maximize effectiveness.
        N)NotImplementedErrorrK   r   r   r!   rG      s    zLexer.get_tokens_unprocessed)F)r+   r,   r-   r.   r(   urlaliases	filenamesZalias_filenames	mimetypespriorityr;   r>   r8   r%   r]   rG   r   r   r   r!   r   0   s   
;)	metaclassc                   @   s$   e Zd ZdZefddZdd ZdS )r   a   
    This lexer takes two lexer as arguments. A root lexer and
    a language lexer. First everything is scanned using the language
    lexer, afterwards all ``Other`` tokens are lexed using the root
    lexer.

    The lexers from the ``template`` lexer package use this base lexer.
    c                 K   s0   |f || _ |f || _|| _tj| f| d S rF   )
root_lexerlanguage_lexerneedler   r;   )r9   Z_root_lexerZ_language_lexerZ_needler6   r   r   r!   r;      s    zDelegatingLexer.__init__c                 C   s   d}g }g }| j |D ]H\}}}|| jkrP|rF|t||f g }||7 }q||||f q|rx|t||f t|| j|S )N )rf   rG   rg   r@   rR   do_insertionsre   )r9   rA   Zbuffered
insertionsZ
lng_bufferirI   rJ   r   r   r!   rG      s    


z&DelegatingLexer.get_tokens_unprocessedN)r+   r,   r-   r.   r   r;   rG   r   r   r   r!   r      s   	c                   @   s   e Zd ZdZdS )r   zI
    Indicates that a state should include rules from another state.
    Nr+   r,   r-   r.   r   r   r   r!   r      s   c                   @   s   e Zd ZdZdd ZdS )_inheritzC
    Indicates the a state should inherit from its superclass.
    c                 C   s   dS )Nr   r   r=   r   r   r!   r>     s    z_inherit.__repr__N)r+   r,   r-   r.   r>   r   r   r   r!   rm      s   rm   c                   @   s    e Zd ZdZdd Zdd ZdS )combinedz:
    Indicates a state combined from multiple states.
    c                 G   s   t | |S rF   )tupler'   )clsargsr   r   r!   r'     s    zcombined.__new__c                 G   s   d S rF   r   )r9   rq   r   r   r!   r;     s    zcombined.__init__N)r+   r,   r-   r.   r'   r;   r   r   r   r!   rn     s   rn   c                   @   sF   e Zd ZdZdd ZdddZdddZdd	d
Zdd Zdd Z	dS )_PseudoMatchz:
    A pseudo match object constructed from a string.
    c                 C   s   || _ || _d S rF   )_text_start)r9   startrA   r   r   r!   r;     s    z_PseudoMatch.__init__Nc                 C   s   | j S rF   )rt   r9   argr   r   r!   ru     s    z_PseudoMatch.startc                 C   s   | j t| j S rF   )rt   rR   rs   rv   r   r   r!   end!  s    z_PseudoMatch.endc                 C   s   |rt d| jS )NzNo such group)
IndexErrorrs   rv   r   r   r!   group$  s    z_PseudoMatch.groupc                 C   s   | j fS rF   )rs   r=   r   r   r!   groups)  s    z_PseudoMatch.groupsc                 C   s   i S rF   r   r=   r   r   r!   	groupdict,  s    z_PseudoMatch.groupdict)N)N)N)
r+   r,   r-   r.   r;   ru   rx   rz   r{   r|   r   r   r   r!   rr     s   


rr   c                     s   d fdd	}|S )zL
    Callback that yields multiple actions for each group in the match.
    Nc                 3   s   t  D ]\}}|d krqqt|tkrR||d }|r||d ||fV  q||d }|d k	r|r|||d |_|| t||d ||D ]}|r|V  qq|r| |_d S )N   )	enumerater&   r   rz   ru   posrr   rx   )lexermatchctxrk   actiondataitemrq   r   r!   callback4  s&     
zbygroups.<locals>.callback)Nr   )rq   r   r   r   r!   r   0  s    c                   @   s   e Zd ZdZdS )_ThiszX
    Special singleton used for indicating the caller class.
    Used by ``using``.
    Nrl   r   r   r   r!   r   J  s   r   c                    sj   i dkr: d}t|ttfr.|d< nd|fd<  tkrTdfdd	}nd	 fdd	}|S )
a  
    Callback that processes the match with a different lexer.

    The keyword arguments are forwarded to the lexer, except `state` which
    is handled separately.

    `state` specifies the state that the new lexer will start in, and can
    be an enumerable such as ('root', 'inline', 'string') or a simple
    string which is assumed to be on top of the root state.

    Note: For that to work, `_other` must not be an `ExtendedRegexLexer`.
    statestackrootNc                 3   sj   r | j | jf }n| }| }|j| f D ]\}}}|| ||fV  q<|rf| |_d S rF   )updater6   r<   ru   rG   rz   rx   r   r   r   r   Zlxsrk   rI   rJ   )	gt_kwargskwargsr   r!   r   i  s    zusing.<locals>.callbackc                 3   s^    | j  f }| }|j| fD ]\}}}|| ||fV  q0|rZ| |_d S rF   )r   r6   ru   rG   rz   rx   r   r   _otherr   r   r   r!   r   x  s    
)N)N)popr?   listro   r   )r   r   r   r   r   r   r!   r   S  s    


c                   @   s   e Zd ZdZdd ZdS )r   z
    Indicates a state or state action (e.g. #pop) to apply.
    For example default('#pop') is equivalent to ('', Token, '#pop')
    Note that state tuples may be used as well.

    .. versionadded:: 2.0
    c                 C   s
   || _ d S rF   )r   )r9   r   r   r   r!   r;     s    zdefault.__init__N)r+   r,   r-   r.   r;   r   r   r   r!   r     s   c                   @   s"   e Zd ZdZdddZdd ZdS )	r   z
    Indicates a list of literal words that is transformed into an optimized
    regex that matches any of the words.

    .. versionadded:: 2.0
    rh   c                 C   s   || _ || _|| _d S rF   )r   prefixsuffix)r9   r   r   r   r   r   r!   r;     s    zwords.__init__c                 C   s   t | j| j| jdS )Nr   r   )r   r   r   r   r=   r   r   r!   r7     s    z	words.getN)rh   rh   )r+   r,   r-   r.   r;   r7   r   r   r   r!   r     s   
c                   @   sJ   e Zd ZdZdd Zdd Zdd Zdd	 ZdddZdd Z	dd Z
d
S )RegexLexerMetazw
    Metaclass for RegexLexer, creates the self._tokens attribute from
    self.tokens on the first instantiation.
    c                 C   s    t |tr| }t||jS )zBPreprocess the regular expression component of a token definition.)r?   r   r7   recompiler   )rp   regexrflagsr   r   r   r!   _process_regex  s    
zRegexLexerMeta._process_regexc                 C   s&   t |tks"t|s"td|f |S )z5Preprocess the token component of a token definition.z2token type must be simple type or callable, not %r)r&   r   callableAssertionError)rp   tokenr   r   r!   _process_token  s    zRegexLexerMeta._process_tokenc                 C   s  t |trd|dkrdS ||kr$|fS |dkr0|S |dd dkrRt|dd  S dsbtd| nt |trd	| j }|  jd
7  _g }|D ],}||kstd| || ||| q|||< |fS t |tr |D ] }||ks|dkstd| q|S dstd| dS )z=Preprocess the state transition action of a token definition.#pop#pushN   z#pop:Fzunknown new state %rz_tmp_%dr}   zcircular state ref %r)r   r   zunknown new state zunknown new state def %r)	r?   rM   intr   rn   _tmpnameextend_process_statero   )rp   	new_stateunprocessed	processedZ	tmp_stateitokensZistater   r   r!   _process_new_state  s>    



 z!RegexLexerMeta._process_new_statec                 C   s  t |tkstd| |d dks0td| ||kr@|| S g  }||< | j}|| D ].}t|tr||ks~td| || ||t| qZt|trqZt|t	r| 
|j||}|tdjd|f qZt |tkstd| z| |d ||}W n> tk
rD }	 ztd	|d || |	f |	W 5 d}	~	X Y nX | |d
 }
t|dkrhd}n| 
|d ||}|||
|f qZ|S )z%Preprocess a single state definition.zwrong state name %rr   #zinvalid state name %rzcircular state reference %rrh   Nzwrong rule def %rz+uncompilable regex %r in state %r of %r: %sr}      )r&   rM   r   flagsr?   r   r   r   rm   r   r   r   r@   r   r   r   ro   r   	Exception
ValueErrorr   rR   )rp   r   r   r   tokensr   Ztdefr   rexerrr   r   r   r!   r     sJ    



 zRegexLexerMeta._process_stateNc                 C   s<   i  }| j |< |p| j| }t|D ]}| ||| q$|S )z-Preprocess a dictionary of token definitions.)_all_tokensr   r   r   )rp   r(   	tokendefsr   r   r   r   r!   process_tokendef  s
    zRegexLexerMeta.process_tokendefc           
   
   C   s   i }i }| j D ]}|jdi }| D ]\}}||}|dkr||||< z|t}W n tk
rp   Y q(Y nX |||< q(||d}|dkrq(||||d < z|t}	W n tk
r   Y q(X ||	 ||< q(q|S )a  
        Merge tokens from superclasses in MRO order, returning a single tokendef
        dictionary.

        Any state that is not defined by a subclass will be inherited
        automatically.  States that *are* defined by subclasses will, by
        default, override that state in the superclass.  If a subclass wishes to
        inherit definitions from a superclass, it can use the special value
        "inherit", which will cause the superclass' state definition to be
        included at that point in the state.
        r   Nr}   )__mro____dict__r7   itemsindexr   r   r   )
rp   r   inheritablectoksr   r   ZcuritemsZinherit_ndxZnew_inh_ndxr   r   r!   get_tokendefs
  s0    


zRegexLexerMeta.get_tokendefsc                 O   sL   d| j kr:i | _d| _t| dr(| jr(n| d|  | _tj	| f||S )z:Instantiate cls after preprocessing its token definitions._tokensr   token_variantsrh   )
r   r   r   hasattrr   r   r   r   r&   __call__)rp   rq   kwdsr   r   r!   r   ;  s    
zRegexLexerMeta.__call__)N)r+   r,   r-   r.   r   r   r   r   r   r   r   r   r   r   r!   r     s   #,
1r   c                   @   s$   e Zd ZdZejZi ZdddZdS )r   z
    Base for simple stateful regular expression-based lexers.
    Simplifies the lexing process so that you need only
    provide a list of states and regular expressions.
    r   c                 c   s  d}| j }t|}||d  }|D ](\}}}	|||}
|
r"|dk	rrt|tkrb|||
 fV  n|| |
E dH  |
 }|	dk	rHt|	tr|	D ]D}|dkrt|dkr|	  q|dkr|
|d  q|
| qnbt|	trt|	t|kr|dd= n
||	d= n,|	dkr*|
|d  nds<td|	 ||d  } qq"zP|| d	krd
g}|d
 }|td	fV  |d7 }W q|t|| fV  |d7 }W q tk
r   Y qY qX qdS )z~
        Split ``text`` into (tokentype, text) pairs.

        ``stack`` is the initial stack (default: ``['root']``)
        r   r   Nr   r}   r   Fwrong state def: %rrD   r   )r   r   r&   r   rz   rx   r?   ro   rR   r   r@   r   absr   r   r   ry   )r9   rA   r   r   r   Z
statestackstatetokensrexmatchr   r   mr   r   r   r!   rG   l  sR    




z!RegexLexer.get_tokens_unprocessedN)r   )	r+   r,   r-   r.   r   	MULTILINEr   r   rG   r   r   r   r!   r   I  s   c                   @   s"   e Zd ZdZdddZdd ZdS )r   z9
    A helper object that holds lexer position data.
    Nc                 C   s*   || _ || _|pt|| _|p"dg| _d S )Nr   )rA   r   rR   rx   r   )r9   rA   r   r   rx   r   r   r!   r;     s    zLexerContext.__init__c                 C   s   d| j | j| jf S )NzLexerContext(%r, %r, %r))rA   r   r   r=   r   r   r!   r>     s
      zLexerContext.__repr__)NN)r+   r,   r-   r.   r;   r>   r   r   r   r!   r     s   
c                   @   s   e Zd ZdZdddZdS )r   zE
    A RegexLexer that uses a context object to store its state.
    Nc                 c   s<  | j }|st|d}|d }n|}||jd  }|j}|D ]`\}}}|||j|j}	|	r:|dk	rt|tkr|j||	 fV  |	 |_n$|| |	|E dH  |s||jd  }|dk	rt	|t
r|D ]P}
|
dkrt|jdkr|j  q|
dkr|j|jd  q|j|
 qnlt	|trZt|t|jkrL|jdd= n|j|d= n0|dkrx|j|jd  ndstd	| ||jd  } q6q:zz|j|jkrW q8||j d
krdg|_|d }|jtd
fV  | jd7  _W q6|jt||j fV  | jd7  _W q6 tk
r4   Y q8Y q6X q6dS )z
        Split ``text`` into (tokentype, text) pairs.
        If ``context`` is given, use this lexer context instead.
        r   r   r   Nr   r}   r   Fr   rD   )r   r   r   rA   r   rx   r&   r   rz   r?   ro   rR   r   r@   r   r   r   r   r   ry   )r9   rA   contextr   r   r   r   r   r   r   r   r   r   r!   rG     s`    




z)ExtendedRegexLexer.get_tokens_unprocessed)NN)r+   r,   r-   r.   rG   r   r   r   r!   r     s   c              	   c   s  t | } zt| \}}W n  tk
r8   |E dH  Y dS X d}d}|D ]\}}}|dkr\|}d}	|r|t| |kr||	||  }
|
r|||
fV  |t|
7 }|D ]"\}}}|||fV  |t|7 }q|| }	zt| \}}W q` tk
r   d}Y qY q`X q`|	t|k rF||||	d fV  |t||	 7 }qF|r|pHd}|D ]$\}}}|||fV  |t|7 }qNzt| \}}W n  tk
r   d}Y qY nX q:dS )ag  
    Helper for lexers which must combine the results of several
    sublexers.

    ``insertions`` is a list of ``(index, itokens)`` pairs.
    Each ``itokens`` iterable should be inserted at position
    ``index`` into the token stream given by the ``tokens``
    argument.

    The result is a combined token stream.

    TODO: clean up the code here.
    NTr   F)iternextStopIterationrR   )rj   r   r   r   realposZinsleftrk   rI   rJ   ZoldiZtmpvalZit_indexZit_tokenZit_valuepr   r   r!   ri     sN    

ri   c                   @   s   e Zd ZdZdd ZdS )ProfilingRegexLexerMetaz>Metaclass for ProfilingRegexLexer, collects regex timing info.c                    sL   t |tr t|j|j|jdn|t|tjf fdd	}|S )Nr   c                    s`    j d fddg}t }| ||}t }|d  d7  < |d  || 7  < |S )Nr   r   r   r}   )
_prof_data
setdefaulttimer   )rA   r   endposinfot0rest1rp   Zcompiledr   r   r   r!   
match_funcM  s    z:ProfilingRegexLexerMeta._process_regex.<locals>.match_func)	r?   r   r   r   r   r   r   sysmaxsize)rp   r   r   r   r   r   r   r!   r   E  s    

z&ProfilingRegexLexerMeta._process_regexN)r+   r,   r-   r.   r   r   r   r   r!   r   B  s   r   c                   @   s"   e Zd ZdZg ZdZdddZdS )ProfilingRegexLexerzFDrop-in replacement for RegexLexer that does profiling of its regexes.   r   c                 #   s    j ji  t ||E d H   j j }tdd | D  fdddd}tdd |D }t	  t	d j j
t||f  t	d	 t	d
d  t	d |D ]}t	d|  qt	d	 d S )Nc                 s   sN   | ]F\\}}\}}|t |d dddd |d| d| | fV  qdS )zu'z\\\NA   i  )reprrU   rC   ).0r   rnrI   r   r   r!   	<genexpr>c  s     
z=ProfilingRegexLexer.get_tokens_unprocessed.<locals>.<genexpr>c                    s
   |  j  S rF   )_prof_sort_indexr   r=   r   r!   r"   f  r#   z<ProfilingRegexLexer.get_tokens_unprocessed.<locals>.<lambda>T)keyreversec                 s   s   | ]}|d  V  qdS )   Nr   )r   r    r   r   r!   r   h  s     z2Profiling result for %s lexing %d chars in %.3f mszn==============================================================================================================z$%-20s %-64s ncalls  tottime  percall)r   r   zn--------------------------------------------------------------------------------------------------------------z%-20s %-65s %5d %8.4f %8.4f)r<   r   r@   r   rG   r   sortedr   sumprintr+   rR   )r9   rA   r   rawdatar   Z	sum_totalr*   r   r=   r!   rG   ^  s(    
z*ProfilingRegexLexer.get_tokens_unprocessedN)r   )r+   r,   r-   r.   r   r   rG   r   r   r   r!   r   X  s   r   )3r.   r   r   r   Zpip._vendor.pygments.filterr   r   Zpip._vendor.pygments.filtersr   Zpip._vendor.pygments.tokenr   r   r   r   Zpip._vendor.pygments.utilr	   r
   r   r   r   r   Zpip._vendor.pygments.regexoptr   __all__rP   staticmethodZ_default_analyser&   r$   r   r   rM   r   rm   r   ro   rn   rr   r   r   r   r   r   r   r   r   r   r   ri   r   r   r   r   r   r!   <module>   s`   
        !'2 )aH@