U
    `a[Ny                     @   s  d Z ddlmZ ddlZddlZddlZddlmZmZ ddl	m
Z
 ddlmZmZmZmZ ddlmZmZmZmZmZmZmZmZmZ ddlmZ d	d
ddddddddddgZdddddgZedd ZG dd de Z!ee!G dd	 d	e"Z#G dd de#Z$G d d de%Z&G d!d" d"e"Z'e' Z(G d#d$ d$e)Z*G d%d& d&e"Z+d'd Z,G d(d) d)e"Z-e- Z.d*d Z/G d+d dZ0G d,d deZ1G d-d. d.e!Z2ee2G d/d
 d
e#Z3G d0d de"Z4G d1d de3Z5d2d3 Z6G d4d5 d5e2Z7ee7G d6d7 d7e3Z8dS )8z
    pygments.lexer
    ~~~~~~~~~~~~~~

    Base lexer classes.

    :copyright: Copyright 2006-2017 by the Pygments team, see AUTHORS.
    :license: BSD, see LICENSE for details.
    )print_functionN)apply_filtersFilter)get_filter_by_name)ErrorTextOther
_TokenType)	get_bool_optget_int_optget_list_optmake_analysator	text_typeadd_metaclass	iteritemsFutureguess_decode)	regex_optLexer
RegexLexerExtendedRegexLexerDelegatingLexerLexerContextincludeinheritbygroupsusingthisdefaultwords)s   ﻿utf-8)s     zutf-32)s     zutf-32be)s   zutf-16)s   zutf-16bec                 C   s   dS )N         xr"   r"   0/usr/lib/python3/dist-packages/pygments/lexer.py<lambda>$       r&   c                   @   s   e Zd ZdZdd ZdS )	LexerMetaz
    This metaclass automagically converts ``analyse_text`` methods into
    static methods which always return float values.
    c                 C   s(   d|krt |d |d< t| |||S )Nanalyse_text)r   type__new__)Zmcsnamebasesdr"   r"   r%   r+   -   s    zLexerMeta.__new__N)__name__
__module____qualname____doc__r+   r"   r"   r"   r%   r(   '   s   r(   c                   @   sZ   e Zd ZdZdZg Zg Zg Zg ZdZ	dd Z
dd Zdd	 Zd
d ZdddZdd ZdS )r   a  
    Lexer for a specific language.

    Basic options recognized:
    ``stripnl``
        Strip leading and trailing newlines from the input (default: True).
    ``stripall``
        Strip all leading and trailing whitespace from the input
        (default: False).
    ``ensurenl``
        Make sure that the input ends with a newline (default: True).  This
        is required for some lexers that consume input linewise.

        .. versionadded:: 1.3

    ``tabsize``
        If given and greater than 0, expand tabs in the input (default: 0).
    ``encoding``
        If given, must be an encoding name. This encoding will be used to
        convert the input string to Unicode, if it is not already a Unicode
        string (default: ``'guess'``, which uses a simple UTF-8 / Locale /
        Latin1 detection.  Can also be ``'chardet'`` to use the chardet
        library, if it is installed.
    ``inencoding``
        Overrides the ``encoding`` if given.
    Nr   c                 K   s   || _ t|dd| _t|dd| _t|dd| _t|dd| _|dd	| _|d
pZ| j| _g | _	t
|ddD ]}| | qpd S )NstripnlTstripallFensurenltabsizer   encodingguessZ
inencodingfiltersr"   )optionsr
   r3   r4   r5   r   r6   getr7   r9   r   
add_filter)selfr:   filter_r"   r"   r%   __init__b   s    zLexer.__init__c                 C   s(   | j rd| jj| j f S d| jj S d S )Nz<pygments.lexers.%s with %r>z<pygments.lexers.%s>)r:   	__class__r/   r=   r"   r"   r%   __repr__n   s
    zLexer.__repr__c                 K   s&   t |tst|f|}| j| dS )z8
        Add a new stream filter to this lexer.
        N)
isinstancer   r   r9   append)r=   r>   r:   r"   r"   r%   r<   u   s    
zLexer.add_filterc                 C   s   dS )a~  
        Has to return a float between ``0`` and ``1`` that indicates
        if a lexer wants to highlight this text. Used by ``guess_lexer``.
        If this method returns ``0`` it won't highlight it in any case, if
        it returns ``1`` highlighting with this lexer is guaranteed.

        The `LexerMeta` metaclass automatically wraps this function so
        that it works like a static method (no ``self`` or ``cls``
        parameter) and the return value is automatically converted to
        `float`. If the return value is an object that is boolean `False`
        it's the same as if the return values was ``0.0``.
        Nr"   )textr"   r"   r%   r)   }   s    zLexer.analyse_textFc                    s  t ts jdkr"t\}nȈ jdkrzddl}W n tk
rT   tdY nX d}tD ].\}}|r^t|d 	|d} qq^|dkr|
dd }	|dpd	d}|n&	 jd
rtd
d nd
rtd
d dddd jr2 n jrDd jdkr\ j jrxdsxd7  fdd}	|	 }
|st|
 j }
|
S )a=  
        Return an iterable of (tokentype, value) pairs generated from
        `text`. If `unfiltered` is set to `True`, the filtering mechanism
        is bypassed even if filters are defined.

        Also preprocess the text, i.e. expand tabs and strip it if
        wanted and applies registered filters.
        r8   chardetr   NzkTo enable chardet encoding guessing, please install the chardet library from http://chardet.feedparser.org/replacei   r7   r    u   ﻿z

c                  3   s$     D ]\} }}||fV  q
d S N)get_tokens_unprocessed)_tvr=   rE   r"   r%   streamer   s    z"Lexer.get_tokens.<locals>.streamer)rC   r   r7   r   rF   ImportError_encoding_map
startswithlendecodeZdetectr;   rG   r4   stripr3   r6   
expandtabsr5   endswithr   r9   )r=   rE   Z
unfilteredrL   rF   ZdecodedZbomr7   encrP   streamr"   rO   r%   
get_tokens   sN    	






zLexer.get_tokensc                 C   s   t dS )z
        Return an iterable of (index, tokentype, value) pairs where "index"
        is the starting position of the token within the input text.

        In subclasses, implement this method as a generator to
        maximize effectiveness.
        N)NotImplementedErrorrO   r"   r"   r%   rK      s    zLexer.get_tokens_unprocessed)F)r/   r0   r1   r2   r,   aliases	filenamesZalias_filenamesZ	mimetypesZpriorityr?   rB   r<   r)   r[   rK   r"   r"   r"   r%   r   3   s   
;c                   @   s$   e Zd ZdZefddZdd ZdS )r   a   
    This lexer takes two lexer as arguments. A root lexer and
    a language lexer. First everything is scanned using the language
    lexer, afterwards all ``Other`` tokens are lexed using the root
    lexer.

    The lexers from the ``template`` lexer package use this base lexer.
    c                 K   s0   |f || _ |f || _|| _tj| f| d S rJ   )
root_lexerlanguage_lexerneedler   r?   )r=   Z_root_lexerZ_language_lexerZ_needler:   r"   r"   r%   r?      s    zDelegatingLexer.__init__c                 C   s   d}g }g }| j |D ]H\}}}|| jkrP|rF|t||f g }||7 }q||||f q|rx|t||f t|| j|S )N )r`   rK   ra   rD   rT   do_insertionsr_   )r=   rE   Zbuffered
insertionsZ
lng_bufferirM   rN   r"   r"   r%   rK      s    


z&DelegatingLexer.get_tokens_unprocessedN)r/   r0   r1   r2   r   r?   rK   r"   r"   r"   r%   r      s   	c                   @   s   e Zd ZdZdS )r   zI
    Indicates that a state should include rules from another state.
    Nr/   r0   r1   r2   r"   r"   r"   r%   r      s   c                   @   s   e Zd ZdZdd ZdS )_inheritzC
    Indicates the a state should inherit from its superclass.
    c                 C   s   dS )Nr   r"   rA   r"   r"   r%   rB     s    z_inherit.__repr__N)r/   r0   r1   r2   rB   r"   r"   r"   r%   rg      s   rg   c                   @   s    e Zd ZdZdd Zdd ZdS )combinedz:
    Indicates a state combined from multiple states.
    c                 G   s   t | |S rJ   )tupler+   )clsargsr"   r"   r%   r+     s    zcombined.__new__c                 G   s   d S rJ   r"   )r=   rk   r"   r"   r%   r?     s    zcombined.__init__N)r/   r0   r1   r2   r+   r?   r"   r"   r"   r%   rh   	  s   rh   c                   @   sF   e Zd ZdZdd ZdddZdddZdd	d
Zdd Zdd Z	dS )_PseudoMatchz:
    A pseudo match object constructed from a string.
    c                 C   s   || _ || _d S rJ   )_text_start)r=   startrE   r"   r"   r%   r?     s    z_PseudoMatch.__init__Nc                 C   s   | j S rJ   )rn   r=   argr"   r"   r%   ro     s    z_PseudoMatch.startc                 C   s   | j t| j S rJ   )rn   rT   rm   rp   r"   r"   r%   end"  s    z_PseudoMatch.endc                 C   s   |rt d| jS )NzNo such group)
IndexErrorrm   rp   r"   r"   r%   group%  s    z_PseudoMatch.groupc                 C   s   | j fS rJ   )rm   rA   r"   r"   r%   groups*  s    z_PseudoMatch.groupsc                 C   s   i S rJ   r"   rA   r"   r"   r%   	groupdict-  s    z_PseudoMatch.groupdict)N)N)N)
r/   r0   r1   r2   r?   ro   rr   rt   ru   rv   r"   r"   r"   r%   rl     s   


rl   c                     s   d fdd	}|S )zL
    Callback that yields multiple actions for each group in the match.
    Nc                 3   s   t  D ]\}}|d krqqt|tkrR||d }|r||d ||fV  q||d }|d k	r|r|||d |_|| t||d ||D ]}|r|V  qq|r| |_d S )N   )	enumerater*   r	   rt   ro   posrl   rr   )lexermatchctxre   actiondataitemrk   r"   r%   callback5  s&     
zbygroups.<locals>.callback)Nr"   )rk   r   r"   r   r%   r   1  s    c                   @   s   e Zd ZdZdS )_ThiszX
    Special singleton used for indicating the caller class.
    Used by ``using``.
    Nrf   r"   r"   r"   r%   r   K  s   r   c                    sj   i dkr: d}t|ttfr.|d< nd|fd<  tkrTdfdd	}nd	 fdd	}|S )
a  
    Callback that processes the match with a different lexer.

    The keyword arguments are forwarded to the lexer, except `state` which
    is handled separately.

    `state` specifies the state that the new lexer will start in, and can
    be an enumerable such as ('root', 'inline', 'string') or a simple
    string which is assumed to be on top of the root state.

    Note: For that to work, `_other` must not be an `ExtendedRegexLexer`.
    statestackrootNc                 3   sj   r | j | jf }n| }| }|j| f D ]\}}}|| ||fV  q<|rf| |_d S rJ   )updater:   r@   ro   rK   rt   rr   ry   rz   r{   r|   Zlxsre   rM   rN   )	gt_kwargskwargsr"   r%   r   i  s    zusing.<locals>.callbackc                 3   s^    | j  f }| }|j| fD ]\}}}|| ||fV  q0|rZ| |_d S rJ   )r   r:   ro   rK   rt   rr   ry   r   _otherr   r   r"   r%   r   x  s    
)N)N)poprC   listri   r   )r   r   r   r   r"   r   r%   r   S  s    


c                   @   s   e Zd ZdZdd ZdS )r   z
    Indicates a state or state action (e.g. #pop) to apply.
    For example default('#pop') is equivalent to ('', Token, '#pop')
    Note that state tuples may be used as well.

    .. versionadded:: 2.0
    c                 C   s
   || _ d S rJ   )r   )r=   r   r"   r"   r%   r?     s    zdefault.__init__N)r/   r0   r1   r2   r?   r"   r"   r"   r%   r     s   c                   @   s"   e Zd ZdZdddZdd ZdS )	r   z
    Indicates a list of literal words that is transformed into an optimized
    regex that matches any of the words.

    .. versionadded:: 2.0
    rb   c                 C   s   || _ || _|| _d S rJ   )r   prefixsuffix)r=   r   r   r   r"   r"   r%   r?     s    zwords.__init__c                 C   s   t | j| j| jdS )Nr   r   )r   r   r   r   rA   r"   r"   r%   r;     s    z	words.getN)rb   rb   )r/   r0   r1   r2   r?   r;   r"   r"   r"   r%   r     s   
c                   @   sJ   e Zd ZdZdd Zdd Zdd Zdd	 ZdddZdd Z	dd Z
d
S )RegexLexerMetazw
    Metaclass for RegexLexer, creates the self._tokens attribute from
    self.tokens on the first instantiation.
    c                 C   s    t |tr| }t||jS )zBPreprocess the regular expression component of a token definition.)rC   r   r;   recompiler{   )rj   regexrflagsr   r"   r"   r%   _process_regex  s    
zRegexLexerMeta._process_regexc                 C   s&   t |tks"t|s"td|f |S )z5Preprocess the token component of a token definition.z2token type must be simple type or callable, not %r)r*   r	   callableAssertionError)rj   tokenr"   r"   r%   _process_token  s    zRegexLexerMeta._process_tokenc                 C   s  t |trd|dkrdS ||kr$|fS |dkr0|S |dd dkrRt|dd  S dsbtd| nt |trd	| j }|  jd
7  _g }|D ],}||kstd| || ||| q|||< |fS t |tr |D ] }||ks|dkstd| q|S dstd| dS )z=Preprocess the state transition action of a token definition.#pop#pushN   z#pop:Fzunknown new state %rz_tmp_%drw   zcircular state ref %r)r   r   zunknown new state zunknown new state def %r)	rC   strintr   rh   _tmpnameextend_process_stateri   )rj   	new_stateunprocessed	processedZ	tmp_stateitokensZistater"   r"   r%   _process_new_state  s>    



 z!RegexLexerMeta._process_new_statec                 C   s  t |tkstd| |d dks0td| ||kr@|| S g  }||< | j}|| D ],}t|tr||ks~td| || ||t| qZt|trqZt|t	r| 
|j||}|tdjd|f qZt |tkstd| z| |d ||}W n< tk
rB }	 ztd	|d || |	f W 5 d}	~	X Y nX | |d
 }
t|dkrfd}n| 
|d ||}|||
|f qZ|S )z%Preprocess a single state definition.zwrong state name %rr   #zinvalid state name %rzcircular state reference %rrb   Nzwrong rule def %rz+uncompilable regex %r in state %r of %r: %srw      )r*   r   r   flagsrC   r   r   r   rg   r   r   r   rD   r   r   r{   ri   r   	Exception
ValueErrorr   rT   )rj   r   r   r   tokensr   Ztdefr   rexerrr   r"   r"   r%   r     sF    



 zRegexLexerMeta._process_stateNc                 C   s<   i  }| j |< |p| j| }t|D ]}| ||| q$|S )z-Preprocess a dictionary of token definitions.)_all_tokensr   r   r   )rj   r,   	tokendefsr   r   r"   r"   r%   process_tokendef  s
    zRegexLexerMeta.process_tokendefc           
   
   C   s   i }i }| j D ]}|jdi }t|D ]\}}||}|dkr||||< z|t}W n tk
rp   Y q(Y nX |||< q(||d}|dkrq(||||d < z|t}	W n tk
r   Y q(X ||	 ||< q(q|S )a  
        Merge tokens from superclasses in MRO order, returning a single tokendef
        dictionary.

        Any state that is not defined by a subclass will be inherited
        automatically.  States that *are* defined by subclasses will, by
        default, override that state in the superclass.  If a subclass wishes to
        inherit definitions from a superclass, it can use the special value
        "inherit", which will cause the superclass' state definition to be
        included at that point in the state.
        r   Nrw   )__mro____dict__r;   r   indexr   r   r   )
rj   r   ZinheritablecZtoksr   itemsZcuritemsZinherit_ndxZnew_inh_ndxr"   r"   r%   get_tokendefs
  s0    


zRegexLexerMeta.get_tokendefsc                 O   sL   d| j kr:i | _d| _t| dr(| jr(n| d|  | _tj	| f||S )z:Instantiate cls after preprocessing its token definitions._tokensr   token_variantsrb   )
r   r   r   hasattrr   r   r   r   r*   __call__)rj   rk   kwdsr"   r"   r%   r   ;  s    
zRegexLexerMeta.__call__)N)r/   r0   r1   r2   r   r   r   r   r   r   r   r"   r"   r"   r%   r     s   #,
1r   c                   @   s$   e Zd ZdZejZi ZdddZdS )r   z
    Base for simple stateful regular expression-based lexers.
    Simplifies the lexing process so that you need only
    provide a list of states and regular expressions.
    r   c                 c   s  d}| j }t|}||d  }|D ]\}}}	|||}
|
r"|dk	rxt|tkrb|||
 fV  n|| |
D ]
}|V  ql|
 }|	dk	r"t|	tr|	D ]8}|dkr|  q|dkr|	|d  q|	| qnBt|	t
r||	d= n,|	dkr|	|d  ndstd|	 ||d  } qq"zP|| dkr^d	g}|d	 }|tdfV  |d
7 }W q|t|| fV  |d
7 }W q tk
r   Y qY qX qdS )z}
        Split ``text`` into (tokentype, text) pairs.

        ``stack`` is the inital stack (default: ``['root']``)
        r   r   Nr   r   Fwrong state def: %rrH   r   rw   )r   r   r*   r	   rt   rr   rC   ri   r   rD   r   r   r   r   rs   )r=   rE   r   ry   r   Z
statestackstatetokensrexmatchr}   r   mr   r   r"   r"   r%   rK   h  sN    





z!RegexLexer.get_tokens_unprocessedN)r   )	r/   r0   r1   r2   r   	MULTILINEr   r   rK   r"   r"   r"   r%   r   I  s   c                   @   s"   e Zd ZdZdddZdd ZdS )r   z9
    A helper object that holds lexer position data.
    Nc                 C   s*   || _ || _|pt|| _|p"dg| _d S )Nr   )rE   ry   rT   rr   r   )r=   rE   ry   r   rr   r"   r"   r%   r?     s    zLexerContext.__init__c                 C   s   d| j | j| jf S )NzLexerContext(%r, %r, %r))rE   ry   r   rA   r"   r"   r%   rB     s
      zLexerContext.__repr__)NN)r/   r0   r1   r2   r?   rB   r"   r"   r"   r%   r     s   
c                   @   s   e Zd ZdZdddZdS )r   zE
    A RegexLexer that uses a context object to store its state.
    Nc                 c   s  | j }|st|d}|d }n|}||jd  }|j}|D ]6\}}}|||j|j}	|	r:|dk	rt|tkr|j||	 fV  |	 |_n*|| |	|D ]
}
|
V  q|s||jd  }|dk	rnt	|t
r|D ]B}|dkr|j  q|dkr|j|jd  q|j| qnJt	|tr0|j|d= n0|dkrN|j|jd  nds`td| ||jd  } q6q:zz|j|jkrW q||j d	krdg|_|d }|jtd	fV  | jd
7  _W q6|jt||j fV  | jd
7  _W q6 tk
r
   Y qY q6X q6dS )z
        Split ``text`` into (tokentype, text) pairs.
        If ``context`` is given, use this lexer context instead.
        r   r   r   Nr   r   Fr   rH   rw   )r   r   r   rE   ry   rr   r*   r	   rt   rC   ri   r   rD   r   r   r   r   rs   )r=   rE   contextr   r|   r   r   r}   r   r   r   r   r"   r"   r%   rK     s\    




z)ExtendedRegexLexer.get_tokens_unprocessed)NN)r/   r0   r1   r2   rK   r"   r"   r"   r%   r     s   c              	   c   s  t | } zt| \}}W n& tk
r>   |D ]
}|V  q,Y dS X d}d}|D ]\}}}	|dkrb|}d}
|r
|t|	 |kr
|	|
||  }|||fV  |t|7 }|D ]"\}}}|||fV  |t|7 }q|| }
zt| \}}W qf tk
r   d}Y q
Y qfX qf|||	|
d fV  |t|	|
 7 }qL|r|p>d}|D ]$\}}}	|||	fV  |t|	7 }qDzt| \}}W n  tk
r   d}Y qY nX q0dS )ag  
    Helper for lexers which must combine the results of several
    sublexers.

    ``insertions`` is a list of ``(index, itokens)`` pairs.
    Each ``itokens`` iterable should be inserted at position
    ``index`` into the token stream given by the ``tokens``
    argument.

    The result is a combined token stream.

    TODO: clean up the code here.
    NTr   F)iternextStopIterationrT   )rd   r   r   r   r   ZrealposZinsleftre   rM   rN   ZoldiZtmpvalZit_indexZit_tokenZit_valuepr"   r"   r%   rc     sL    
rc   c                   @   s   e Zd ZdZdd ZdS )ProfilingRegexLexerMetaz>Metaclass for ProfilingRegexLexer, collects regex timing info.c                    sL   t |tr t|j|j|jdn|t|tjf fdd	}|S )Nr   c                    s`    j d fddg}t }| ||}t }|d  d7  < |d  || 7  < |S )Nr   r   r!   rw   )
_prof_data
setdefaulttimer{   )rE   ry   endposinfoZt0rest1rj   Zcompiledr   r   r"   r%   
match_func@  s    z:ProfilingRegexLexerMeta._process_regex.<locals>.match_func)	rC   r   r   r   r   r   r   sysmaxsize)rj   r   r   r   r   r"   r   r%   r   8  s    

z&ProfilingRegexLexerMeta._process_regexN)r/   r0   r1   r2   r   r"   r"   r"   r%   r   5  s   r   c                   @   s"   e Zd ZdZg ZdZdddZdS )ProfilingRegexLexerzFDrop-in replacement for RegexLexer that does profiling of its regexes.   r   c                 #   s    j ji  t ||D ]
}|V  q j j }tdd | D  fdddd}tdd |D }t	  t	d j j
t||f  t	d	 t	d
d  t	d |D ]}t	d|  qt	d	 d S )Nc                 s   sN   | ]F\\}}\}}|t |d dddd |d| d| | fV  qdS )zu'z\\\NA   i  )reprrV   rG   ).0r   rnrM   r"   r"   r%   	<genexpr>X  s     
z=ProfilingRegexLexer.get_tokens_unprocessed.<locals>.<genexpr>c                    s
   |  j  S rJ   )_prof_sort_indexr#   rA   r"   r%   r&   [  r'   z<ProfilingRegexLexer.get_tokens_unprocessed.<locals>.<lambda>T)keyreversec                 s   s   | ]}|d  V  qdS )   Nr"   )r   r$   r"   r"   r%   r   ]  s     z2Profiling result for %s lexing %d chars in %.3f mszn==============================================================================================================z$%-20s %-64s ncalls  tottime  percall)r   r   zn--------------------------------------------------------------------------------------------------------------z%-20s %-65s %5d %8.4f %8.4f)r@   r   rD   r   rK   r   sortedr   sumprintr/   rT   )r=   rE   r   tokZrawdatar~   Z	sum_totalr.   r"   rA   r%   rK   R  s*    
z*ProfilingRegexLexer.get_tokens_unprocessedN)r   )r/   r0   r1   r2   r   r   rK   r"   r"   r"   r%   r   K  s   r   )9r2   Z
__future__r   r   r   r   Zpygments.filterr   r   Zpygments.filtersr   Zpygments.tokenr   r   r   r	   Zpygments.utilr
   r   r   r   r   r   r   r   r   Zpygments.regexoptr   __all__rR   staticmethodZ_default_analyser*   r(   objectr   r   r   r   rg   r   ri   rh   rl   r   r   r   r   r   r   r   r   r   r   rc   r   r   r"   r"   r"   r%   <module>   sh   
,       '2 )WE?