U
    pdGh                     @   s$  d Z ddlZddlZddlT ejeks.tdeehZe	e
ehZeehZeehZeeehB ZdZdd eD Zejfdd	Zd
d Zdd Zd-ddZejd Zde> d ZdZ ee!fddZ"dd Z#dd Z$dd Z%dd Z&dd Z'dd  Z(d!d" Z)d#d$ Z*d%d& Z+d'd( Z,d)d* Z-d.d+d,Z.dS )/zInternal support module for sre    N)*zSRE module mismatch))i   i1  )s   i  )   i  )iE  i  i  )i  i  )i  i  )i  i  )i  i  )i  i  )i  i  )i  i  )i  i  )i  i  )i  i  )ia  i  )i  i  c                    s.   i | ]&}|D ]  t  fd d|D qqS )c                 3   s   | ]} |kr|V  qd S N ).0jir   !/usr/lib/python3.8/sre_compile.py	<genexpr>>   s      z<dictcomp>.<genexpr>)tuple)r   tr   r
   r   
<dictcomp>>   s
      r   c                 C   s    ||@ r| | M } | |B | @ S r   r   )flags	add_flags	del_flags
TYPE_FLAGSr   r   r   _combine_flagsA   s    
r   c                 C   s  | j }t}t}t}t}t}d }	d }
d }|t@ r\|t@ s\|t@ rPt	j
}	t	j}
t}nt	j}	t	j}
|D ]|\}}||krr|t@ s|| || n|t@ r|t|  || n|	|s|| || n|
|}|s|t|  || n||kr|t|  || nh|t || }|d |tkr2|t |f||  D ]}|t || q@|t || | | |< q`|tkrt||	|
|\}}|t@ r|t@ r|t n(|s|t n|s|t n|t || }|d t|||  || | | |< q`|tkr*|t@ r |t n|t q`||kr6|t@ rLt d|f t!|d r|t"krn|t# n|t$ || }|d ||d  ||d  t%| |d | |t& || | | |< nl|t' || }|d ||d  ||d  t%| |d | || | | |< |t"kr,|t( n|t) q`|t*kr|\}}}}|rj|t+ ||d d  t%| |t,||| |r|t+ ||d d d  q`||kr|| q`||krD|| || }|d |d dkr|d n*|d - \}}||krt d|| t%| |d | |t& || | | |< q`|t.kr|| || }|d t%| || |t& || | | |< q`|t/kr|| |t0@ rt12||}|t@ rt32||}n|t@ rt42||}|| q`|t5kr|| g }|j }|d D ]N}|| }|d t%| || |t6 |||  |d || | | |< q|t |D ]}|| | | |< qlq`|t7kr|| |t@ rt8| }n|t@ rt9| }|| q`|t:kr |t@ s|| n,|t@ r|t; n|s
|t< n|t= ||d  q`|t>kr|| ||d d  || }|d t%| |d | |d r|t6 || }|d || | d | |< t%| |d | || | | |< n|| | d | |< q`t d|f q`d S )Nr   z*internal: unsupported template operator %r      z(look-behind requires fixed-width patternz%internal: unsupported operand type %r)?appendlen_LITERAL_CODES_REPEATING_CODES_SUCCESS_CODES_ASSERT_CODESSRE_FLAG_IGNORECASESRE_FLAG_LOCALESRE_FLAG_UNICODE_sreunicode_iscasedunicode_tolower_ignorecase_fixesascii_iscasedascii_tolowerOP_LOCALE_IGNORE	OP_IGNOREOP_UNICODE_IGNOREIN_UNI_IGNORENOT_LITERALNEGATELITERALFAILUREIN_optimize_charsetIN_LOC_IGNORE	IN_IGNORE_compile_charsetANYSRE_FLAG_DOTALLANY_ALLSRE_FLAG_TEMPLATEerror_simple
MAX_REPEAT
REPEAT_ONEMIN_REPEAT_ONE_compileSUCCESSREPEAT	MAX_UNTIL	MIN_UNTIL
SUBPATTERNMARKr   getwidthCALLATSRE_FLAG_MULTILINEAT_MULTILINEget	AT_LOCALE
AT_UNICODEBRANCHJUMPCATEGORY	CH_LOCALE
CH_UNICODEGROUPREFGROUPREF_LOC_IGNOREGROUPREF_IGNOREGROUPREF_UNI_IGNOREGROUPREF_EXISTS)codepatternr   emit_lenLITERAL_CODESREPEATING_CODESSUCCESS_CODESASSERT_CODESiscasedtolowerfixesopavloskipkcharsethascasedgroupr   r   phitail
tailappendskipyesskipnor   r   r   r=   G   sV   






 




 







  






 


 





  











 
 r=   c                 C   s   |j }| D ]\}}|| |tkr$q
|tkr6|| q
|tksF|tkr`||d  ||d  q
|tkrt|| q
|tkr|| q
|tkr|t	@ r|t
|  q|t@ r|t|  q|| q
td|f q
|t d S )Nr   r   z%internal: unsupported set operator %r)r   r,   r-   RANGERANGE_UNI_IGNORECHARSETextend
BIGCHARSETrN   r   rO   r    rP   r8   r.   )rf   r   rV   rX   ra   rb   r   r   r   r3      s,    

r3   c              	   C   s  g }g }t d}d}| D ]\}}	z,|tkr|rv||	}
d||
< |rd|
|krd||
 D ]}d||< qV|s~||	r~d}nd||	< n|tkr&t|	d |	d d }|r|rt||D ]*}d||< ||kr|| D ]}d||< qqnt||D ]}d||< q|s$tt||}n|D ]}d||< qn(|tkr@|||	f n|||	f W nZ tk
r   t	|dkr|dd 7 }Y q"|rd}|tkrt
}|||	f Y nX qq"qg }d}|d|}|dk rԐq(t	|dkrd }q(|d|}|dk r||t	|f q(|||f q|d k	r|D ]>\}}|| dkr\|t|f n|t||d ff q6||7 }|st	|t	| k r||fS | |fS t	|dkrt|}|t|f ||7 }||fS t|}i }t d}d}t  }tdd	dD ]V}|||d  }||kr4|| ||d < n$| ||d < ||< |d7 }||7 }qt|}|gt| |dd< |t|f ||7 }||fS )
N   Fr   Tr       i   r   i   )	bytearrayr-   ro   rangemapanyr,   r   
IndexErrorr   rp   find
_mk_bitmaprq   bytes_bytes_to_codesrs   )rf   r^   fixupr`   outrk   charmaprg   ra   rb   rc   re   rr   runsqri   datacompsmappingblockchunkr   r   r   r0     s    









r0      r   s   0111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111111c                    s8   |  td d d  fddttd  D S )Nc                    s"   g | ]}|  | d qS )r   r   )r   r   	_CODEBITS_intsr   r   
<listcomp>  s   z_mk_bitmap.<locals>.<listcomp>r   )	translate_BITS_TRANSrw   r   )bitsr   r   r   r   r   r|     s    r|   c                 C   s@   t | d}|jtjkstt||j t| ks8t| S )NI)
memoryviewcastitemsizer!   CODESIZEAssertionErrorr   tolist)bar   r   r   r~     s    r~   c                 C   sD   t | dkrdS | d \}}|tkr<|d d ko:t|d S |tkS )Nr   Fr   r   )r   rB   r9   _UNIT_CODES)ri   ra   rb   r   r   r   r9     s    r9   c                 C   sn   dgt |  }tdt | D ]L}||d  }| | | | kr\|dkrNd||< q||d  }q,|d ||< q|S )aj  
    Generate an overlap table for the following prefix.
    An overlap table is a table of the same size as the prefix which
    informs about the potential self-overlap for each index in the prefix:
    - if overlap[i] == 0, prefix[i:] can't overlap prefix[0:...]
    - if overlap[i] == k with 0 < k <= i, prefix[i-k+1:i+1] overlaps with
      prefix[0:k]
    r   r   )r   rw   )prefixtabler   idxr   r   r   _generate_overlap_table  s    	r   c                 C   s$   | t @ sd S | t@ rtjS tjS d S r   )r   r    r!   r"   r%   )r   r   r   r   _get_iscased  s
    r   c                 C   s   g }|j }d }t|}| jD ]\}}|tkrF|r<||r< q|| q|tkr|\}}	}
}t||	|
}|t@ rz|t@ rz qt||\}}}|d kr|d k	rt	|}n|d k	rt	|| }|
| |s qq qq||dfS ||dfS )NTF)r   r   r   r-   rB   r   r   r   _get_literal_prefixr   rr   )rW   r   r   prefixappendprefix_skipr^   ra   rb   rh   r   r   ri   flags1prefix1prefix_skip1got_allr   r   r   r     s4    



r   c                 C   sd  | j s
d S | j d \}}|tk	r"qP|\}}}} t|||}|t@ r |t@ r d S q t|}|tkrz|rp||rpd S ||fgS |tkrg }|j}	|d D ]B}
|
s d S |
d \}}|tkr|r||s|	||f q d S q|S |t	kr`|}|r\|D ]f\}}|tkr||rZ d S q|t
kr|d dkr4 d S tt|t|d |d d r d S q|S d S )Nr   r   i  )r   rB   r   r   r   r   r-   rL   r   r/   ro   ry   rx   rw   )rW   r   ra   rb   rh   r   r   r^   rf   charsetappendri   r   r   r   _get_charset_prefix  sN    



 r   c                 C   s|  |  \}}|tkrt}|dkr8| tdd||g d S g }d}g }|t@ rT|t@ srt||\}}}|srt||}| j}	|	t t	| }
|	d d}|rt
}|d kr|r|tB }n|r|tB }|	| |tk r|	| n|	t |d t }|	t|t |r@|	t	| |d krt	|}|	| | | | t| n(|rht|\}}|r\tt|||  t	| |
 | |
< d S )Nr      )rD   MAXCODErr   INFOr   r   r   r   r   r   SRE_INFO_PREFIXSRE_INFO_LITERALSRE_INFO_CHARSETminr   r0   r   r3   )rV   rW   r   rc   rj   r   r   rf   r   rX   rd   maskrg   r   r   r   _compile_info  sT    
 




r   c                 C   s   t | ttfS r   )
isinstancestrr}   )objr   r   r   isstringS  s    r   c                 C   s8   | j j|B }g }t|| | t|| j| |t |S r   )stater   r   r=   r   r   r>   )ri   r   rV   r   r   r   _codeV  s    
r   c                 C   s   dd dd | D  S )N[%s], c                 s   s$   | ]}d t jd d |f V  qdS )z%#0*xr   N)r!   r   r   xr   r   r   r   f  s     z_hex_code.<locals>.<genexpr>)joinrV   r   r   r   	_hex_codee  s    r   c                    sN   dd l t dttt d  fdddt  d S )Nr   r   c              	      s  d d fdd
}fdd}d7  }||k r| | }|d7 }t | }|tttttttfkrx|| q2|tt	t
tttttfkr| }|d7 }||d|t|f  q2|tkr| }|d7 }tt| }|d d d	kst|||dd   q2|tkrV| }|d7 }tt| }|d d
 dksBt|||d
d   q2|ttttfkr| }||||| d |d ||  ||7 }q2|ttfkr||d  \}}	|d7 }||d||	t|t|	f  q2|tkr||t||dt    |dt 7 }q2|t krʈ| }|d7 }t!d"fdd||dt#j$   D }
||||
 |dt#j$ 7 }d7 t%|D ].}|t||dt    |dt 7 }qd8 q2|t&t't(t)t*fkr| }|d7 }||| q2|t+kr(| }||||| d |d7 }q2|t,kr| }||||| d |r|d ||  ||7 }| | }|r|d||| d n|t qL|d7 }q2|t-t.t/fkr||d  \}}}|t0krd}||||||| d |d ||  ||7 }q2|t1krJ||d  \}}|||||| d |d7 }q2|t2t3fkr||d  \}}|||||| d |d ||  ||7 }q2|t4krĈ||d  \}}}}|t0krd}|||t5||||| d |d  |t6@ r|d |d  \}}|d| |d    |  }|ddd"dd |D  dd"t7t|   |7  |d  |    |7  |t8@ rd7 |d  ||  d8 ||7 }q2t9|q2d8 d S )N)toc                    sX   | d k	r"  |  |d| f f7 }td kr6dndf dd  d t|  d S )Nz(to %d)z%*d%s :.z  r   end)addprint)r   args)labelsleveloffset_widthstartr   r   print_p  s    

z!dis.<locals>.dis_.<locals>.print_c                     s"   t dd    d t |   d S )N r   r   )r   )r   )r   r   r   r   print_2x  s    z"dis.<locals>.dis_.<locals>.print_2r   z
%#02x (%r)   AT_	   	CATEGORY_r   z%#02x %#02x (%r-%r)rt       c                 3   s   | ]}| tj jV  qd S r   )to_bytesr!   r   	byteorderr   )sysr   r   r     s   z$dis.<locals>.dis_.<locals>.<genexpr>branch	MAXREPEATr      z  prefix_skipz  prefixr   r   c                 s   s   | ]}d | V  qdS )z%#02xNr   r   r   r   r   r     s     z(%r) z	  overlapin):OPCODESr>   r.   r4   r6   r@   rA   r,   r-   r+   LITERAL_IGNORENOT_LITERAL_IGNORELITERAL_UNI_IGNORENOT_LITERAL_UNI_IGNORELITERAL_LOC_IGNORENOT_LITERAL_LOC_IGNOREchrrF   r   ATCODESr   rN   CHCODESr/   r2   r*   r1   ro   rp   rq   r   r   rs   listr   r!   r   rw   rC   rQ   rS   rT   rR   rM   rL   r?   r;   r<   r   rU   ASSERT
ASSERT_NOTr   binr   rx   r   
ValueError)r   r   r   r   r   ra   argrd   rc   rj   r   r	   r   maxr   
prefix_lenr   r   rV   dis_r   r   r   r   )r   r   r   o  s    

  
   


 




















zdis.<locals>.dis_)r   setr   r   r   r   r   r   dish  s     r   c              	   C   s   t | r| }t| |} nd }t| |}|t@ r>t  t| | jj}d g| jj	 }|
 D ]\}}|||< q\t||| jjB || jj	d |t|S )Nr   )r   	sre_parseparser   SRE_FLAG_DEBUGr   r   r   	groupdictgroupsitemsr!   compiler   r   )ri   r   rW   rV   
groupindex
indexgroupre   r   r   r   r   r     s(    

 
 
 r   )NNN)r   )/__doc__r!   r   sre_constantsMAGICr   r-   r+   r   r?   
MIN_REPEATr:   r   r>   r.   r   r   r   r   r4   r/   r   _equivalencesr$   r   r   r=   r3   r0   r   r   r   r   intr|   r~   r9   r   r   r   r   r   r   r   r   r   r   r   r   r   r   <module>   sJ   
$
 3
 
	,; 