Your IP : 13.58.82.214


Current Path : /lib64/python3.6/html/__pycache__/
Upload File :
Current File : //lib64/python3.6/html/__pycache__/parser.cpython-36.opt-2.pyc

3


 \AE�@s�ddlZddlZddlZddlmZdgZejd�Zejd�Zejd�Z	ejd�Z
ejd�Zejd	�Zejd
�Z
ejd�Zejd�Zejd
ej�Zejd	�Zejd�ZGdd�dej�ZdS)�N)�unescape�
HTMLParserz[&<]z
&[a-zA-Z#]z%&([a-zA-Z][-.a-zA-Z0-9]*)[^a-zA-Z0-9]z)&#(?:[0-9]+|[xX][0-9a-fA-F]+)[^0-9a-fA-F]z	<[a-zA-Z]�>z--\s*>z+([a-zA-Z][^\t\n\r\f />\x00]*)(?:\s|/(?!>))*z]((?<=[\'"\s/])[^\s/>][^\s/=>]*)(\s*=+\s*(\'[^\']*\'|"[^"]*"|(?![\'"])[^>\s]*))?(?:\s|/(?!>))*aF
  <[a-zA-Z][^\t\n\r\f />\x00]*       # tag name
  (?:[\s/]*                          # optional whitespace before attribute name
    (?:(?<=['"\s/])[^\s/>][^\s/=>]*  # attribute name
      (?:\s*=+\s*                    # value indicator
        (?:'[^']*'                   # LITA-enclosed value
          |"[^"]*"                   # LIT-enclosed value
          |(?!['"])[^>\s]*           # bare value
         )
         (?:\s*,)*                   # possibly followed by a comma
       )?(?:\s|/(?!>))*
     )*
   )?
  \s*                                # trailing whitespace
z#</\s*([a-zA-Z][-.a-zA-Z0-9:_]*)\s*>c@s�eZdZd9Zdd�dd�Zdd�Zd	d
�Zdd�Zd
Zdd�Z	dd�Z
dd�Zdd�Zdd�Z
d:dd�Zdd�Zdd�Zdd �Zd!d"�Zd#d$�Zd%d&�Zd'd(�Zd)d*�Zd+d,�Zd-d.�Zd/d0�Zd1d2�Zd3d4�Zd5d6�Zd7d8�Zd
S);r�script�styleT)�convert_charrefscCs||_|j�dS)N)r�reset)�selfr�r
�#/usr/lib64/python3.6/html/parser.py�__init__WszHTMLParser.__init__cCs(d|_d|_t|_d|_tjj|�dS)N�z???)�rawdata�lasttag�interesting_normal�interesting�
cdata_elem�_markupbase�
ParserBaser)r	r
r
rr`s
zHTMLParser.resetcCs|j||_|jd�dS)Nr)r�goahead)r	�datar
r
r�feedhszHTMLParser.feedcCs|jd�dS)N�)r)r	r
r
r�closeqszHTMLParser.closeNcCs|jS)N)�_HTMLParser__starttag_text)r	r
r
r�get_starttag_textwszHTMLParser.get_starttag_textcCs$|j�|_tjd|jtj�|_dS)Nz</\s*%s\s*>)�lowerr�re�compile�Ir)r	�elemr
r
r�set_cdata_mode{s
zHTMLParser.set_cdata_modecCst|_d|_dS)N)rrr)r	r
r
r�clear_cdata_modeszHTMLParser.clear_cdata_modecCsL|j}d}t|�}�x�||k�r�|jr||jr||jd|�}|dkr�|jdt||d��}|dkrvtjd�j	||�rvP|}n(|j
j	||�}|r�|j�}n|jr�P|}||kr�|jr�|jr�|jt
|||���n|j|||��|j||�}||kr�P|j}|d|��rLtj||��r&|j|�}	n�|d|��r>|j|�}	nl|d|��rV|j|�}	nT|d|��rn|j|�}	n<|d	|��r�|j|�}	n$|d
|k�r�|jd�|d
}	nP|	dk�r>|�s�P|jd|d
�}	|	dk�r�|jd|d
�}	|	dk�r|d
}	n|	d
7}	|j�r,|j�r,|jt
|||	���n|j|||	��|j||	�}q|d|��r�tj||�}|�r�|j�d
d�}
|j|
�|j�}	|d|	d
��s�|	d
}	|j||	�}qn:d||d�k�r�|j|||d
��|j||d
�}Pq|d|�rtj||�}|�rN|jd
�}
|j|
�|j�}	|d|	d
��s@|	d
}	|j||	�}qtj||�}|�r�|�r�|j�||d�k�r�|j�}	|	|k�r�|}	|j||d
�}Pn,|d
|k�r�|jd�|j||d
�}nPqqW|�r:||k�r:|j�r:|j�r|j�r|jt
|||���n|j|||��|j||�}||d�|_dS)Nr�<�&�"z[\s;]z</z<!--z<?z<!rrz&#��;���)r�lenrr�find�rfind�maxrr�searchr�start�handle_datarZ	updatepos�
startswith�starttagopen�match�parse_starttag�parse_endtag�
parse_comment�parse_pi�parse_html_declaration�charref�group�handle_charref�end�	entityref�handle_entityref�
incomplete)r	r;r�i�n�jZampposr2r0�k�namer
r
rr�s�












zHTMLParser.goaheadcCs�|j}|||d�dkr$|j|�S|||d�dkrB|j|�S|||d�j�dkr�|jd|d�}|d
krvdS|j||d	|��|dS|j|�SdS)N�z<!--�z<![�	z	<!doctyperrr&r(r()rr5Zparse_marked_sectionrr*�handle_decl�parse_bogus_comment)r	r?r�gtposr
r
rr7s

z!HTMLParser.parse_html_declarationrcCsD|j}|jd|d�}|dkr"dS|r<|j||d|��|dS)Nrr&rr(r()rr*�handle_comment)r	r?Zreportr�posr
r
rrHszHTMLParser.parse_bogus_commentcCsH|j}tj||d�}|sdS|j�}|j||d|��|j�}|S)Nr&rr()r�picloser-r.�	handle_pir;)r	r?rr2rAr
r
rr6!szHTMLParser.parse_picCs�d|_|j|�}|dkr|S|j}|||�|_g}tj||d�}|j�}|jd�j�|_}x�||k�r$t	j||�}|s~P|jddd�\}	}
}|
s�d}n^|dd�dko�|d
d�kns�|dd�dko�|dd�kn�r�|dd�}|�rt
|�}|j|	j�|f�|j�}qbW|||�j�}|d
k�r�|j
�\}
}d	|jk�r�|
|jjd	�}
t|j�|jjd	�}n|t|j�}|j|||��|S|jd��r�|j||�n"|j||�||jk�r�|j|�|S)Nrrr&rE�'�"r�/>�
r(r(r()rrP)r�check_for_whole_start_tagr�tagfind_tolerantr2r;r9rr�attrfind_tolerantr�append�stripZgetpos�countr)r+r/�endswith�handle_startendtag�handle_starttag�CDATA_CONTENT_ELEMENTSr!)r	r?�endposr�attrsr2rB�tag�mZattrname�restZ	attrvaluer;�lineno�offsetr
r
rr3-sP
(*

zHTMLParser.parse_starttagcCs�|j}tj||�}|r�|j�}|||d�}|dkr>|dS|dkr~|jd|�rZ|dS|jd|�rjd	S||krv|S|dS|dkr�d
S|dkr�dS||kr�|S|dStd��dS)Nrr�/z/>r&r
z6abcdefghijklmnopqrstuvwxyz=/ABCDEFGHIJKLMNOPQRSTUVWXYZzwe should not get here!r(r(r()r�locatestarttagend_tolerantr2r;r0�AssertionError)r	r?rr_rA�nextr
r
rrR`s.z$HTMLParser.check_for_whole_start_tagcCs|j}tj||d�}|sdS|j�}tj||�}|s�|jdk	rV|j|||��|Stj||d�}|s�|||d�dkr�|dS|j	|�S|j
d�j�}|jd|j��}|j
|�|dS|j
d�j�}|jdk	�r�||jk�r�|j|||��|S|j
|j��|j�|S)Nrr&rEz</>rr()r�	endendtagr-r;�
endtagfindr2rr/rSrHr9rr*�
handle_endtagr")r	r?rr2rIZ	namematchZtagnamer r
r
rr4�s6


zHTMLParser.parse_endtagcCs|j||�|j|�dS)N)rZri)r	r^r]r
r
rrY�szHTMLParser.handle_startendtagcCsdS)Nr
)r	r^r]r
r
rrZ�szHTMLParser.handle_starttagcCsdS)Nr
)r	r^r
r
rri�szHTMLParser.handle_endtagcCsdS)Nr
)r	rCr
r
rr:�szHTMLParser.handle_charrefcCsdS)Nr
)r	rCr
r
rr=�szHTMLParser.handle_entityrefcCsdS)Nr
)r	rr
r
rr/�szHTMLParser.handle_datacCsdS)Nr
)r	rr
r
rrJ�szHTMLParser.handle_commentcCsdS)Nr
)r	Zdeclr
r
rrG�szHTMLParser.handle_declcCsdS)Nr
)r	rr
r
rrM�szHTMLParser.handle_picCsdS)Nr
)r	rr
r
r�unknown_decl�szHTMLParser.unknown_declcCstjdtdd�t|�S)NzZThe unescape method is deprecated and will be removed in 3.5, use html.unescape() instead.r&)�
stacklevel)�warnings�warn�DeprecationWarningr)r	�sr
r
rr�s
zHTMLParser.unescape)rr)r)�__name__�
__module__�__qualname__r[rrrrrrr!r"rr7rHr6r3rRr4rYrZrir:r=r/rJrGrMrjrr
r
r
rr?s6		z
3"()rrlrZhtmlr�__all__rrr>r<r8r1rLZcommentcloserSrT�VERBOSErdrgrhrrr
r
r
r�<module>s&