Your IP : 18.224.44.249


Current Path : /lib64/python2.7/
Upload File :
Current File : //lib64/python2.7/HTMLParser.pyc

�
�mec@sdZddlZddlZejd�Zejd�Zejd�Zejd�Zejd�Zejd�Z	ejd	�Z
ejd
�Zejd�Zejd�Z
ejd
ej�Zejd�Zejd�Zdefd��YZdejfd��YZdS(sA parser for HTML and XHTML.i����Ns[&<]s
&[a-zA-Z#]s%&([a-zA-Z][-.a-zA-Z0-9]*)[^a-zA-Z0-9]s)&#(?:[0-9]+|[xX][0-9a-fA-F]+)[^0-9a-fA-F]s	<[a-zA-Z]t>s--\s*>s(([a-zA-Z][-.a-zA-Z0-9:_]*)(?:\s|/(?!>))*s[a-zA-Z][^	

 />]*s]((?<=[\'"\s/])[^\s/>][^\s/=>]*)(\s*=+\s*(\'[^\']*\'|"[^"]*"|(?![\'"])[^>\s]*))?(?:\s|/(?!>))*s
  <[a-zA-Z][-.a-zA-Z0-9:_]*          # tag name
  (?:[\s/]*                          # optional whitespace before attribute name
    (?:(?<=['"\s/])[^\s/>][^\s/=>]*  # attribute name
      (?:\s*=+\s*                    # value indicator
        (?:'[^']*'                   # LITA-enclosed value
          |"[^"]*"                   # LIT-enclosed value
          |(?!['"])[^>\s]*           # bare value
         )
       )?(?:\s|/(?!>))*
     )*
   )?
  \s*                                # trailing whitespace
s#</\s*([a-zA-Z][-.a-zA-Z0-9:_]*)\s*>tHTMLParseErrorcBs#eZdZdd�Zd�ZRS(s&Exception raised for all parse errors.cCs3|st�||_|d|_|d|_dS(Nii(tAssertionErrortmsgtlinenotoffset(tselfRtposition((s"/usr/lib64/python2.7/HTMLParser.pyt__init__9s	
cCsW|j}|jdk	r,|d|j}n|jdk	rS|d|jd}n|S(Ns, at line %ds, column %di(RRtNoneR(Rtresult((s"/usr/lib64/python2.7/HTMLParser.pyt__str__?s	N(NN(t__name__t
__module__t__doc__R	RR(((s"/usr/lib64/python2.7/HTMLParser.pyR6st
HTMLParsercBs
eZdZdZd�Zd�Zd�Zd�Zd�ZdZ
d�Zd	�Zd
�Z
d�Zd�Zd
d�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�Zd�ZdZd�Z RS( s�Find tags and other markup and call handler functions.

    Usage:
        p = HTMLParser()
        p.feed(data)
        ...
        p.close()

    Start tags are handled by calling self.handle_starttag() or
    self.handle_startendtag(); end tags by self.handle_endtag().  The
    data between tags is passed from the parser to the derived class
    by calling self.handle_data() with the data as argument (the data
    may be split up in arbitrary chunks).  Entity references are
    passed by calling self.handle_entityref() with the entity
    reference as the argument.  Numeric character references are
    passed to self.handle_charref() with the string containing the
    reference as the argument.
    tscripttstylecCs|j�dS(s#Initialize and reset this instance.N(treset(R((s"/usr/lib64/python2.7/HTMLParser.pyR_scCs8d|_d|_t|_d|_tjj|�dS(s1Reset this instance.  Loses all unprocessed data.ts???N(	trawdatatlasttagtinteresting_normaltinterestingR	t
cdata_elemt
markupbaset
ParserBaseR(R((s"/usr/lib64/python2.7/HTMLParser.pyRcs
				cCs!|j||_|jd�dS(s�Feed data to the parser.

        Call this as often as you want, with as little or as much text
        as you want (may include '\n').
        iN(Rtgoahead(Rtdata((s"/usr/lib64/python2.7/HTMLParser.pytfeedkscCs|jd�dS(sHandle any buffered data.iN(R(R((s"/usr/lib64/python2.7/HTMLParser.pytclosetscCst||j���dS(N(Rtgetpos(Rtmessage((s"/usr/lib64/python2.7/HTMLParser.pyterrorxscCs|jS(s)Return full source of start tag: '<...>'.(t_HTMLParser__starttag_text(R((s"/usr/lib64/python2.7/HTMLParser.pytget_starttag_text}scCs2|j�|_tjd|jtj�|_dS(Ns</\s*%s\s*>(tlowerRtretcompiletIR(Rtelem((s"/usr/lib64/python2.7/HTMLParser.pytset_cdata_mode�scCst|_d|_dS(N(RRR	R(R((s"/usr/lib64/python2.7/HTMLParser.pytclear_cdata_mode�s	c
Cst|j}d}t|�}x||kr|jj||�}|rT|j�}n|jraPn|}||kr�|j|||!�n|j||�}||kr�Pn|j}|d|�r7t	j
||�r�|j|�}n�|d|�r	|j|�}n�|d|�r*|j
|�}nm|d|�rK|j|�}nL|d|�rl|j|�}n+|d|kr�|jd�|d}nP|dkr"|s�Pn|jd|d�}|dkr|jd|d�}|dkr|d}qn
|d7}|j|||!�n|j||�}q|d	|�r�tj
||�}|r�|j�d
d!}	|j|	�|j�}|d|d�s�|d}n|j||�}qqd||kr�|j|dd
!�|j|d
�}nPq|d
|�rtj
||�}|r�|jd�}	|j|	�|j�}|d|d�sn|d}n|j||�}qntj
||�}|r�|r�|j�||kr�|jd�nPq|d|kr|jd
�|j||d�}qPqdstd��qW|rc||krc|jrc|j|||!�|j||�}n|||_dS(Nit<s</s<!--s<?s<!iRs&#ii����t;t&s#EOF in middle of entity or char refsinteresting.search() lied(RtlenRtsearchtstartRthandle_datat	updatepost
startswithtstarttagopentmatchtparse_starttagtparse_endtagt
parse_commenttparse_pitparse_html_declarationtfindtcharreftgroupthandle_charreftendt	entityrefthandle_entityreft
incompleteR!R(
RR?RtitnR5tjR3tktname((s"/usr/lib64/python2.7/HTMLParser.pyR�s�			







cCs�|j}|||d!dkr0|jd�n|||d!dkrT|j|�S|||d!dkrx|j|�S|||d!j�d	kr�|jd
|d�}|dkr�dS|j||d|!�|dS|j|�SdS(
Nis<!s+unexpected call to parse_html_declaration()is<!--is<![i	s	<!doctypeRi����i(RR!R8tparse_marked_sectionR$R;thandle_decltparse_bogus_comment(RRCRtgtpos((s"/usr/lib64/python2.7/HTMLParser.pyR:�s	

icCs|j}|||d!dkr0|jd�n|jd|d�}|dkrVdS|rw|j||d|!�n|dS(	Nis<!s</s"unexpected call to parse_comment()Ri����i(s<!s</(RR!R;thandle_comment(RRCtreportRtpos((s"/usr/lib64/python2.7/HTMLParser.pyRJ�s	cCs�|j}|||d!dks,td��tj||d�}|sLdS|j�}|j||d|!�|j�}|S(Nis<?sunexpected call to parse_pi()i����(RRtpicloseR/R0t	handle_piR?(RRCRR5RE((s"/usr/lib64/python2.7/HTMLParser.pyR9s	#cCs�d|_|j|�}|dkr(|S|j}|||!|_g}tj||d�}|sotd��|j�}|jd�j	�|_
}x�||kr�tj||�}|s�Pn|jddd�\}	}
}|
s�d}nX|d dko|dkns7|d dko2|dknrG|dd!}n|r_|j|�}n|j
|	j	�|f�|j�}q�W|||!j�}|dkr+|j�\}
}d|jkr|
|jjd�}
t|j�|jjd�}n|t|j�}|j|||!�|S|jd
�rM|j||�n/|j||�||jkr||j|�n|S(
Niis#unexpected call to parse_starttag()iis'i����t"Rs/>s
(Rs/>(R	R"tcheck_for_whole_start_tagRttagfindR5RR?R=R$RtattrfindtunescapetappendtstripRtcountR.trfindR1tendswiththandle_startendtagthandle_starttagtCDATA_CONTENT_ELEMENTSR)(RRCtendposRtattrsR5RFttagtmtattrnametrestt	attrvalueR?RR((s"/usr/lib64/python2.7/HTMLParser.pyR6sR			$$cCs�|j}tj||�}|r�|j�}|||d!}|dkrR|dS|dkr�|jd|�rx|dS|jd|�r�dS|j||d�|jd�n|dkr�dS|d	kr�dS||kr�|S|dSntd
��dS(NiRt/s/>ii����smalformed empty start tagRs6abcdefghijklmnopqrstuvwxyz=/ABCDEFGHIJKLMNOPQRSTUVWXYZswe should not get here!(RtlocatestarttagendR5R?R3R2R!R(RRCRRaREtnext((s"/usr/lib64/python2.7/HTMLParser.pyRRKs,	cCs�|j}|||d!dks,td��tj||d�}|sLdS|j�}tj||�}|s!|jdk	r�|j	|||!�|St
j||d�}|s�|||d!dkr�|dS|j|�Sn|j�j
�}|jd|j��}|j|�|dS|jd�j
�}|jdk	ro||jkro|j	|||!�|Sn|j|�|j�|S(	Nis</sunexpected call to parse_endtagii����is</>R(RRt	endendtagR/R?t
endtagfindR5RR	R1ttagfind_tolerantRJR=R$R;t
handle_endtagR*(RRCRR5RKt	namematchttagnameR(((s"/usr/lib64/python2.7/HTMLParser.pyR7ks8	#


cCs!|j||�|j|�dS(N(R\Rk(RR`R_((s"/usr/lib64/python2.7/HTMLParser.pyR[�scCsdS(N((RR`R_((s"/usr/lib64/python2.7/HTMLParser.pyR\�scCsdS(N((RR`((s"/usr/lib64/python2.7/HTMLParser.pyRk�scCsdS(N((RRG((s"/usr/lib64/python2.7/HTMLParser.pyR>�scCsdS(N((RRG((s"/usr/lib64/python2.7/HTMLParser.pyRA�scCsdS(N((RR((s"/usr/lib64/python2.7/HTMLParser.pyR1�scCsdS(N((RR((s"/usr/lib64/python2.7/HTMLParser.pyRL�scCsdS(N((Rtdecl((s"/usr/lib64/python2.7/HTMLParser.pyRI�scCsdS(N((RR((s"/usr/lib64/python2.7/HTMLParser.pyRP�scCsdS(N((RR((s"/usr/lib64/python2.7/HTMLParser.pytunknown_decl�scs2d|kr|S�fd�}tjd||�S(NR-cs|j�d}yZ|ddkri|d}|dd
krSt|dd�}nt|�}t|�SWntk
r�d|dSXd	dl}tjdkr�id
d6}t_x0|jj	�D]\}}t|�||<q�Wny�j|SWnt
k
rd|dSXdS(Nit#itxtXis&#R,i����u'taposR-(RqRr(tgroupstinttunichrt
ValueErrorthtmlentitydefsRt
entitydefsR	tname2codepointt	iteritemstKeyError(tstcRxRyRFtv(R(s"/usr/lib64/python2.7/HTMLParser.pytreplaceEntities�s&



s#&(#?[xX]?(?:[0-9a-fA-F]+|\w{1,8}));(R%tsub(RR}R�((Rs"/usr/lib64/python2.7/HTMLParser.pyRU�s(RRN(!RR
RR]RRRRR!R	R"R#R)R*RR:RJR9R6RRR7R[R\RkR>RAR1RLRIRPRoRyRU(((s"/usr/lib64/python2.7/HTMLParser.pyRHs<										^			4	 	(										(RRR%R&RRBR@R<R4ROtcommentcloseRSRjRTtVERBOSERfRhRit	ExceptionRRR(((s"/usr/lib64/python2.7/HTMLParser.pyt<module>s&