o
    /h4                     @  s   d Z ddlmZ ddlZddlmZ ddlmZmZm	Z	 ddl
mZmZmZmZmZmZmZmZmZmZmZmZmZmZmZmZmZ erJddlmZ G dd	 d	eeZG d
d dZ e!dj"Z#e!dj$Z%e!dj$Z&G dd dZ'G dd de'Z(dS )z
cssselect.xpath
===============

Translation of parsed CSS selectors to XPath expressions.


:copyright: (c) 2007-2012 Ian Bicking and contributors.
See AUTHORS for more details.
:license: BSD, see LICENSE for more details.

    )annotationsN)Callable)TYPE_CHECKINGOptionalcast)AttribClassCombinedSelectorElementFunctionHashMatchingNegationPseudoPseudoElementRelationSelectorSelectorErrorSpecificityAdjustmentTreeparseparse_series)Selfc                   @  s   e Zd ZdZdS )ExpressionErrorz3Unknown or unsupported selector (eg. pseudo-class).N)__name__
__module____qualname____doc__ r   r   C/var/www/html/myenv/lib/python3.10/site-packages/cssselect/xpath.pyr   -   s    r   c                   @  sd   e Zd Z				d#d$ddZd%ddZd%ddZd&d'ddZd(ddZd(ddZ		d)d*d!d"Z	dS )+	XPathExpr *Fpathstrelement	conditionstar_prefixboolreturnNonec                 C  s   || _ || _|| _d S N)r#   r%   r&   )selfr#   r%   r&   r'   r   r   r   __init__5   s   
zXPathExpr.__init__c                 C  s0   t | jt | j }| jr|d| j d7 }|S N[]r$   r#   r%   r&   )r,   r#   r   r   r   __str__@   s   zXPathExpr.__str__c                 C  s   | j j d|  dS r.   )	__class__r   r,   r   r   r   __repr__F   s   zXPathExpr.__repr__and
conjuctionr   c                 C  s0   | j rd| j  d| d| d| _ | S || _ | S )N(z) z ())r&   )r,   r&   r7   r   r   r   add_conditionI   s
   zXPathExpr.add_conditionc                 C  s0   | j dkrd S | dt| j   d| _ d S )Nr"   z	name() = )r%   r:   GenericTranslatorxpath_literalr4   r   r   r   add_name_testP   s   

zXPathExpr.add_name_testc                 C  s   |  j d7  _ dS )ze
        Append '*/' to the path to keep the context constrained
        to a single parent.
        */N)r#   r4   r   r   r   add_star_prefixW   s   zXPathExpr.add_star_prefixNcombinerotherclosing_combiner
str | Nonehas_inner_conditionc                 C  s   t | | }|jdkr||j7 }|| _|s&|r|j| n|j| _|j| _| S |j| _|jr9|  jd|j d 7  _|rB|  j|7  _| S )Nr>   r/   r0   r1   )r,   r@   rA   rB   rD   r#   r   r   r   join^   s   

zXPathExpr.join)r!   r"   r!   F)
r#   r$   r%   r$   r&   r$   r'   r(   r)   r*   )r)   r$   )r6   )r&   r$   r7   r$   r)   r   )r)   r*   )NF)
r@   r$   rA   r    rB   rC   rD   r(   r)   r   )
r   r   r   r-   r2   r5   r:   r=   r?   rE   r   r   r   r   r    4   s    



r    z('+)z^[a-zA-Z_][a-zA-Z0-9_.-]*$z^[^ \t\r\n\f]+$c                	   @  sb  e Zd ZdZdddddZddd	d
dddddZdZdZdZdZ	dZ
eZddddZ		ddddZdd$d%Zedd'd(Zdd+d,Zdd/d0Zdd3d4Zdd7d8Zdd;d<Zdd>d?ZddBdCZddFdGZddIdJZddMdNZddQdRZddTdUZddXdYZddZd[Zdd\d]Z dd^d_Z!dd`daZ"ddbdcZ#ddddeZ$ddfdgZ%		hdddkdlZ&ddmdnZ'ddodpZ(ddqdrZ)ddsdtZ*ddudvZ+ddwdxZ,ddydzZ-dd{d|Z.dd}d~Z/dddZ0dddZ1dddZ2dddZ3dddZ4dddZ5e5Z6e5Z7e5Z8e5Z9e5Z:e5Z;e5Z<e5Z=e5Z>dddZ?dddZ@dddZAdddZBdddZCdddZDdddZEdddZFdS )r;   z
    Translator for "generic" XML documents.

    Everything is case-sensitive, no assumption is made on the meaning
    of element names and attribute names.

    
descendantchilddirect_adjacentindirect_adjacent) >+~existsequalsincludes	dashmatchprefixmatchsuffixmatchsubstringmatch	different)rN   =z~=z|=z^=z$=z*=z!=idzxml:langFdescendant-or-self::cssr$   prefixr)   c                   s   d  fddt|D S )u  Translate a *group of selectors* to XPath.

        Pseudo-elements are not supported here since XPath only knows
        about "real" elements.

        :param css:
            A *group of selectors* as a string.
        :param prefix:
            This string is prepended to the XPath expression for each selector.
            The default makes selectors scoped to the context node’s subtree.
        :raises:
            :class:`~cssselect.SelectorSyntaxError` on invalid selectors,
            :class:`ExpressionError` on unknown/unsupported selectors,
            including pseudo-elements.
        :returns:
            The equivalent XPath 1.0 expression as a string.

        z | c                 3  s     | ]}j | d dV  qdS )T)translate_pseudo_elementsN)selector_to_xpath.0selectorrZ   r,   r   r   	<genexpr>   s
    
z1GenericTranslator.css_to_xpath.<locals>.<genexpr>)rE   r   )r,   rY   rZ   r   r`   r   css_to_xpath   s   zGenericTranslator.css_to_xpathr_   r   r[   r(   c                 C  s`   t |dd}|std|| |}t|| jsJ |r(|jr(| ||j}|p+dt| S )u+  Translate a parsed selector to XPath.


        :param selector:
            A parsed :class:`Selector` object.
        :param prefix:
            This string is prepended to the resulting XPath expression.
            The default makes selectors scoped to the context node’s subtree.
        :param translate_pseudo_elements:
            Unless this is set to ``True`` (as :meth:`css_to_xpath` does),
            the :attr:`~Selector.pseudo_element` attribute of the selector
            is ignored.
            It is the caller's responsibility to reject selectors
            with pseudo-elements, or to account for them somehow.
        :raises:
            :class:`ExpressionError` on unknown/unsupported selectors.
        :returns:
            The equivalent XPath 1.0 expression as a string.

        parsed_treeNz Expected a parsed selector, got r!   )getattr	TypeErrorxpath
isinstancexpathexpr_clspseudo_elementxpath_pseudo_elementr$   )r,   r_   rZ   r[   treerf   r   r   r   r\      s   

z#GenericTranslator.selector_to_xpathrf   r    ri   r   c                 C  s   t d)zTranslate a pseudo-element.

        Defaults to not supporting pseudo-elements at all,
        but can be overridden by sub-classes.

        z"Pseudo-elements are not supported.)r   )r,   rf   ri   r   r   r   rj     s   	z&GenericTranslator.xpath_pseudo_elementsc                 C  s^   t | } d| vrd|  d} | S d| vrd|  d} | S dd t| D }dd|} | S )N'"c                 S  s0   g | ]}|rd |v rd| dnd | d qS )rm   rn   r   )r^   partr   r   r   
<listcomp>  s    z3GenericTranslator.xpath_literal.<locals>.<listcomp>z
concat({}),)r$   split_at_single_quotesformatrE   )rl   parts_quotedr   r   r   r<     s   
zGenericTranslator.xpath_literalparsed_selectorr   c                 C  sR   t |j}ttttgtf  t| d|  d}|du r%t	| d||S )z%Translate any parsed selector object.xpath_Nz is not supported.)
typer   r   r   r   r   r    rd   lowerr   )r,   ru   	type_namemethodr   r   r   rf      s   
zGenericTranslator.xpathcombinedr	   c                 C  sJ   | j |j }ttttgtf t| d| d}|| |j| |jS )zTranslate a combined selector.rv   _combinator)	combinator_mapping
combinatorr   r   r    rd   rf   r_   subselector)r,   r{   r~   rz   r   r   r   xpath_combinedselector-  s   z(GenericTranslator.xpath_combinedselectornegationr   c                 C  sD   |  |j}|  |j}|  |jr|d|j dS |dS )Nnot(r9   0)rf   r_   r   r=   r&   r:   )r,   r   rf   	sub_xpathr   r   r   xpath_negation6  s   
z GenericTranslator.xpath_negationrelationr   c              	   C  s`   |  |j}|j}|j}|  |j}ttttgtf t| d| j	tt
|j  d}|||S )Nxpath_relation_r|   )rf   r_   r~   r   rc   r   r   r    rd   r}   r$   value)r,   r   rf   r~   r   rightrz   r   r   r   xpath_relation>  s   
z GenericTranslator.xpath_relationmatchingr   c                   J     |j} fdd|jD }|D ]}|  |jr"||jd q|S )Nc                      g | ]}  |qS r   rf   r]   r4   r   r   rp   N      z4GenericTranslator.xpath_matching.<locals>.<listcomp>orrf   r_   selector_listr=   r&   r:   r,   r   rf   exprser   r4   r   xpath_matchingL     z GenericTranslator.xpath_matchingr   c                   r   )Nc                   r   r   r   r]   r4   r   r   rp   W  r   zAGenericTranslator.xpath_specificityadjustment.<locals>.<listcomp>r   r   r   r   r4   r   xpath_specificityadjustmentU  r   z-GenericTranslator.xpath_specificityadjustmentfunctionr   c                 C  s^   d |jdd}tttttgtf  t| |d}|s&t	d|j d|| 
|j|S )z$Translate a functional pseudo-class.zxpath_{}_function-_NThe pseudo-class :z() is unknown)rs   namereplacer   r   r   r    r   rd   r   rf   r_   )r,   r   method_namerz   r   r   r   xpath_function^  s   
z GenericTranslator.xpath_functionpseudor   c                 C  sZ   d |jdd}ttttgtf  t| |d}|s%td|j d|| 	|j
S )zTranslate a pseudo-class.zxpath_{}_pseudor   r   Nr   z is unknown)rs   identr   r   r   r   r    rd   r   rf   r_   )r,   r   r   rz   r   r   r   xpath_pseudoi  s   zGenericTranslator.xpath_pseudor   c                 C  s   | j |j }tttttt gtf t| d| }| jr#|j	
 }n|j	}t|}|jr<|j d| }|o;t|j}|rCd| }n	d| | d}|jdu rTd}n| jratt|jj
 }n|jj}|| |j||S )z Translate an attribute selector.xpath_attrib_:@zattribute::*[name() = r0   N)attribute_operator_mappingoperatorr   r   r    r$   r   rd   lower_case_attribute_namesattribrx   is_safe_name	namespacer<   r   lower_case_attribute_valuesrf   r_   )r,   r_   r   rz   r   safer   r   r   r   r   xpath_attribt  s*   

zGenericTranslator.xpath_attribclass_selectorr   c                 C     |  |j}| |d|jS )zTranslate a class selector.z@class)rf   r_   xpath_attrib_includes
class_name)r,   r   rf   r   r   r   xpath_class  s   zGenericTranslator.xpath_classid_selectorr   c                 C  r   )zTranslate an ID selector.z@id)rf   r_   xpath_attrib_equalsrW   )r,   r   rf   r   r   r   
xpath_hash  s   zGenericTranslator.xpath_hashr
   c                 C  sr   |j }|s
d}d}ntt|}| jr| }|jr+|j d| }|o*tt|j}| j|d}|s7|  |S )z'Translate a type or universal selector.r"   Tr   )r%   )r%   r(   r   lower_case_element_namesrx   r   rh   r=   )r,   r_   r%   r   rf   r   r   r   xpath_element  s   zGenericTranslator.xpath_elementleftr   c                 C     | d|S )z;right is a child, grand-child or further descendant of leftz/descendant-or-self::*/rE   r,   r   r   r   r   r   xpath_descendant_combinator     z-GenericTranslator.xpath_descendant_combinatorc                 C  r   )z#right is an immediate child of left/r   r   r   r   r   xpath_child_combinator  s   z(GenericTranslator.xpath_child_combinatorc                 C  s   | d|}|  |dS )z)right is a sibling immediately after left/following-sibling::zposition() = 1)rE   r=   r:   )r,   r   r   rf   r   r   r    xpath_direct_adjacent_combinator  s   
z2GenericTranslator.xpath_direct_adjacent_combinatorc                 C  r   )z1right is a sibling after left, immediately or notr   r   r   r   r   r   "xpath_indirect_adjacent_combinator  r   z4GenericTranslator.xpath_indirect_adjacent_combinatorc                 C  s   |j d|dddS )zHright is a child, grand-child or further descendant of left; select leftz[descendant::r0   T)rB   rD   r   r   r   r   r   $xpath_relation_descendant_combinator  s   z6GenericTranslator.xpath_relation_descendant_combinatorc                 C     |j d|ddS )z0right is an immediate child of left; select leftz[./r0   rB   r   r   r   r   r   xpath_relation_child_combinator     z1GenericTranslator.xpath_relation_child_combinatorc                 C  s   | d|j dS )z6right is a sibling immediately after left; select leftz following-sibling::*[(name() = 'z') and (position() = 1)])r:   r%   r   r   r   r   )xpath_relation_direct_adjacent_combinator  s   z;GenericTranslator.xpath_relation_direct_adjacent_combinatorc                 C  r   )z>right is a sibling after left, immediately or not; select leftz[following-sibling::r0   r   r   r   r   r   r   +xpath_relation_indirect_adjacent_combinator  r   z=GenericTranslator.xpath_relation_indirect_adjacent_combinatorTlastr=   c              
     s  z	t |j\}}W n ty } z
td|jd|d }~ww |d }|dkr.|dkr.|S |dk r;|dk r;|dS |r?dn|j }	|sLd|	 d}
nd	|	 d}
|dkr`||
 d
| S g }|dkru|dkrt||
 d|  n
||
 d|  t|dkr|
}| t| }|dkrd| d| d}|| d| d t|dkrdnd |d	 fdd|D  |S )NzInvalid series: 'rm      r   r   r"   count(preceding-sibling::r9   count(following-sibling:: = z >= z <= r8   z +z mod z = 0z(%s)z%sz and c                 3  s    | ]} | V  qd S r+   r   )r^   
expressiontemplater   r   ra   f  s    z=GenericTranslator.xpath_nth_child_function.<locals>.<genexpr>)
r   	arguments
ValueErrorr   r:   r%   appendabslenrE   )r,   rf   r   r   r=   abexb_min_1nodetestsiblings_countexpressionsr   b_negr   r   r   xpath_nth_child_function  sD   ,
z*GenericTranslator.xpath_nth_child_functionc                 C  s   | j ||ddS )NT)r   )r   r,   rf   r   r   r   r   xpath_nth_last_child_functionj  s   z/GenericTranslator.xpath_nth_last_child_functionc                 C  s"   |j dkr	td| j||ddS )Nr"   "*:nth-of-type() is not implementedF)r=   r%   r   r   r   r   r   r   xpath_nth_of_type_functiono  s   
z,GenericTranslator.xpath_nth_of_type_functionc                 C  s$   |j dkr	td| j||dddS )Nr"   r   TF)r   r=   r   r   r   r   r   xpath_nth_last_of_type_functionv  s
   
z1GenericTranslator.xpath_nth_last_of_type_functionc                 C  N   |  dgdgfvrtd|jtt|jd j}|d| | dS )NSTRINGIDENTz7Expected a single string or ident for :contains(), got r   zcontains(., r9   argument_typesr   r   r   r$   r   r:   r<   r,   rf   r   r   r   r   r   xpath_contains_function  s   
z)GenericTranslator.xpath_contains_functionc                 C  r   )Nr   r   3Expected a single string or ident for :lang(), got r   zlang(r9   r   r   r   r   r   xpath_lang_function  s   
z%GenericTranslator.xpath_lang_functionc                 C  
   | dS )Nznot(parent::*)r:   r,   rf   r   r   r   xpath_root_pseudo     
z#GenericTranslator.xpath_root_pseudoc                 C  r   )N1r   r   r   r   r   xpath_scope_pseudo  r   z$GenericTranslator.xpath_scope_pseudoc                 C  r   )Nzcount(preceding-sibling::*) = 0r   r   r   r   r   xpath_first_child_pseudo  r   z*GenericTranslator.xpath_first_child_pseudoc                 C  r   )Nzcount(following-sibling::*) = 0r   r   r   r   r   xpath_last_child_pseudo  r   z)GenericTranslator.xpath_last_child_pseudoc                 C  &   |j dkr	td|d|j  dS )Nr"   z"*:first-of-type is not implementedr   ) = 0r%   r   r:   r   r   r   r   xpath_first_of_type_pseudo     
z,GenericTranslator.xpath_first_of_type_pseudoc                 C  r   )Nr"   z!*:last-of-type is not implementedr   r   r   r   r   r   r   xpath_last_of_type_pseudo  r   z+GenericTranslator.xpath_last_of_type_pseudoc                 C  r   )Nzcount(parent::*/child::*) = 1r   r   r   r   r   xpath_only_child_pseudo  r   z)GenericTranslator.xpath_only_child_pseudoc                 C  r   )Nr"   z!*:only-of-type is not implementedzcount(parent::*/child::z) = 1r   r   r   r   r   xpath_only_of_type_pseudo  r   z+GenericTranslator.xpath_only_of_type_pseudoc                 C  r   )Nznot(*) and not(string-length())r   r   r   r   r   xpath_empty_pseudo  r   z$GenericTranslator.xpath_empty_pseudoc                 C  r   )z:Common implementation for pseudo-classes that never match.r   r   r   r   r   r   pseudo_never_matches  s   
z&GenericTranslator.pseudo_never_matchesr   r   rC   c                 C  s   |rJ | | |S r+   r   r,   rf   r   r   r   r   r   xpath_attrib_exists  s   
z%GenericTranslator.xpath_attrib_existsc                 C  s*   |d usJ | | d| |  |S )Nr   r:   r<   r  r   r   r   r     s   z%GenericTranslator.xpath_attrib_equalsc              
   C  sT   |d usJ |r| d| d| d| |  |S | | d| |  |S )Nr   z) or z != r  r  r   r   r   xpath_attrib_different  s   "z(GenericTranslator.xpath_attrib_differentc                 C  sL   |rt |r| d| d }|| d| d| d |S |d |S )NrJ   z* and contains(concat(' ', normalize-space(z	), ' '), r9   r   )is_non_whitespacer<   r:   )r,   rf   r   r   argr   r   r   r     s   
z'GenericTranslator.xpath_attrib_includesc                 C  sP   |d usJ |  |}|  |d }|| d| d| d| d| d
 |S )Nr   z and (r   z or starts-with(, z)))r<   r:   )r,   rf   r   r   r	  arg_dashr   r   r   xpath_attrib_dashmatch  s   
 z(GenericTranslator.xpath_attrib_dashmatchc              	   C  8   |r| | d| d| | d |S | d |S )Nz and starts-with(r
  r9   r   r  r  r   r   r   xpath_attrib_prefixmatch  s   
z*GenericTranslator.xpath_attrib_prefixmatchc                 C  sJ   |r| | d| d| dt|d  d| | 	 |S | d |S )Nz and substring(z, string-length(z)-r   z) = r   )r:   r   r<   r  r   r   r   xpath_attrib_suffixmatch  s   ,
z*GenericTranslator.xpath_attrib_suffixmatchc              	   C  r  )Nz and contains(r
  r9   r   r  r  r   r   r   xpath_attrib_substringmatch  s   
z-GenericTranslator.xpath_attrib_substringmatchN)rX   )rY   r$   rZ   r$   r)   r$   )rX   F)r_   r   rZ   r$   r[   r(   r)   r$   )rf   r    ri   r   r)   r    )rl   r$   r)   r$   )ru   r   r)   r    )r{   r	   r)   r    )r   r   r)   r    )r   r   r)   r    )r   r   r)   r    )r   r   r)   r    )r   r   r)   r    )r   r   r)   r    )r_   r   r)   r    )r   r   r)   r    )r   r   r)   r    )r_   r
   r)   r    )r   r    r   r    r)   r    )FT)
rf   r    r   r   r   r(   r=   r(   r)   r    rf   r    r   r   r)   r    rf   r    r)   r    )rf   r    r   r$   r   rC   r)   r    )Gr   r   r   r   r}   r   id_attributelang_attributer   r   r   r    rh   rb   r\   rj   staticmethodr<   rf   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r  r  r  xpath_link_pseudoxpath_visited_pseudoxpath_hover_pseudoxpath_active_pseudoxpath_focus_pseudoxpath_target_pseudoxpath_enabled_pseudoxpath_disabled_pseudoxpath_checked_pseudor  r   r  r   r  r  r  r  r   r   r   r   r;      s    
#


	


	
	












 



	


















r;   c                   @  sR   e Zd ZdZdZdddd	ZdddZdddZdddZdddZ	dddZ
dS )HTMLTranslatora  
    Translator for (X)HTML documents.

    Has a more useful implementation of some pseudo-classes based on
    HTML-specific element names and attribute names, as described in
    the `HTML5 specification`_. It assumes no-quirks mode.
    The API is the same as :class:`GenericTranslator`.

    .. _HTML5 specification: http://www.w3.org/TR/html5/links.html#selectors

    :param xhtml:
        If false (the default), element names and attribute names
        are case-insensitive.

    langFxhtmlr(   r)   r*   c                 C  s   || _ |sd| _d| _d S d S )NT)r!  r   r   )r,   r!  r   r   r   r-   3  s
   
zHTMLTranslator.__init__rf   r    c                 C  r   )Nz(@selected and name(.) = 'option') or (@checked and (name(.) = 'input' or name(.) = 'command')and (@type = 'checkbox' or @type = 'radio'))r   r   r   r   r   r  :     z#HTMLTranslator.xpath_checked_pseudor   r   c                 C  sd   |  dgdgfvrtd|j|jd j}|sJ | | d }|d| j d| dS )	Nr   r   r   r   r   z<ancestor-or-self::*[@lang][1][starts-with(concat(translate(@zE, 'ABCDEFGHIJKLMNOPQRSTUVWXYZ', 'abcdefghijklmnopqrstuvwxyz'), '-'), z)])r   r   r   r   r<   rx   r:   r  )r,   rf   r   r   r	  r   r   r   r   C  s   
z"HTMLTranslator.xpath_lang_functionc                 C  r   )NzA@href and (name(.) = 'a' or name(.) = 'link' or name(.) = 'area')r   r   r   r   r   r  S  s   z HTMLTranslator.xpath_link_pseudoc                 C  r   )Na  
        (
            @disabled and
            (
                (name(.) = 'input' and @type != 'hidden') or
                name(.) = 'button' or
                name(.) = 'select' or
                name(.) = 'textarea' or
                name(.) = 'command' or
                name(.) = 'fieldset' or
                name(.) = 'optgroup' or
                name(.) = 'option'
            )
        ) or (
            (
                (name(.) = 'input' and @type != 'hidden') or
                name(.) = 'button' or
                name(.) = 'select' or
                name(.) = 'textarea'
            )
            and ancestor::fieldset[@disabled]
        )
        r   r   r   r   r   r  [  r"  z$HTMLTranslator.xpath_disabled_pseudoc                 C  r   )Na'  
        (
            @href and (
                name(.) = 'a' or
                name(.) = 'link' or
                name(.) = 'area'
            )
        ) or (
            (
                name(.) = 'command' or
                name(.) = 'fieldset' or
                name(.) = 'optgroup'
            )
            and not(@disabled)
        ) or (
            (
                (name(.) = 'input' and @type != 'hidden') or
                name(.) = 'button' or
                name(.) = 'select' or
                name(.) = 'textarea' or
                name(.) = 'keygen'
            )
            and not (@disabled or ancestor::fieldset[@disabled])
        ) or (
            name(.) = 'option' and not(
                @disabled or ancestor::optgroup[@disabled]
            )
        )
        r   r   r   r   r   r  y  r"  z#HTMLTranslator.xpath_enabled_pseudoN)F)r!  r(   r)   r*   r  r  )r   r   r   r   r  r-   r  r   r  r  r  r   r   r   r   r     s    

	

r  ))r   
__future__r   recollections.abcr   typingr   r   r   cssselect.parserr   r   r	   r
   r   r   r   r   r   r   r   r   r   r   r   r   r   typing_extensionsr   RuntimeErrorr   r    compilesplitrr   matchr   r  r;   r  r   r   r   r   <module>   s(    LD     