U
    cUh?                     @   s  d Z ddlZddlZddlZddlZddlZddlZddlZddl	Z
ddlZ
ddlmZ ddlmZ ddlmZ ddlmZmZmZmZmZmZmZmZmZmZmZ ddlmZ ddl m!Z! dd	l"m#Z#m$Z$ dd
l%m&Z& ddl'm(Z( ddl)m*Z* ddl+m,Z, ddl-m.Z. ddl/m0Z0 ddl1m2Z2 ddl3m4Z4 ddl5m6Z6m7Z7m8Z8 e9e:Z;ee<e<f Z=e<ee< dddZ>G dd de?Z@e!ddddZAG dd de?ZBe<e,dddd ZCe<e,e!dd!d"ZDe=ee< d#d$d%ZEG d&d' d'ZFG d(d) d)eZGeGeGd*d+d,ZHeHd-ee( d.d/d0ZIed1d2G d3d- d-ZJG d4d5 d5eZKdDe(ee<e?f eed6  dd7d8d9ZLdEe!eMeJd:d;d<ZNe(e,ed- d=d>d?ZOG d@dA dAeZPG dBdC dCZQdS )FzO
The main purpose of this module is to expose LinkCollector.collect_sources().
    N)	dataclass)
HTMLParser)Values)CallableDictIterableListMutableMapping
NamedTupleOptionalProtocolSequenceTupleUnion)requests)Response)
RetryErrorSSLError)NetworkConnectionError)Link)SearchScope)
PipSession)raise_for_status)is_archive_fileredact_auth_from_url)vcs   )CandidatesFromPage
LinkSourcebuild_sourceurlreturnc                 C   s6   t jD ]*}|  |r| t| dkr|  S qdS )zgLook for VCS schemes in the URL.

    Returns the matched VCS scheme, or None if there's no match.
    z+:N)r   Zschemeslower
startswithlen)r"   scheme r(   ]/opt/bot/vods_filmes/script/venv/lib/python3.8/site-packages/pip/_internal/index/collector.py_match_vcs_scheme3   s    

r*   c                       s&   e Zd Zeedd fddZ  ZS )_NotAPIContentN)content_typerequest_descr#   c                    s   t  || || _|| _d S N)super__init__r,   r-   )selfr,   r-   	__class__r(   r)   r0   ?   s    z_NotAPIContent.__init__)__name__
__module____qualname__strr0   __classcell__r(   r(   r2   r)   r+   >   s   r+   )responser#   c                 C   s6   | j dd}| }|dr$dS t|| jjdS )z
    Check the Content-Type header to ensure the response contains a Simple
    API Response.

    Raises `_NotAPIContent` if the content type is not a valid content-type.
    Content-TypeUnknown)z	text/htmlz#application/vnd.pypi.simple.v1+html#application/vnd.pypi.simple.v1+jsonN)headersgetr$   r%   r+   requestmethod)r9   r,   content_type_lr(   r(   r)   _ensure_api_headerE   s    rB   c                   @   s   e Zd ZdS )_NotHTTPN)r4   r5   r6   r(   r(   r(   r)   rC   [   s   rC   )r"   sessionr#   c                 C   sF   t j| \}}}}}|dkr$t |j| dd}t| t| dS )z
    Send a HEAD request to the URL, and ensure the response contains a simple
    API Response.

    Raises `_NotHTTP` if the URL is not available for a HEAD request, or
    `_NotAPIContent` if the content type is not a valid content type.
    >   httpshttpT)Zallow_redirectsN)urllibparseurlsplitrC   headr   rB   )r"   rD   r'   netlocpathqueryfragmentrespr(   r(   r)   _ensure_api_response_   s    rP   c                 C   sz   t t| jrt| |d tdt|  |j| ddddgddd	}t	| t
| td
t| |jdd |S )aY  Access an Simple API response with GET, and return the response.

    This consists of three parts:

    1. If the URL looks suspiciously like an archive, send a HEAD first to
       check the Content-Type is HTML or Simple API, to avoid downloading a
       large file. Raise `_NotHTTP` if the content type cannot be determined, or
       `_NotAPIContent` if it is not HTML or a Simple API.
    2. Actually perform the request. Raise HTTP exceptions on network failures.
    3. Check the Content-Type header to make sure we got a Simple API response,
       and raise `_NotAPIContent` otherwise.
    rD   zGetting page %sz, r<   z*application/vnd.pypi.simple.v1+html; q=0.1ztext/html; q=0.01z	max-age=0)AcceptzCache-Control)r=   zFetched page %s as %sr:   r;   )r   r   filenamerP   loggerdebugr   r>   joinr   rB   r=   )r"   rD   rO   r(   r(   r)   _get_simple_responseq   s,    rW   )r=   r#   c                 C   s<   | r8d| kr8t j }| d |d< |d}|r8t|S dS )z=Determine if we have any encoding information in our headers.r:   zcontent-typecharsetN)emailmessageMessage	get_paramr7   )r=   mrX   r(   r(   r)   _get_encoding_from_headers   s    

r^   c                   @   s:   e Zd ZdddddZeedddZed	d
dZdS )CacheablePageContentIndexContentNpager#   c                 C   s   |j s
t|| _d S r.   )cache_link_parsingAssertionErrorrb   r1   rb   r(   r(   r)   r0      s    
zCacheablePageContent.__init__)otherr#   c                 C   s   t |t| o| jj|jjkS r.   )
isinstancetyperb   r"   )r1   rf   r(   r(   r)   __eq__   s    zCacheablePageContent.__eq__r#   c                 C   s   t | jjS r.   )hashrb   r"   r1   r(   r(   r)   __hash__   s    zCacheablePageContent.__hash__)	r4   r5   r6   r0   objectboolri   intrm   r(   r(   r(   r)   r_      s   r_   c                   @   s    e Zd Zdee dddZdS )
ParseLinksr`   ra   c                 C   s   d S r.   r(   re   r(   r(   r)   __call__       zParseLinks.__call__N)r4   r5   r6   r   r   rr   r(   r(   r(   r)   rq      s   rq   )fnr#   c                    sL   t jddttt d fddt  dtt d fdd	}|S )
z
    Given a function that parses an Iterable[Link] from an IndexContent, cache the
    function's result (keyed by CacheablePageContent), unless the IndexContent
    `page` has `page.cache_link_parsing == False`.
    N)maxsize)cacheable_pager#   c                    s   t  | jS r.   )listrb   )rv   )rt   r(   r)   wrapper   s    z*with_cached_index_content.<locals>.wrapperr`   ra   c                    s   | j rt| S t | S r.   )rc   r_   rw   )rb   rt   rx   r(   r)   wrapper_wrapper   s    z2with_cached_index_content.<locals>.wrapper_wrapper)	functools	lru_cacher_   r   r   wraps)rt   rz   r(   ry   r)   with_cached_index_content   s
    
r~   r`   ra   c           
      c   s   | j  }|drTt| j}|dg D ]"}t|| j	}|dkrHq,|V  q,dS t
| j	}| jpfd}|| j| | j	}|jp|}|jD ]$}	tj|	||d}|dkrq|V  qdS )z\
    Parse a Simple API's Index Content, and yield its anchor elements as Link objects.
    r<   filesNzutf-8)Zpage_urlbase_url)r,   r$   r%   jsonloadscontentr>   r   	from_jsonr"   HTMLLinkParserencodingfeeddecoder   anchorsZfrom_element)
rb   rA   datafilelinkparserr   r"   r   anchorr(   r(   r)   parse_links   s&    





r   T)frozenc                   @   sP   e Zd ZU dZeed< eed< ee ed< eed< dZe	ed< edd	d
Z
dS )r`   a  Represents one response (or page), along with its URL.

    :param encoding: the encoding to decode the given content.
    :param url: the URL from which the HTML was downloaded.
    :param cache_link_parsing: whether links parsed from this page's url
                               should be cached. PyPI index urls should
                               have this set to False, for example.
    r   r,   r   r"   Trc   rj   c                 C   s
   t | jS r.   )r   r"   rl   r(   r(   r)   __str__  s    zIndexContent.__str__N)r4   r5   r6   __doc__bytes__annotations__r7   r   rc   ro   r   r(   r(   r(   r)   r`      s   
	c                       sn   e Zd ZdZedd fddZeeeeee f  ddddZ	eeeee f  ee d	d
dZ
  ZS )r   zf
    HTMLParser that keeps the first base HREF and a list of all anchor
    elements' attributes.
    Nr!   c                    s$   t  jdd || _d | _g | _d S )NT)Zconvert_charrefs)r/   r0   r"   r   r   )r1   r"   r2   r(   r)   r0     s    zHTMLLinkParser.__init__)tagattrsr#   c                 C   sH   |dkr,| j d kr,| |}|d k	rD|| _ n|dkrD| jt| d S )Nbasea)r   get_hrefr   appenddict)r1   r   r   hrefr(   r(   r)   handle_starttag  s    
zHTMLLinkParser.handle_starttag)r   r#   c                 C   s"   |D ]\}}|dkr|  S qd S )Nr   r(   )r1   r   namevaluer(   r(   r)   r   &  s    
zHTMLLinkParser.get_href)r4   r5   r6   r   r7   r0   r   r   r   r   r   r8   r(   r(   r2   r)   r     s   "r   ).N)r   reasonmethr#   c                 C   s   |d krt j}|d| | d S )Nz%Could not fetch URL %s: %s - skipping)rT   rU   )r   r   r   r(   r(   r)   _handle_get_simple_fail-  s    r   )r9   rc   r#   c                 C   s&   t | j}t| j| jd || j|dS )Nr:   )r   r"   rc   )r^   r=   r`   r   r"   )r9   rc   r   r(   r(   r)   _make_index_content7  s    
r   )r   rD   r#   c          
   
   C   s  | j ddd }t|}|r0td||  d S tj|\}}}}}}|dkrtj	
tj|r|dsv|d7 }tj|d}td| zt||d	}W nD tk
r   td
|  Y n2 tk
r } ztd| |j|j W 5 d }~X Y n tk
r$ } zt| | W 5 d }~X Y n tk
rP } zt| | W 5 d }~X Y n tk
r } z$d}	|	t|7 }	t| |	tjd W 5 d }~X Y nd tjk
r } zt| d|  W 5 d }~X Y n0 tjk
r   t| d Y nX t|| jdS d S )N#r   r   zICannot look at %s URL %s because it does not support lookup as web pages.r   /z
index.htmlz# file: URL is directory, getting %srQ   z`Skipping page %s because it looks like an archive, and cannot be checked by a HTTP HEAD request.zSkipping page %s because the %s request got Content-Type: %s. The only supported Content-Types are application/vnd.pypi.simple.v1+json, application/vnd.pypi.simple.v1+html, and text/htmlz4There was a problem confirming the ssl certificate: )r   zconnection error: z	timed out)rc   ) r"   splitr*   rT   warningrG   rH   urlparseosrL   isdirr?   url2pathnameendswithurljoinrU   rW   rC   r+   r-   r,   r   r   r   r   r7   infor   ConnectionErrorZTimeoutr   rc   )
r   rD   r"   Z
vcs_schemer'   _rL   rO   excr   r(   r(   r)   _get_index_contentD  sV    

  r   c                   @   s.   e Zd ZU eee  ed< eee  ed< dS )CollectedSources
find_links
index_urlsN)r4   r5   r6   r   r   r   r   r(   r(   r(   r)   r     s   
r   c                   @   sx   e Zd ZdZeeddddZedeee	d ddd	Z
eee d
ddZeee dddZeeedddZdS )LinkCollectorz
    Responsible for collecting Link objects from all configured locations,
    making network requests as needed.

    The class's main method is its collect_sources() method.
    N)rD   search_scoper#   c                 C   s   || _ || _d S r.   )r   rD   )r1   rD   r   r(   r(   r)   r0     s    zLinkCollector.__init__F)rD   optionssuppress_no_indexr#   c                 C   sd   |j g|j }|jr8|s8tdddd |D  g }|jp@g }tj|||jd}t	||d}|S )z
        :param session: The Session to use to make requests.
        :param suppress_no_index: Whether to ignore the --no-index option
            when constructing the SearchScope object.
        zIgnoring indexes: %s,c                 s   s   | ]}t |V  qd S r.   r   ).0r"   r(   r(   r)   	<genexpr>  s     z'LinkCollector.create.<locals>.<genexpr>)r   r   no_index)rD   r   )
	index_urlextra_index_urlsr   rT   rU   rV   r   r   creater   )clsrD   r   r   r   r   r   link_collectorr(   r(   r)   r     s$    

zLinkCollector.createrj   c                 C   s   | j jS r.   )r   r   rl   r(   r(   r)   r     s    zLinkCollector.find_links)locationr#   c                 C   s   t || jdS )z>
        Fetch an HTML page containing package links.
        rQ   )r   rD   )r1   r   r(   r(   r)   fetch_response  s    zLinkCollector.fetch_response)project_namecandidates_from_pager#   c                    s   t  fddjD  }t  fddjD  }ttj	rdd t
||D }t| d dg| }td| tt|t|d	S )
Nc              	   3   s&   | ]}t | jjd d dV  qdS )Fr   Zpage_validatorZ
expand_dirrc   r   Nr    rD   Zis_secure_originr   locr   r   r1   r(   r)   r     s   	z0LinkCollector.collect_sources.<locals>.<genexpr>c              	   3   s&   | ]}t | jjd d dV  qdS )Tr   Nr   r   r   r(   r)   r     s   	c                 S   s*   g | ]"}|d k	r|j d k	rd|j  qS )Nz* )r   )r   sr(   r(   r)   
<listcomp>  s    
z1LinkCollector.collect_sources.<locals>.<listcomp>z' location(s) to search for versions of :
)r   r   )collectionsOrderedDictr   Zget_index_urls_locationsvaluesr   rT   isEnabledForloggingDEBUG	itertoolschainr&   rU   rV   r   rw   )r1   r   r   Zindex_url_sourcesZfind_links_sourceslinesr(   r   r)   collect_sources  s&    	
	
zLinkCollector.collect_sources)F)r4   r5   r6   r   r   r   r0   classmethodr   ro   r   propertyr   r7   r   r   r   r`   r   r   r   r   r(   r(   r(   r)   r     s(   	 !r   )N)T)Rr   r   email.messagerY   r{   r   r   r   r   urllib.parserG   urllib.requestdataclassesr   Zhtml.parserr   optparser   typingr   r   r   r   r	   r
   r   r   r   r   r   Zpip._vendorr   Zpip._vendor.requestsr   Zpip._vendor.requests.exceptionsr   r   pip._internal.exceptionsr   Zpip._internal.models.linkr   Z!pip._internal.models.search_scoper   pip._internal.network.sessionr   Zpip._internal.network.utilsr   Zpip._internal.utils.filetypesr   pip._internal.utils.miscr   Zpip._internal.vcsr   sourcesr   r   r    	getLoggerr4   rT   r7   ZResponseHeadersr*   	Exceptionr+   rB   rC   rP   rW   r^   r_   rq   r~   r   r`   r   r   ro   r   r   r   r   r(   r(   r(   r)   <module>   st   4
? 

  =