
    gX                     Z   U d Z ddlZddlZddlZddlZddlZddlZddlmZ ddl	m
Z
 ddlmZmZmZmZmZ ddlZddlmZmZ ddlmZ ddlmZ dd	lmZ d
dlmZ d
dlmZmZmZm Z m!Z!m"Z"m#Z# ddlm$Z$ ddl%m&Z& ddl'm(Z( ddl)m*Z*  e$jV                  e,      Z-dZ.dZ/ ej`                  dejb                        Z2 G d de      Z3 G d de      Z4dejj                  fdZ6eg ejj                  f   Z7e6a8e7e9d<   e6fde7ddfdZ:dejj                  fdZ;d8d Z<ed!e=d"e=dejj                  fd#       Z>d$dd%ej~                  ej                  fe
j                  d&d'e*d(eBd)e=d*eCd+eCd,eeeD   eeeD   d-f   f   d.ee=ee=d-f   f   defd/ZEd(eBd0eeB   deBfd1ZFd9d2ed3eeB   ddfd4ZGd5ee!   d6eBd2ede!fd7ZHy):z>Contains utilities to handle HTTP requests in Huggingface Hub.    N)	lru_cache)
HTTPStatus)CallableOptionalTupleTypeUnion)	HTTPErrorResponse)HTTPAdapter)PreparedRequest)OfflineModeIsEnabled   )	constants)BadRequestErrorDisabledRepoErrorEntryNotFoundErrorGatedRepoErrorHfHubHTTPErrorRepositoryNotFoundErrorRevisionNotFoundError   )logging)JSONDecodeError)SliceFileObj)HTTP_METHOD_TX-Amzn-Trace-Idzx-request-ida  
        # staging or production endpoint
        ^https://[^/]+
        (
            # on /api/repo_type/repo_id
            /api/(models|datasets|spaces)/(.+)
            |
            # or /repo_id/resolve/revision/...
            /(.+)/resolve/(.+)
        )
    )flagsc                   6     e Zd ZdZ fdZdedef fdZ xZS )UniqueRequestIdAdapterr   c                    t        |   |fi | t        |j                  vrO|j                  j	                  t
              xs t        t        j                               |j                  t        <   t        |j                  j	                  dd            j                  d      }t        j                  d|j                  t            d|j                   d|j                   d| d	       y )	Nauthorization z
Bearer hf_zRequest z:  z (authenticated: ))superadd_headersX_AMZN_TRACE_IDheadersgetX_REQUEST_IDstruuiduuid4
startswithloggerdebugmethodurl)selfrequestkwargs	has_token	__class__s       P/var/www/openai/venv/lib/python3.12/site-packages/huggingface_hub/utils/_http.pyr'   z"UniqueRequestIdAdapter.add_headersM   s    G.v. '//1/6/B/B</P/eTWX\XbXbXdTeGOOO, ++OR@ALL\Z	w787>>:J!GKK=Xijsittuv	
    r5   returnc                     	 t        |   |g|i |S # t        j                  $ rA}|j                  j                  t              }|g |j                  d| d|_         d}~ww xY w)zSCatch any RequestException to append request id to the error message for debugging.Nz(Request ID: r%   )r&   sendrequestsRequestExceptionr)   r*   r(   args)r4   r5   r@   r6   e
request_idr8   s         r9   r=   zUniqueRequestIdAdapter.sendZ   sr    	7<9$9&99(( 	 ,,_=J%A166A]:,a#@A	s    A*<A%%A*)	__name__
__module____qualname__r(   r'   r   r   r=   __classcell__)r8   s   @r9   r    r    J   s%    'O
	O 	 	 	r:   r    c                       e Zd ZdedefdZy)OfflineAdapterr5   r;   c                 4    t        d|j                   d      )NzCannot reach za: offline mode is enabled. To disable it, please unset the `HF_HUB_OFFLINE` environment variable.)r   r3   )r4   r5   r@   r6   s       r9   r=   zOfflineAdapter.sendg   s&    "GKK=  )J  K
 	
r:   N)rC   rD   rE   r   r   r=    r:   r9   rH   rH   f   s    
O 
 
r:   rH   r;   c                  "   t        j                         } t        j                  r6| j	                  dt                      | j	                  dt                      | S | j	                  dt                      | j	                  dt                      | S )Nzhttp://zhttps://)r>   Sessionr   HF_HUB_OFFLINEmountrH   r    )sessions    r9   _default_backend_factoryrP   m   sm     Gi!12j."23 N 	i!7!9:j"8":;Nr:   _GLOBAL_BACKEND_FACTORYbackend_factoryc                     | a t                y)a  
    Configure the HTTP backend by providing a `backend_factory`. Any HTTP calls made by `huggingface_hub` will use a
    Session object instantiated by this factory. This can be useful if you are running your scripts in a specific
    environment requiring custom configuration (e.g. custom proxy or certifications).

    Use [`get_session`] to get a configured Session. Since `requests.Session` is not guaranteed to be thread-safe,
    `huggingface_hub` creates 1 Session instance per thread. They are all instantiated using the same `backend_factory`
    set in [`configure_http_backend`]. A LRU cache is used to cache the created sessions (and connections) between
    calls. Max size is 128 to avoid memory leaks if thousands of threads are spawned.

    See [this issue](https://github.com/psf/requests/issues/2766) to know more about thread-safety in `requests`.

    Example:
    ```py
    import requests
    from huggingface_hub import configure_http_backend, get_session

    # Create a factory function that returns a Session with configured proxies
    def backend_factory() -> requests.Session:
        session = requests.Session()
        session.proxies = {"http": "http://10.10.1.10:3128", "https": "https://10.10.1.11:1080"}
        return session

    # Set it as the default session factory
    configure_http_backend(backend_factory=backend_factory)

    # In practice, this is mostly done internally in `huggingface_hub`
    session = get_session()
    ```
    N)rQ   reset_sessions)rR   s    r9   configure_http_backendrU   |   s    @ .r:   c                  d    t        t        j                         t        j                               S )a  
    Get a `requests.Session` object, using the session factory from the user.

    Use [`get_session`] to get a configured Session. Since `requests.Session` is not guaranteed to be thread-safe,
    `huggingface_hub` creates 1 Session instance per thread. They are all instantiated using the same `backend_factory`
    set in [`configure_http_backend`]. A LRU cache is used to cache the created sessions (and connections) between
    calls. Max size is 128 to avoid memory leaks if thousands of threads are spawned.

    See [this issue](https://github.com/psf/requests/issues/2766) to know more about thread-safety in `requests`.

    Example:
    ```py
    import requests
    from huggingface_hub import configure_http_backend, get_session

    # Create a factory function that returns a Session with configured proxies
    def backend_factory() -> requests.Session:
        session = requests.Session()
        session.proxies = {"http": "http://10.10.1.10:3128", "https": "https://10.10.1.11:1080"}
        return session

    # Set it as the default session factory
    configure_http_backend(backend_factory=backend_factory)

    # In practice, this is mostly done internally in `huggingface_hub`
    session = get_session()
    ```
    
process_id	thread_id)_get_session_from_cacheosgetpid	threading	get_identrJ   r:   r9   get_sessionr_      s     : #biikYEXEXEZ[[r:   c                  ,    t         j                          y)zReset the cache of sessions.

    Mostly used internally when sessions are reconfigured or an SSLError is raised.
    See [`configure_http_backend`] for more details.
    N)rZ   cache_clearrJ   r:   r9   rT   rT      s     '')r:   rX   rY   c                     t               S )z
    Create a new session per thread using global factory. Using LRU cache (maxsize 128) to avoid memory leaks when
    using thousands of threads. Cache is cleared when `configure_http_backend` is called.
    )rQ   rW   s     r9   rZ   rZ      s     #$$r:         )max_retriesbase_wait_timemax_wait_timeretry_on_exceptionsretry_on_status_codesr2   r3   re   rf   rg   rh   .ri   c          	      $   t        |t              r|f}t        |t              r|f}d}|}	d}
d|v r6t        |d   t        j                  t
        f      r|d   j                         }
t               }	 |dz  }	 |
|d   j                  |
        |j                  d| |d|}|j                  |vr|S t        j                  d|j                   d|  d|        ||kD  r|j                          |S 	 t        j                  d|	 d| d| d       t#        j$                  |	       t'        ||	dz        }	# |$ rS}t        j                  d	| d
|  d|        t        |t        j                        r
t!                ||kD  r|Y d}~d}~ww xY w)a#  Wrapper around requests to retry calls on an endpoint, with exponential backoff.

    Endpoint call is retried on exceptions (ex: connection timeout, proxy error,...)
    and/or on specific status codes (ex: service unavailable). If the call failed more
    than `max_retries`, the exception is thrown or `raise_for_status` is called on the
    response object.

    Re-implement mechanisms from the `backoff` library to avoid adding an external
    dependencies to `hugging_face_hub`. See https://github.com/litl/backoff.

    Args:
        method (`Literal["GET", "OPTIONS", "HEAD", "POST", "PUT", "PATCH", "DELETE"]`):
            HTTP method to perform.
        url (`str`):
            The URL of the resource to fetch.
        max_retries (`int`, *optional*, defaults to `5`):
            Maximum number of retries, defaults to 5 (no retries).
        base_wait_time (`float`, *optional*, defaults to `1`):
            Duration (in seconds) to wait before retrying the first time.
            Wait time between retries then grows exponentially, capped by
            `max_wait_time`.
        max_wait_time (`float`, *optional*, defaults to `8`):
            Maximum duration (in seconds) to wait before retrying.
        retry_on_exceptions (`Type[Exception]` or `Tuple[Type[Exception]]`, *optional*):
            Define which exceptions must be caught to retry the request. Can be a single type or a tuple of types.
            By default, retry on `requests.Timeout` and `requests.ConnectionError`.
        retry_on_status_codes (`int` or `Tuple[int]`, *optional*, defaults to `503`):
            Define on which status codes the request must be retried. By default, only
            HTTP 503 Service Unavailable is retried.
        **kwargs (`dict`, *optional*):
            kwargs to pass to `requests.request`.

    Example:
    ```
    >>> from huggingface_hub.utils import http_backoff

    # Same usage as "requests.request".
    >>> response = http_backoff("GET", "https://www.google.com")
    >>> response.raise_for_status()

    # If you expect a Gateway Timeout from time to time
    >>> http_backoff("PUT", upload_url, data=data, retry_on_status_codes=504)
    >>> response.raise_for_status()
    ```

    <Tip warning={true}>

    When using `requests` it is possible to stream data by passing an iterator to the
    `data` argument. On http backoff this is a problem as the iterator is not reset
    after a failed call. This issue is mitigated for file objects or any IO streams
    by saving the initial position of the cursor (with `data.tell()`) and resetting the
    cursor between each call (with `data.seek()`). For arbitrary iterators, http backoff
    will fail. If this is a hard constraint for you, please let us know by opening an
    issue on [Github](https://github.com/huggingface/huggingface_hub).

    </Tip>
    r   Ndatar   )r2   r3   zHTTP Error z thrown while requesting r$   'z' thrown while requesting zRetrying in z	s [Retry /z].r   rJ   )
isinstancetypeintioIOBaser   tellr_   seekr5   status_coder0   warningraise_for_statusr>   ConnectionErrorrT   timesleepmin)r2   r3   re   rf   rg   rh   ri   r6   nb_tries
sleep_timeio_obj_initial_posrO   responseerrs                 r9   http_backoffr      s   N %t,24'-!6 8HJ
 Jvf~		<7PQ#F^002mG
A	 "-v##$67 'wHf#HHH##+@@ NN[)=)=(>>WX^W__`ad`efg+%))+  	 &  	j\8*Ak]RTUV

: 
Q7
G * # 	NNQse#=fXQseLM#x778 +%	 &	s   8:D7 3>D7 7F<A	F

Fendpointc                     |xs t         j                  }|dt         j                  t         j                  fvr@| j	                  t         j                  |      } | j	                  t         j                  |      } | S )zReplace the default endpoint in a URL by a custom one.

    This is useful when using a proxy and the Hugging Face Hub returns a URL with the default endpoint.
    N)r   ENDPOINT_HF_DEFAULT_ENDPOINT_HF_DEFAULT_STAGING_ENDPOINTreplace)r3   r   s     r9   fix_hf_endpoint_in_urlr   P  s`    
 -9--Hi<<i>d>deekk)88(Ckk)@@(KJr:   r   endpoint_namec                    	 | j                          y# t        $ r}| j                  j                  d      }| j                  j                  d      }|dk(  r5| j                   ddz   d| j
                   dz   }t        t        ||       ||dk(  r5| j                   ddz   d	| j
                   dz   }t        t        ||       ||d
k(  r5| j                   ddz   d| j
                   dz   }t        t        ||       ||dk(  r;| j                   ddz   d| j
                   dz   dz   dz   }t        t        ||       ||dk(  sZ| j                  dk(  r| j                  w| j                  j
                  at        j                  | j                  j
                        8| j                   ddz   d| j
                   dz   dz   }t        t        ||       || j                  dk(  r|d| dnd}t        t        ||       || j                  dk(  r9d| j                   d| dd| j
                   dz   dz   }t        t         ||       || j                  dk(  r[| j                  j                  j                  d      }| d| d| j                  j                  d        d}t        t         ||       |t        t         t#        |      |       |d}~ww xY w)!a  
    Internal version of `response.raise_for_status()` that will refine a
    potential HTTPError. Raised exception will be an instance of `HfHubHTTPError`.

    This helper is meant to be the unique method to raise_for_status when making a call
    to the Hugging Face Hub.


    Example:
    ```py
        import requests
        from huggingface_hub.utils import get_session, hf_raise_for_status, HfHubHTTPError

        response = get_session().post(...)
        try:
            hf_raise_for_status(response)
        except HfHubHTTPError as e:
            print(str(e)) # formatted message
            e.request_id, e.server_message # details returned by server

            # Complete the error message with additional information once it's raised
            e.append_to_message("
`create_commit` expects the repository to exist.")
            raise
    ```

    Args:
        response (`Response`):
            Response from the server.
        endpoint_name (`str`, *optional*):
            Name of the endpoint that has been called. If provided, the error message
            will be more complete.

    <Tip warning={true}>

    Raises when the request has failed:

        - [`~utils.RepositoryNotFoundError`]
            If the repository to download from cannot be found. This may be because it
            doesn't exist, because `repo_type` is not set correctly, or because the repo
            is `private` and you do not have access.
        - [`~utils.GatedRepoError`]
            If the repository exists but is gated and the user is not on the authorized
            list.
        - [`~utils.RevisionNotFoundError`]
            If the repository exists but the revision couldn't be find.
        - [`~utils.EntryNotFoundError`]
            If the repository exists but the entry (e.g. the requested file) couldn't be
            find.
        - [`~utils.BadRequestError`]
            If request failed with a HTTP 400 BadRequest error.
        - [`~utils.HfHubHTTPError`]
            If request failed for a reason not listed above.

    </Tip>
    zX-Error-CodeX-Error-MessageRevisionNotFoundz Client Error.

zRevision Not Found for url: .EntryNotFoundzEntry Not Found for url: 	GatedRepoz!Cannot access gated repo for url z$Access to this resource is disabled.z!Cannot access repository for url 
RepoNotFoundi  NzRepository Not Found for url: z
Please make sure you specified the correct `repo_id` and `repo_type`.
If you are trying to access a private or gated repo, make sure you are authenticated.i  z

Bad request for z
 endpoint:z

Bad request:i  z Forbidden: z
Cannot access content at: z2
Make sure your token has the correct permissions.i  Rangez. Requested range: z. Content-Range: zContent-Range)rw   r
   r)   r*   ru   r3   _formatr   r   r   r   r5   REPO_API_REGEXsearchr   r   r   r,   )r   r   rA   
error_codeerror_messagemessagerange_headers          r9   hf_raise_for_statusr   ]  s[   pH?!!# F?%%)).9
 ((,,->?++!--.n=FKghphthtguuvIwwG/(CJ?*!--.n=FKdemeqeqdrrsIttG,gx@aG;&''(7&@EfgogsgsfttuCvv  .'8<!CDD''(75hll^1EF  9	9  +Wh?QF>)  C'  ,  $$0%%h&6&6&:&:;G ''(728<<.BC44  17HE1L!!S(DQD]&}oZ@cu  /7H=1D!!S(x++,LqI0a@AGH 
 .'8<!C!!S(#++3377@L.|n<MhN^N^NbNbcrNsMttuvG.'8<!C nc!fh7Q>MF?s    
KJ3KK
error_typecustom_messagec                    g }|j                   j                  d      }||j                  |       	 |j                         }|j                  d      }|3t	        |t
              r|j                  |       n|j                  |       |j                  d      }| |D ]  }d|v s|j                  |d           |D 	cg c]#  }	|	j                         s|	j                         % }}	t        t        j                  |            }dj                  |      }
|}|
r5|
j                         |j                         vrd	|v r	|d|
z   z  }n|d	|
z   z  }t        |j                   j                  t        d            }|rd
| d}n1t        |j                   j                  t         d            }|rd| d}|rI|j                         |j                         vr)d|v r |j#                  d      }|d | z   ||d  z   }n|z  } | |j                         ||
xs d       S # t        $ rY |j                   j                  dd      }|j                  r-d|j                         vr|j                  |j                         Y w xY wc c}	w )Nr   errorerrorsr   zContent-Typer#   htmlr   r   z (Request ID: r%   z (Amzn Trace ID: )r   server_message)r)   r*   appendjsonrn   listextendr   textlowerstripdictfromkeysjoinr,   r+   r(   index)r   r   r   server_errorsfrom_headersrk   r   r   content_typeliner   final_error_messagerB   request_id_messagenewline_indexs                  r9   r   r     s   M ##''(9:L\*0}}!%&$$U+ $$U+(#%!((y)9:   /<Lmdtzz|TZZ\mML }56M YY}-N )...08L8L8NN^#4.#886N#::X%%)),;<J-j\; ))--orBC
#4ZL!Bj&&(0C0I0I0KK&&/55d;M#N]36HHK^_l_mKnn    #55 )//1HUcUkgkllU  0''++NB?==V<+=+=+??  /	0 Ms%   A2H %H ?JJAI>=I>)r;   N)N)I__doc__rq   r[   rer]   ry   r-   	functoolsr   httpr   typingr   r   r   r   r	   r>   r
   r   requests.adaptersr   requests.modelsr   huggingface_hub.errorsr   r#   r   r   r   r   r   r   r   r   r   r   _fixesr   _lfsr   _typingr   
get_loggerrC   r0   r(   r+   compileVERBOSEr   r    rH   rL   rP   BACKEND_FACTORY_TrQ   __annotations__rU   r_   rT   rp   rZ   Timeoutrx   SERVICE_UNAVAILABLEr,   float	Exceptionr   r   r   r   rJ   r:   r9   <module>r      su   E 	 	 	      9 9  ( ) + 7     #  " 
		H	%
 $
 ** [ 8
[ 
("2"2  R!1!112 -E * E AY !,= !]a !H\X%% \@* % % %@P@P % %   P :D9W9W{8{8	{8 	{8
 {8 {8 tId9os6J0KKL{8 !eCHo!56{8 {8|
 
x} 
 
@?( @?8C= @?TX @?FGm^, Gmc GmX GmZh Gmr:   