
    h.-                         d Z ddlZddlmZ ddlmZmZmZmZm	Z	m
Z
mZ ddlZddlZddlZddlmZ ddlmZmZ ddlmZmZmZmZmZ ddlmZ d	gZ G d
 d	ee      Z G d d      Zy)a  
TextEmbed: Embedding Inference Server

TextEmbed provides a high-throughput, low-latency solution for serving embeddings.
It supports various sentence-transformer models.
Now, it includes the ability to deploy image embedding models.
TextEmbed offers flexibility and scalability for diverse applications.

TextEmbed is maintained by Keval Dekivadiya and is licensed under the Apache-2.0 license.
    N)ThreadPoolExecutor)AnyCallableDictListOptionalTupleUnion)
Embeddings)from_envsecret_from_env)	BaseModel
ConfigDictField	SecretStrmodel_validator)SelfTextEmbedEmbeddingsc                   ,   e Zd ZU dZeed<   	  e edd            Zeed<   	  e e	d            Z
eed	<   	 d
Zeed<   	  ed      Z ed      defd       Zdee   deee      fdZdee   deee      fdZdedee   fdZdedee   fdZy
)r   a  
    A class to handle embedding requests to the TextEmbed API.

    Attributes:
        model : The TextEmbed model ID to use for embeddings.
        api_url : The base URL for the TextEmbed API.
        api_key : The API key for authenticating with the TextEmbed API.
        client : The TextEmbed client instance.

    Example:
        .. code-block:: python

            from langchain_community.embeddings import TextEmbedEmbeddings

            embeddings = TextEmbedEmbeddings(
                model="sentence-transformers/clip-ViT-B-32",
                api_url="http://localhost:8000/v1",
                api_key="<API_KEY>"
            )

    For more information: https://github.com/kevaldekivadiya2415/textembed/blob/main/docs/setup.md
    modelTEXTEMBED_API_URLhttp://localhost:8000/v1)default)default_factoryapi_urlTEXTEMBED_API_KEYapi_keyNclientforbid)extraafter)modereturnc                 n    t        | j                  | j                  j                               | _        | S )z7Validate that api key and URL exist in the environment.)hostr   )#AsyncOpenAITextEmbedEmbeddingClientr   r   get_secret_valuer   )selfs    f/var/www/html/eduruby.in/venv/lib/python3.12/site-packages/langchain_community/embeddings/textembed.pyvalidate_environmentz(TextEmbedEmbeddings.validate_environmentG   s-     :t||'D'D'F
     textsc                 T    | j                   j                  | j                  |      }|S )zCall out to TextEmbed's embedding endpoint.

        Args:
            texts (List[str]): The list of texts to embed.

        Returns:
            List[List[float]]: List of embeddings, one for each text.
        r   r,   )r   embedr   r(   r,   
embeddingss      r)   embed_documentsz#TextEmbedEmbeddings.embed_documentsO   s/     [[&&** ' 

 r+   c                 p   K   | j                   j                  | j                  |       d{   }|S 7 w)zAsync call out to TextEmbed's embedding endpoint.

        Args:
            texts (List[str]): The list of texts to embed.

        Returns:
            List[List[float]]: List of embeddings, one for each text.
        r.   N)r   aembedr   r0   s      r)   aembed_documentsz$TextEmbedEmbeddings.aembed_documents^   s=       ;;--** . 
 

 	
s   +646textc                 ,    | j                  |g      d   S )zCall out to TextEmbed's embedding endpoint for a single query.

        Args:
            text (str): The text to embed.

        Returns:
            List[float]: Embeddings for the text.
        r   )r2   )r(   r6   s     r)   embed_queryzTextEmbedEmbeddings.embed_querym   s     ##TF+A..r+   c                 L   K   | j                  |g       d{   }|d   S 7 	w)zAsync call out to TextEmbed's embedding endpoint for a single query.

        Args:
            text (str): The text to embed.

        Returns:
            List[float]: Embeddings for the text.
        Nr   )r5   )r(   r6   r1   s      r)   aembed_queryz TextEmbedEmbeddings.aembed_queryx   s,       00$88
!} 9s   $"
$)__name__
__module____qualname____doc__str__annotations__r   r   r   r   r   r   r   r   r   model_configr   r   r*   r   floatr2   r5   r8   r:    r+   r)   r   r      s    . J( )C
GS 
 ?R/STGYT$FCL '"d  #T#Y 4U3D DI $tE{:K 	/ 	/U 	/
s 
tE{ 
r+   c            
          e Zd ZdZ	 	 	 ddedeedf   deej                     ddfdZ	e
efdee   d	edeee   ef   fd
       Zdee   deee      fdZe
deee      dee   fd       Zdedee   deeef   fdZdedee   deee      fdZdedee   deee      fdZdej                  deeef   deee      fdZdedee   deee      fdZy)r&   a  
    A client to handle synchronous and asynchronous requests to the TextEmbed API.

    Attributes:
        host (str): The base URL for the TextEmbed API.
        api_key (str): The API key for authenticating with the TextEmbed API.
        aiosession (Optional[aiohttp.ClientSession]): The aiohttp session for async requests.
        _batch_size (int): Maximum batch size for a single request.
    Nr%   r   
aiosessionr#   c                     || _         || _        || _        | j                   t        | j                         dk  rt	        d      d| _        y )N   z+Parameter `host` must be set to a valid URL   )r%   r   rE   len
ValueError_batch_size)r(   r%   r   rE   s       r)   __init__z,AsyncOpenAITextEmbedEmbeddingClient.__init__   sF     	$99DII 2JKKr+   r,   sorterc                     t        |       dk(  r| d fS t        j                  | D cg c]  } ||        c}      D cg c]  }| |   	 }}|fdfS c c}w c c}w )al  
        Sorts texts in ascending order and provides a function to restore the original order.

        Args:
            texts (List[str]): List of texts to sort.
            sorter (Callable, optional): Sorting function, defaults to length.

        Returns:
            Tuple[List[str], Callable]: Sorted texts and a function to restore original order.
           c                     | S NrC   )ts    r)   <lambda>z>AsyncOpenAITextEmbedEmbeddingClient._permute.<locals>.<lambda>   s    A r+   c                 Z    t        j                        D cg c]  }| |   	 c}S c c}w rQ   )npargsort)unsorted_embeddingsidxlength_sorted_idxs     r)   rS   z>AsyncOpenAITextEmbedEmbeddingClient._permute.<locals>.<lambda>   s-    02

;L0M:
),$:
  :
s   ()rI   rU   rV   )r,   rM   senrX   texts_sortedrY   s        @r)   _permutez,AsyncOpenAITextEmbedEmbeddingClient._permute   sm     u:?+%%JJ'F'FG.?@sc
@@ 
 
 	
 (G@s   AAc                     t        |      dk(  r|gS g }t        dt        |      | j                        D ]#  }|j                  |||| j                  z           % |S )z
        Splits a list of texts into batches of size max `self._batch_size`.

        Args:
            texts (List[str]): List of texts to split.

        Returns:
            List[List[str]]: List of batches of texts.
        rO   r   )rI   rangerK   append)r(   r,   batchesstart_indexs       r)   _batchz*AsyncOpenAITextEmbedEmbeddingClient._batch   sb     u:?7N CJ0@0@A 	PKNN5{T=M=M/MNO	Pr+   batch_of_textsc                     t        |       dk(  rt        | d         dk(  r| d   S g }| D ]  }|j                  |        |S )z
        Merges batches of texts into a single list.

        Args:
            batch_of_texts (List[List[Any]]): List of batches of texts.

        Returns:
            List[Any]: Merged list of texts.
        rO   r   )rI   extend)rc   r,   sublists      r)   _unbatchz,AsyncOpenAITextEmbedEmbeddingClient._unbatch   sR     ~!#N1,=(>!(C!!$$% 	"GLL!	"r+   r   c                 p    t        | j                   dddd| j                   dt        ||            S )a"  
        Builds the kwargs for the POST request, used by sync method.

        Args:
            model (str): The model to use for embedding.
            texts (List[str]): List of texts to embed.

        Returns:
            Dict[str, Any]: Dictionary of POST request parameters.
        z
/embeddingzapplication/jsonzBearer )acceptzcontent-typeAuthorization)inputr   )urlheadersjson)dictr%   r   )r(   r   r,   s      r)   _kwargs_post_requestz8AsyncOpenAITextEmbedEmbeddingClient._kwargs_post_request   sH     99+Z(, 2#*4<<.!9
 
 	
r+   batch_textsc                    t        j                  di | j                  ||      }|j                  dk7  r%t	        d|j                   d|j
                         |j                         d   D cg c]  }|d   	 c}S c c}w )al  
        Sends a synchronous request to the embedding endpoint.

        Args:
            model (str): The model to use for embedding.
            batch_texts (List[str]): Batch of texts to embed.

        Returns:
            List[List[float]]: List of embeddings for the batch.

        Raises:
            Exception: If the response status is not 200.
        r.      6TextEmbed responded with an unexpected status message : data	embeddingrC   )requestspostrp   status_code	Exceptionr6   rn   )r(   r   rq   responsees        r)   _sync_request_embedz7AsyncOpenAITextEmbedEmbeddingClient._sync_request_embed   s      == 
''e;'G
 3&H''(8==/;  )1(?@1+@@@s   0A?c                 j   | j                  |      \  }}| j                  |      }| j                  |gt        |      z  |f}t        |      dk(  rt	        t        |       }n,t        d      5 }t	         |j
                  |       }ddd       | j                        }	 ||	      }
|
S # 1 sw Y   $xY w)a	  
        Embeds a list of texts synchronously.

        Args:
            model (str): The model to use for embedding.
            texts (List[str]): List of texts to embed.

        Returns:
            List[List[float]]: List of embeddings for the texts.
        rO       N)r\   rb   r~   rI   listmapr   rg   )r(   r   r,   
perm_textsunpermute_funcperm_texts_batchedmap_argsembeddings_batch_permpembeddings_permr1   s              r)   r/   z)AsyncOpenAITextEmbedEmbeddingClient.embed
  s     &*]]5%9"
N![[4 $$Gc,--

 !"a'$(h$8!#B' ?1(,UQUUH-=(>%? --(=>#O4
? ?s   -B))B2sessionkwargsc                 f  K    |j                   di |4 d{   }|j                  dk7  r%t        d|j                   d|j                         |j	                          d{   d   }|D cg c]  }|d   	 c}cddd      d{    S 7 w7 -c c}w 7 # 1 d{  7  sw Y   yxY ww)a  
        Sends an asynchronous request to the embedding endpoint.

        Args:
            session (aiohttp.ClientSession): The aiohttp session for the request.
            kwargs (Dict[str, Any]): Dictionary of POST request parameters.

        Returns:
            List[List[float]]: List of embeddings for the request.

        Raises:
            Exception: If the response status is not 200.
        Nrs   rt   ru   rv   rw   rC   )ry   statusr{   r6   rn   )r(   r   r   r|   rw   r}   s         r)   _async_requestz2AsyncOpenAITextEmbedEmbeddingClient._async_request(  s        7<<)&) 	7 	7X#%L'r(--:   (}}.7I,56qAkN6	7 	7 	7 /6	7 	7 	7 	7si   B1BB1AB%B&B1B=B?B1BB1BBB1B."B%#B.*B1c                   K   | j                  |      \  }}| j                  |      }t        j                  t        j                  d            4 d{   }t        j                  |D cg c]'  } | j                  dd|i| j                  ||      ) c}  d{   }ddd      d{    | j                        }	 ||	      }
|
S 7 zc c}w 7 67 (# 1 d{  7  sw Y   8xY ww)a
  
        Embeds a list of texts asynchronously.

        Args:
            model (str): The model to use for embedding.
            texts (List[str]): List of texts to embed.

        Returns:
            List[List[float]]: List of embeddings for the texts.
        r   )limit)	connectorNr   r.   rC   )
r\   rb   aiohttpClientSessionTCPConnectorasynciogatherr   rp   rg   )r(   r   r,   r   r   r   r   rR   r   r   r1   s              r)   r4   z*AsyncOpenAITextEmbedEmbeddingClient.aembedA  s      &*]]5%9"
N![[4((**4
 	 	*1.. 0
 	 (D''  '33%q3I+ %!	 	 --(=>#O4
	%	 	 	 	sf   AC1CC1C.,C
C!C"C&C11C2 C1CC1C."C%#C.*C1)r   NN)r;   r<   r=   r>   r?   r
   r   r   r   rL   staticmethodrI   r   r   r	   r\   rb   r   rg   r   rp   rB   r~   r/   r   r4   rC   r+   r)   r&   r&      s    /$(6:	 sDy! W223	
 
 -0
Cy
"*
	tCy("	#
 
,DI $tCy/ " d3i T#Y  "
# 
d3i 
DcN 
0AA'+CyA	d5k	A43 tCy T$u+5F <7,,78<S#X7	d5k	72# d3i De<M r+   r&   ) r>   r   concurrent.futuresr   typingr   r   r   r   r   r	   r
   r   numpyrU   rx   langchain_core.embeddingsr   langchain_core.utilsr   r   pydanticr   r   r   r   r   typing_extensionsr   __all__r   r&   rC   r+   r)   <module>r      sX   	  1 D D D    0 : M M " 
!g)Z gTY Yr+   