Spaces:

GameScribes
/

Multipurpose-AI-Agent-Development

Paused

App Files Files Community

devve1 committed on Jul 5

Commit

eb93a92

•

1 Parent(s): a1ddbe5

Update optimum_encoder.py

Browse files

Files changed (1) hide show

optimum_encoder.py +1 -136

optimum_encoder.py CHANGED Viewed

@@ -154,139 +154,4 @@ class OptimumEncoder(BaseEncoder):
             attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
         )
         token_embeddings[input_mask_expanded == 0] = -1e9
-        return self._torch.max(token_embeddings, 1)[0]
-class HFEndpointEncoder(BaseEncoder):
-    """
-    A class to encode documents using a Hugging Face transformer model endpoint.
-    Attributes:
-        huggingface_url (str): The URL of the Hugging Face API endpoint.
-        huggingface_api_key (str): The API key for authenticating with the Hugging Face API.
-        score_threshold (float): A threshold value used for filtering or processing the embeddings.
-    """
-    name: str = "hugging_face_custom_endpoint"
-    huggingface_url: Optional[str] = None
-    huggingface_api_key: Optional[str] = None
-    score_threshold: float = 0.8
-    def __init__(
-        self,
-        name: Optional[str] = "hugging_face_custom_endpoint",
-        huggingface_url: Optional[str] = None,
-        huggingface_api_key: Optional[str] = None,
-        score_threshold: float = 0.8,
-    ):
-        """
-        Initializes the HFEndpointEncoder with the specified parameters.
-        Args:
-            name (str, optional): The name of the encoder. Defaults to
-                "hugging_face_custom_endpoint".
-            huggingface_url (str, optional): The URL of the Hugging Face API endpoint.
-                Cannot be None.
-            huggingface_api_key (str, optional): The API key for the Hugging Face API.
-                Cannot be None.
-            score_threshold (float, optional): A threshold for processing the embeddings.
-                Defaults to 0.8.
-        Raises:
-            ValueError: If either `huggingface_url` or `huggingface_api_key` is None.
-        """
-        huggingface_url = huggingface_url or os.getenv("HF_API_URL")
-        huggingface_api_key = huggingface_api_key or os.getenv("HF_API_KEY")
-        super().__init__(name=name, score_threshold=score_threshold)  # type: ignore
-        if huggingface_url is None:
-            raise ValueError("HuggingFace endpoint url cannot be 'None'.")
-        if huggingface_api_key is None:
-            raise ValueError("HuggingFace API key cannot be 'None'.")
-        self.huggingface_url = huggingface_url or os.getenv("HF_API_URL")
-        self.huggingface_api_key = huggingface_api_key or os.getenv("HF_API_KEY")
-        try:
-            self.query({"inputs": "Hello World!", "parameters": {}})
-        except Exception as e:
-            raise ValueError(
-                f"HuggingFace endpoint client failed to initialize. Error: {e}"
-            ) from e
-    def __call__(self, docs: List[str]) -> List[List[float]]:
-        """
-        Encodes a list of documents into embeddings using the Hugging Face API.
-        Args:
-            docs (List[str]): A list of documents to encode.
-        Returns:
-            List[List[float]]: A list of embeddings for the given documents.
-        Raises:
-            ValueError: If no embeddings are returned for a document.
-        """
-        embeddings = []
-        for d in docs:
-            try:
-                output = self.query({"inputs": d, "parameters": {}})
-                if not output or len(output) == 0:
-                    raise ValueError("No embeddings returned from the query.")
-                embeddings.append(output)
-            except Exception as e:
-                raise ValueError(
-                    f"No embeddings returned for document. Error: {e}"
-                ) from e
-        return embeddings
-    def query(self, payload, max_retries=3, retry_interval=5):
-        """
-        Sends a query to the Hugging Face API and returns the response.
-        Args:
-            payload (dict): The payload to send in the request.
-        Returns:
-            dict: The response from the Hugging Face API.
-        Raises:
-            ValueError: If the query fails or the response status is not 200.
-        """
-        headers = {
-            "Accept": "application/json",
-            "Authorization": f"Bearer {self.huggingface_api_key}",
-            "Content-Type": "application/json",
-        }
-        for attempt in range(1, max_retries + 1):
-            try:
-                response = requests.post(
-                    self.huggingface_url,
-                    headers=headers,
-                    json=payload,
-                    # timeout=timeout_seconds,
-                )
-                if response.status_code == 503:
-                    estimated_time = response.json().get("estimated_time", "")
-                    if estimated_time:
-                        logger.info(
-                            f"Model Initializing wait for - {estimated_time:.2f}s "
-                        )
-                        time.sleep(estimated_time)
-                        continue
-                else:
-                    response.raise_for_status()
-            except requests.exceptions.RequestException:
-                if attempt < max_retries - 1:
-                    logger.info(f"Retrying attempt: {attempt} for payload: {payload} ")
-                    time.sleep(retry_interval)
-                    retry_interval += attempt
-                else:
-                    raise ValueError(
-                        f"Query failed with status {response.status_code}: {response.text}"
-                    )
-        return response.json()

             attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
         )
         token_embeddings[input_mask_expanded == 0] = -1e9
+        return self._torch.max(token_embeddings, 1)[0]