# -----------------------------------------------------------------------------------------
# (C) Copyright IBM Corp. 2024-2025.
# https://opensource.org/licenses/BSD-3-Clause
# -----------------------------------------------------------------------------------------
from __future__ import annotations
from typing import TYPE_CHECKING, TypedDict
from copy import deepcopy
from ibm_watsonx_ai.wml_client_error import InvalidMultipleArguments
from ibm_watsonx_ai.wml_resource import WMLResource
from ibm_watsonx_ai._wrappers import requests
from ibm_watsonx_ai.foundation_models.schema import (
RerankParameters,
BaseSchema,
)
if TYPE_CHECKING:
from ibm_watsonx_ai import APIClient, Credentials
class TextDict(TypedDict):
text: str
[docs]
class Rerank(WMLResource):
"""
Rerank texts based on some queries.
:param model_id: type of model to use
:type model_id: str
:param params: parameters to use during request generation
:type params: dict, RerankParameters, optional
:param credentials: credentials for the Watson Machine Learning instance
:type credentials: Credentials or dict, optional
:param project_id: ID of the Watson Studio project
:type project_id: str, optional
:param space_id: ID of the Watson Studio space
:type space_id: str, optional
:param verify: You can pass one of the following as verify:
* the path to a CA_BUNDLE file
* the path of directory with certificates of trusted CAs
* `True` - default path to truststore will be taken
* `False` - no verification will be made
:type verify: bool or str, optional
:param api_client: initialized APIClient object with a set project ID or space ID. If passed, ``credentials`` and ``project_id``/``space_id`` are not required.
:type api_client: APIClient, optional
**Example:**
.. code-block:: python
from ibm_watsonx_ai import Credentials
from ibm_watsonx_ai.foundation_models import Rerank
generate_params = {
"truncate_input_tokens": 10
}
wx_ranker = Rerank(
model_id="<RERANK MODEL>",
params=generate_params,
credentials=Credentials(
api_key = IAM_API_KEY,
url = "https://us-south.ml.cloud.ibm.com"),
project_id=project_id
)
"""
def __init__(
self,
model_id: str,
params: dict | RerankParameters | None = None,
credentials: Credentials | None = None,
project_id: str | None = None,
space_id: str | None = None,
verify: bool | str | None = None,
api_client: APIClient | None = None,
) -> None:
self.model_id = model_id
Rerank._validate_type(model_id, "model_id", str, True)
self.params = params
Rerank._validate_type(params, "params", [dict, RerankParameters], False, True)
if credentials:
from ibm_watsonx_ai import APIClient
self._client = APIClient(credentials, verify=verify)
elif api_client:
self._client = api_client
else:
raise InvalidMultipleArguments(
params_names_list=["credentials", "api_client"],
reason="None of the arguments were provided.",
)
if space_id:
self._client.set.default_space(space_id)
elif project_id:
self._client.set.default_project(project_id)
elif not api_client:
raise InvalidMultipleArguments(
params_names_list=["space_id", "project_id"],
reason="None of the arguments were provided.",
)
WMLResource.__init__(self, __name__, self._client)
[docs]
def generate(
self,
query: str,
inputs: list[str | TextDict],
params: dict | RerankParameters | None = None,
) -> dict:
"""
Calling this method generates the following auditing event.
:param query: The rank query.
:type query: str
:param inputs: The rank input strings.
:type inputs: list[str], list[dict['text', str]]
:param params:
:type params: dict, RerankParameters, optional
**Example:**
.. code-block:: python
query = "As a Youth, I craved excitement while in adulthood I followed Enthusiastic Pursuit."
inputs = [
"In my younger years, I often reveled in the excitement of spontaneous adventures and embraced the thrill of the unknown, whereas in my grownup life, I have come to appreciate the comforting stability of a well-established routine.",
"As a young man, I frequently sought out exhilarating experiences, craving the adrenaline rush of lifes novelties, while as a responsible adult, I have come to understand the profound value of accumulated wisdom and life experience."
]
response = wx_ranker.generate(query=query, inputs=inputs)
# Print all response
print(response)
"""
self._client._check_if_either_is_set()
self._validate_type(query, "query", str, True)
self._validate_type(inputs, "inputs", list, True)
if all(isinstance(el, str) for el in inputs):
inputs_payload = [{"text": el_input} for el_input in inputs]
else:
inputs_payload = inputs # type: ignore
payload: dict = {
"model_id": self.model_id,
"query": query,
"inputs": inputs_payload,
}
if params is not None:
parameters = params
elif self.params is not None:
parameters = deepcopy(self.params)
else:
parameters = None
if isinstance(parameters, BaseSchema):
parameters = parameters.to_dict()
if parameters:
payload["parameters"] = parameters
if self._client.default_project_id:
payload["project_id"] = self._client.default_project_id
elif self._client.default_space_id:
payload["space_id"] = self._client.default_space_id
response = requests.post(
url=self._client.service_instance._href_definitions.get_rerank_href(),
json=payload,
params=self._client._params(skip_for_create=True, skip_userfs=True),
headers=self._client._get_headers(),
)
return self._handle_response(200, "generate_rerank", response)