nebius.py 3.4 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283
  1. import base64
  2. from typing import Any
  3. from huggingface_hub.hf_api import InferenceProviderMapping
  4. from huggingface_hub.inference._common import RequestParameters, _as_dict
  5. from huggingface_hub.inference._providers._common import (
  6. BaseConversationalTask,
  7. BaseTextGenerationTask,
  8. TaskProviderHelper,
  9. filter_none,
  10. )
  11. class NebiusTextGenerationTask(BaseTextGenerationTask):
  12. def __init__(self):
  13. super().__init__(provider="nebius", base_url="https://api.studio.nebius.ai")
  14. def get_response(self, response: bytes | dict, request_params: RequestParameters | None = None) -> Any:
  15. output = _as_dict(response)["choices"][0]
  16. return {
  17. "generated_text": output["text"],
  18. "details": {
  19. "finish_reason": output.get("finish_reason"),
  20. "seed": output.get("seed"),
  21. },
  22. }
  23. class NebiusConversationalTask(BaseConversationalTask):
  24. def __init__(self):
  25. super().__init__(provider="nebius", base_url="https://api.studio.nebius.ai")
  26. def _prepare_payload_as_dict(
  27. self, inputs: Any, parameters: dict, provider_mapping_info: InferenceProviderMapping
  28. ) -> dict | None:
  29. payload = super()._prepare_payload_as_dict(inputs, parameters, provider_mapping_info)
  30. response_format = parameters.get("response_format")
  31. if isinstance(response_format, dict) and response_format.get("type") == "json_schema":
  32. json_schema_details = response_format.get("json_schema")
  33. if isinstance(json_schema_details, dict) and "schema" in json_schema_details:
  34. payload["guided_json"] = json_schema_details["schema"] # type: ignore
  35. return payload
  36. class NebiusTextToImageTask(TaskProviderHelper):
  37. def __init__(self):
  38. super().__init__(task="text-to-image", provider="nebius", base_url="https://api.studio.nebius.ai")
  39. def _prepare_route(self, mapped_model: str, api_key: str) -> str:
  40. return "/v1/images/generations"
  41. def _prepare_payload_as_dict(
  42. self, inputs: Any, parameters: dict, provider_mapping_info: InferenceProviderMapping
  43. ) -> dict | None:
  44. mapped_model = provider_mapping_info.provider_id
  45. parameters = filter_none(parameters)
  46. if "guidance_scale" in parameters:
  47. parameters.pop("guidance_scale")
  48. if parameters.get("response_format") not in ("b64_json", "url"):
  49. parameters["response_format"] = "b64_json"
  50. return {"prompt": inputs, **parameters, "model": mapped_model}
  51. def get_response(self, response: bytes | dict, request_params: RequestParameters | None = None) -> Any:
  52. response_dict = _as_dict(response)
  53. return base64.b64decode(response_dict["data"][0]["b64_json"])
  54. class NebiusFeatureExtractionTask(TaskProviderHelper):
  55. def __init__(self):
  56. super().__init__(task="feature-extraction", provider="nebius", base_url="https://api.studio.nebius.ai")
  57. def _prepare_route(self, mapped_model: str, api_key: str) -> str:
  58. return "/v1/embeddings"
  59. def _prepare_payload_as_dict(
  60. self, inputs: Any, parameters: dict, provider_mapping_info: InferenceProviderMapping
  61. ) -> dict | None:
  62. return {"input": inputs, "model": provider_mapping_info.provider_id}
  63. def get_response(self, response: bytes | dict, request_params: RequestParameters | None = None) -> Any:
  64. embeddings = _as_dict(response)["data"]
  65. return [embedding["embedding"] for embedding in embeddings]