together.py 3.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788
  1. import base64
  2. from abc import ABC
  3. from typing import Any
  4. from huggingface_hub.hf_api import InferenceProviderMapping
  5. from huggingface_hub.inference._common import RequestParameters, _as_dict
  6. from huggingface_hub.inference._providers._common import (
  7. BaseConversationalTask,
  8. BaseTextGenerationTask,
  9. TaskProviderHelper,
  10. filter_none,
  11. )
  12. _PROVIDER = "together"
  13. _BASE_URL = "https://api.together.xyz"
  14. class TogetherTask(TaskProviderHelper, ABC):
  15. """Base class for Together API tasks."""
  16. def __init__(self, task: str):
  17. super().__init__(provider=_PROVIDER, base_url=_BASE_URL, task=task)
  18. def _prepare_route(self, mapped_model: str, api_key: str) -> str:
  19. if self.task == "text-to-image":
  20. return "/v1/images/generations"
  21. elif self.task == "conversational":
  22. return "/v1/chat/completions"
  23. elif self.task == "text-generation":
  24. return "/v1/completions"
  25. raise ValueError(f"Unsupported task '{self.task}' for Together API.")
  26. class TogetherTextGenerationTask(BaseTextGenerationTask):
  27. def __init__(self):
  28. super().__init__(provider=_PROVIDER, base_url=_BASE_URL)
  29. def get_response(self, response: bytes | dict, request_params: RequestParameters | None = None) -> Any:
  30. output = _as_dict(response)["choices"][0]
  31. return {
  32. "generated_text": output["text"],
  33. "details": {
  34. "finish_reason": output.get("finish_reason"),
  35. "seed": output.get("seed"),
  36. },
  37. }
  38. class TogetherConversationalTask(BaseConversationalTask):
  39. def __init__(self):
  40. super().__init__(provider=_PROVIDER, base_url=_BASE_URL)
  41. def _prepare_payload_as_dict(
  42. self, inputs: Any, parameters: dict, provider_mapping_info: InferenceProviderMapping
  43. ) -> dict | None:
  44. payload = super()._prepare_payload_as_dict(inputs, parameters, provider_mapping_info)
  45. response_format = parameters.get("response_format")
  46. if isinstance(response_format, dict) and response_format.get("type") == "json_schema":
  47. json_schema_details = response_format.get("json_schema")
  48. if isinstance(json_schema_details, dict) and "schema" in json_schema_details:
  49. payload["response_format"] = { # type: ignore
  50. "type": "json_object",
  51. "schema": json_schema_details["schema"],
  52. }
  53. return payload
  54. class TogetherTextToImageTask(TogetherTask):
  55. def __init__(self):
  56. super().__init__("text-to-image")
  57. def _prepare_payload_as_dict(
  58. self, inputs: Any, parameters: dict, provider_mapping_info: InferenceProviderMapping
  59. ) -> dict | None:
  60. mapped_model = provider_mapping_info.provider_id
  61. parameters = filter_none(parameters)
  62. if "num_inference_steps" in parameters:
  63. parameters["steps"] = parameters.pop("num_inference_steps")
  64. if "guidance_scale" in parameters:
  65. parameters["guidance"] = parameters.pop("guidance_scale")
  66. return {"prompt": inputs, "response_format": "base64", **parameters, "model": mapped_model}
  67. def get_response(self, response: bytes | dict, request_params: RequestParameters | None = None) -> Any:
  68. response_dict = _as_dict(response)
  69. return base64.b64decode(response_dict["data"][0]["b64_json"])