cohere-ai · billytrend-cohere · Sep 30, 2024 · Sep 30, 2024 · Sep 30, 2024 · Sep 30, 2024
diff --git a/mypy.ini b/mypy.ini
@@ -0,0 +1,2 @@
+[mypy]
+exclude = src/cohere/manually_maintained/cohere_aws
diff --git a/poetry.lock b/poetry.lock
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "cohere"
-version = "5.10.0"
+version = "5.11.0"
 description = ""
 readme = "README.md"
 authors = []
@@ -43,6 +43,7 @@ requests = "^2.0.0"
 tokenizers = ">=0.15,<1"
 types-requests = "^2.0.0"
 typing_extensions = ">= 4.0.0"
+sagemaker = "^2.232.1"
 
 [tool.poetry.dev-dependencies]
 mypy = "1.0.1"

diff --git a/src/cohere/core/client_wrapper.py b/src/cohere/core/client_wrapper.py
@@ -24,7 +24,7 @@ def get_headers(self) -> typing.Dict[str, str]:
  headers: typing.Dict[str, str] = {
  "X-Fern-Language": "Python",
  "X-Fern-SDK-Name": "cohere",
- "X-Fern-SDK-Version": "5.10.0",
+ "X-Fern-SDK-Version": "5.11.0",
  }
  if self._client_name is not None:
  headers["X-Client-Name"] = self._client_name

diff --git a/src/cohere/manually_maintained/cohere_aws/__init__.py b/src/cohere/manually_maintained/cohere_aws/__init__.py
@@ -0,0 +1,3 @@
+from .client import Client
+from .error import CohereError
+from .mode import Mode
diff --git a/src/cohere/manually_maintained/cohere_aws/chat.py b/src/cohere/manually_maintained/cohere_aws/chat.py
@@ -0,0 +1,325 @@
+from .response import CohereObject
+from .error import CohereError
+from .mode import Mode
+from typing import List, Optional, Generator, Dict, Any, Union
+from enum import Enum
+import json
+
+# Tools
+
+class ToolParameterDefinitionsValue(CohereObject, dict):
+ def __init__(
+ self,
+ type: str,
+ description: str,
+ required: Optional[bool] = None,
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.__dict__ = self
+ self.type = type
+ self.description = description
+ if required is not None:
+ self.required = required
+
+
+class Tool(CohereObject, dict):
+ def __init__(
+ self,
+ name: str,
+ description: str,
+ parameter_definitions: Optional[Dict[str, ToolParameterDefinitionsValue]] = None,
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.__dict__ = self
+ self.name = name
+ self.description = description
+ if parameter_definitions is not None:
+ self.parameter_definitions = parameter_definitions
+
+
+class ToolCall(CohereObject, dict):
+ def __init__(
+ self,
+ name: str,
+ parameters: Dict[str, Any],
+ generation_id: str,
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.__dict__ = self
+ self.name = name
+ self.parameters = parameters
+ self.generation_id = generation_id
+
+ @classmethod
+ def from_dict(cls, tool_call_res: Dict[str, Any]) -> "ToolCall":
+ return cls(
+ name=tool_call_res.get("name"),
+ parameters=tool_call_res.get("parameters"),
+ generation_id=tool_call_res.get("generation_id"),
+ )
+
+ @classmethod
+ def from_list(cls, tool_calls_res: Optional[List[Dict[str, Any]]]) -> Optional[List["ToolCall"]]:
+ if tool_calls_res is None or not isinstance(tool_calls_res, list):
+ return None
+
+ return [ToolCall.from_dict(tc) for tc in tool_calls_res]
+
+# Chat
+
+class Chat(CohereObject):
+ def __init__(
+ self,
+ response_id: str,
+ generation_id: str,
+ text: str,
+ chat_history: Optional[List[Dict[str, Any]]] = None,
+ preamble: Optional[str] = None,
+ finish_reason: Optional[str] = None,
+ token_count: Optional[Dict[str, int]] = None,
+ tool_calls: Optional[List[ToolCall]] = None,
+ citations: Optional[List[Dict[str, Any]]] = None,
+ documents: Optional[List[Dict[str, Any]]] = None,
+ search_results: Optional[List[Dict[str, Any]]] = None,
+ search_queries: Optional[List[Dict[str, Any]]] = None,
+ is_search_required: Optional[bool] = None,
+ ) -> None:
+ self.response_id = response_id
+ self.generation_id = generation_id
+ self.text = text
+ self.chat_history = chat_history
+ self.preamble = preamble
+ self.finish_reason = finish_reason
+ self.token_count = token_count
+ self.tool_calls = tool_calls
+ self.citations = citations
+ self.documents = documents
+ self.search_results = search_results
+ self.search_queries = search_queries
+ self.is_search_required = is_search_required
+
+ @classmethod
+ def from_dict(cls, response: Dict[str, Any]) -> "Chat":
+ return cls(
+ response_id=response["response_id"],
+ generation_id=response.get("generation_id"), # optional
+ text=response.get("text"),
+ chat_history=response.get("chat_history"), # optional
+ preamble=response.get("preamble"), # optional
+ token_count=response.get("token_count"),
+ is_search_required=response.get("is_search_required"), # optional
+ citations=response.get("citations"), # optional
+ documents=response.get("documents"), # optional
+ search_results=response.get("search_results"), # optional
+ search_queries=response.get("search_queries"), # optional
+ finish_reason=response.get("finish_reason"),
+ tool_calls=ToolCall.from_list(response.get("tool_calls")), # optional
+ )
+
+# ---------------|
+# Steaming event |
+# ---------------|
+
+class StreamEvent(str, Enum):
+ STREAM_START = "stream-start"
+ SEARCH_QUERIES_GENERATION = "search-queries-generation"
+ SEARCH_RESULTS = "search-results"
+ TEXT_GENERATION = "text-generation"
+ TOOL_CALLS_GENERATION = "tool-calls-generation"
+ CITATION_GENERATION = "citation-generation"
+ STREAM_END = "stream-end"
+
+class StreamResponse(CohereObject):
+ def __init__(
+ self,
+ is_finished: bool,
+ event_type: Union[StreamEvent, str],
+ index: Optional[int],
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.is_finished = is_finished
+ self.index = index
+ self.event_type = event_type
+
+
+class StreamStart(StreamResponse):
+ def __init__(
+ self,
+ generation_id: str,
+ conversation_id: Optional[str],
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.generation_id = generation_id
+ self.conversation_id = conversation_id
+
+
+class StreamTextGeneration(StreamResponse):
+ def __init__(
+ self,
+ text: str,
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.text = text
+
+
+class StreamCitationGeneration(StreamResponse):
+ def __init__(
+ self,
+ citations: Optional[List[Dict[str, Any]]],
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.citations = citations
+
+
+class StreamQueryGeneration(StreamResponse):
+ def __init__(
+ self,
+ search_queries: Optional[List[Dict[str, Any]]],
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.search_queries = search_queries
+
+
+class StreamSearchResults(StreamResponse):
+ def __init__(
+ self,
+ search_results: Optional[List[Dict[str, Any]]],
+ documents: Optional[List[Dict[str, Any]]],
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.search_results = search_results
+ self.documents = documents
+
+
+class StreamEnd(StreamResponse):
+ def __init__(
+ self,
+ finish_reason: str,
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.finish_reason = finish_reason
+
+
+class ChatToolCallsGenerationEvent(StreamResponse):
+ def __init__(
+ self,
+ tool_calls: Optional[List[ToolCall]],
+ **kwargs,
+ ) -> None:
+ super().__init__(**kwargs)
+ self.tool_calls = tool_calls
+
+class StreamingChat(CohereObject):
+ def __init__(self, stream_response, mode):
+ self.stream_response = stream_response
+ self.text = None
+ self.response_id = None
+ self.generation_id = None
+ self.preamble = None
+ self.prompt = None
+ self.chat_history = None
+ self.finish_reason = None
+ self.token_count = None
+ self.is_search_required = None
+ self.citations = None
+ self.documents = None
+ self.search_results = None
+ self.search_queries = None
+ self.tool_calls = None
+
+ self.bytes = bytearray()
+ if mode == Mode.SAGEMAKER:
+ self.payload_key = "PayloadPart"
+ self.bytes_key = "Bytes"
+ elif mode == Mode.BEDROCK:
+ self.payload_key = "chunk"
+ self.bytes_key = "bytes"
+
+ def _make_response_item(self, index, streaming_item) -> Any:
+ event_type = streaming_item.get("event_type")
+
+ if event_type == StreamEvent.STREAM_START:
+ self.conversation_id = streaming_item.get("conversation_id")
+ self.generation_id = streaming_item.get("generation_id")
+ return StreamStart(
+ conversation_id=self.conversation_id,
+ generation_id=self.generation_id,
+ is_finished=False,
+ event_type=event_type,
+ index=index,
+ )
+ elif event_type == StreamEvent.SEARCH_QUERIES_GENERATION:
+ search_queries = streaming_item.get("search_queries")
+ return StreamQueryGeneration(
+ search_queries=search_queries, is_finished=False, event_type=event_type, index=index
+ )
+ elif event_type == StreamEvent.SEARCH_RESULTS:
+ search_results = streaming_item.get("search_results")
+ documents = streaming_item.get("documents")
+ return StreamSearchResults(
+ search_results=search_results,
+ documents=documents,
+ is_finished=False,
+ event_type=event_type,
+ index=index,
+ )
+ elif event_type == StreamEvent.TEXT_GENERATION:
+ text = streaming_item.get("text")
+ return StreamTextGeneration(text=text, is_finished=False, event_type=event_type, index=index)
+ elif event_type == StreamEvent.CITATION_GENERATION:
+ citations = streaming_item.get("citations")
+ return StreamCitationGeneration(citations=citations, is_finished=False, event_type=event_type, index=index)
+ elif event_type == StreamEvent.TOOL_CALLS_GENERATION:
+ tool_calls = ToolCall.from_list(streaming_item.get("tool_calls"))
+ return ChatToolCallsGenerationEvent(
+ tool_calls=tool_calls, is_finished=False, event_type=event_type, index=index
+ )
+ elif event_type == StreamEvent.STREAM_END:
+ response = streaming_item.get("response")
+ finish_reason = streaming_item.get("finish_reason")
+ self.finish_reason = finish_reason
+
+ if response is None:
+ return None
+
+ self.response_id = response.get("response_id")
+ self.conversation_id = response.get("conversation_id")
+ self.text = response.get("text")
+ self.generation_id = response.get("generation_id")
+ self.preamble = response.get("preamble")
+ self.prompt = response.get("prompt")
+ self.chat_history = response.get("chat_history")
+ self.token_count = response.get("token_count")
+ self.is_search_required = response.get("is_search_required") # optional
+ self.citations = response.get("citations") # optional
+ self.documents = response.get("documents") # optional
+ self.search_results = response.get("search_results") # optional
+ self.search_queries = response.get("search_queries") # optional
+ self.tool_calls = ToolCall.from_list(response.get("tool_calls")) # optional
+ return StreamEnd(finish_reason=finish_reason, is_finished=True, event_type=event_type, index=index)
+ return None
+
+ def __iter__(self) -> Generator[StreamResponse, None, None]:
+ index = 0
+ for payload in self.stream_response:
+ self.bytes.extend(payload[self.payload_key][self.bytes_key])
+ try:
+ item = self._make_response_item(index, json.loads(self.bytes))
+ except json.decoder.JSONDecodeError:
+ # payload contained only a partion JSON object
+ continue
+
+ self.bytes = bytearray()
+ if item is not None:
+ index += 1
+ yield item