Skip to content

Commit 8c324ab

Browse files
committed
llm interface v2 support added to cohere
1 parent db997da commit 8c324ab

File tree

2 files changed

+256
-21
lines changed

2 files changed

+256
-21
lines changed

src/neo4j_graphrag/llm/cohere_llm.py

Lines changed: 145 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -12,14 +12,17 @@
1212
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
1313
# See the License for the specific language governing permissions and
1414
# limitations under the License.
15-
from __future__ import annotations
1615

17-
from typing import TYPE_CHECKING, Any, Iterable, List, Optional, Union, cast
16+
# built-in dependencies
17+
from __future__ import annotations
18+
from typing import TYPE_CHECKING, Any, Iterable, List, Optional, Union, cast, overload
1819

20+
# 3rd party dependencies
1921
from pydantic import ValidationError
2022

23+
# project dependencies
2124
from neo4j_graphrag.exceptions import LLMGenerationError
22-
from neo4j_graphrag.llm.base import LLMInterface
25+
from neo4j_graphrag.llm.base import LLMInterface, LLMInterfaceV2
2326
from neo4j_graphrag.utils.rate_limit import (
2427
RateLimitHandler,
2528
rate_limit_handler,
@@ -39,7 +42,8 @@
3942
from cohere import ChatMessages
4043

4144

42-
class CohereLLM(LLMInterface):
45+
# pylint: disable=redefined-builtin, arguments-differ, raise-missing-from, no-else-return
46+
class CohereLLM(LLMInterface, LLMInterfaceV2):
4347
"""Interface for large language models on the Cohere platform
4448
4549
Args:
@@ -82,28 +86,67 @@ def __init__(
8286
self.client = cohere.ClientV2(**kwargs)
8387
self.async_client = cohere.AsyncClientV2(**kwargs)
8488

85-
def get_messages(
89+
# overloads for LLMInterface and LLMInterfaceV2 methods
90+
@overload
91+
def invoke(
8692
self,
8793
input: str,
8894
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
8995
system_instruction: Optional[str] = None,
90-
) -> ChatMessages:
91-
messages = []
92-
if system_instruction:
93-
messages.append(SystemMessage(content=system_instruction).model_dump())
94-
if message_history:
95-
if isinstance(message_history, MessageHistory):
96-
message_history = message_history.messages
97-
try:
98-
MessageList(messages=cast(list[BaseMessage], message_history))
99-
except ValidationError as e:
100-
raise LLMGenerationError(e.errors()) from e
101-
messages.extend(cast(Iterable[dict[str, Any]], message_history))
102-
messages.append(UserMessage(content=input).model_dump())
103-
return messages # type: ignore
96+
) -> LLMResponse: ...
10497

105-
@rate_limit_handler
98+
@overload
99+
def invoke(
100+
self,
101+
input: List[LLMMessage],
102+
) -> LLMResponse: ...
103+
104+
@overload
105+
async def ainvoke(
106+
self,
107+
input: str,
108+
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
109+
system_instruction: Optional[str] = None,
110+
) -> LLMResponse: ...
111+
112+
@overload
113+
async def ainvoke(
114+
self,
115+
input: List[LLMMessage],
116+
) -> LLMResponse: ...
117+
118+
# switching logic between LLMInterface and LLMInterfaceV2
106119
def invoke(
120+
self,
121+
input: Union[str, List[LLMMessage]],
122+
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
123+
system_instruction: Optional[str] = None,
124+
) -> LLMResponse:
125+
if isinstance(input, str):
126+
return self.__legacy_invoke(input, message_history, system_instruction)
127+
elif isinstance(input, list):
128+
return self.__brand_new_invoke(input)
129+
else:
130+
raise ValueError(f"Invalid input type for invoke method - {type(input)}")
131+
132+
async def ainvoke(
133+
self,
134+
input: Union[str, List[LLMMessage]],
135+
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
136+
system_instruction: Optional[str] = None,
137+
) -> LLMResponse:
138+
if isinstance(input, str):
139+
return await self.__legacy_ainvoke(
140+
input, message_history, system_instruction
141+
)
142+
elif isinstance(input, list):
143+
return await self.__brand_new_ainvoke(input)
144+
else:
145+
raise ValueError(f"Invalid input type for ainvoke method - {type(input)}")
146+
147+
# implementations
148+
@rate_limit_handler
149+
def __legacy_invoke(
107150
self,
108151
input: str,
109152
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
@@ -134,8 +177,32 @@ def invoke(
134177
content=res.message.content[0].text if res.message.content else "",
135178
)
136179

180+
def __brand_new_invoke(
181+
self,
182+
input: List[LLMMessage],
183+
) -> LLMResponse:
184+
"""Sends text to the LLM and returns a response.
185+
186+
Args:
187+
input (str): The text to send to the LLM.
188+
189+
Returns:
190+
LLMResponse: The response from the LLM.
191+
"""
192+
try:
193+
messages = self.get_brand_new_messages(input)
194+
res = self.client.chat(
195+
messages=messages,
196+
model=self.model_name,
197+
)
198+
except self.cohere_api_error as e:
199+
raise LLMGenerationError("Error calling cohere") from e
200+
return LLMResponse(
201+
content=res.message.content[0].text if res.message.content else "",
202+
)
203+
137204
@async_rate_limit_handler
138-
async def ainvoke(
205+
async def __legacy_ainvoke(
139206
self,
140207
input: str,
141208
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
@@ -165,3 +232,60 @@ async def ainvoke(
165232
return LLMResponse(
166233
content=res.message.content[0].text if res.message.content else "",
167234
)
235+
236+
async def __brand_new_ainvoke(
237+
self,
238+
input: List[LLMMessage],
239+
) -> LLMResponse:
240+
try:
241+
messages = self.get_brand_new_messages(input)
242+
res = await self.async_client.chat(
243+
messages=messages,
244+
model=self.model_name,
245+
)
246+
except self.cohere_api_error as e:
247+
raise LLMGenerationError("Error calling cohere") from e
248+
return LLMResponse(
249+
content=res.message.content[0].text if res.message.content else "",
250+
)
251+
252+
# subsidiary methods
253+
def get_messages(
254+
self,
255+
input: str,
256+
message_history: Optional[Union[List[LLMMessage], MessageHistory]] = None,
257+
system_instruction: Optional[str] = None,
258+
) -> ChatMessages:
259+
"""Converts input and message history to ChatMessages for Cohere."""
260+
messages = []
261+
if system_instruction:
262+
messages.append(SystemMessage(content=system_instruction).model_dump())
263+
if message_history:
264+
if isinstance(message_history, MessageHistory):
265+
message_history = message_history.messages
266+
try:
267+
MessageList(messages=cast(list[BaseMessage], message_history))
268+
except ValidationError as e:
269+
raise LLMGenerationError(e.errors()) from e
270+
messages.extend(cast(Iterable[dict[str, Any]], message_history))
271+
messages.append(UserMessage(content=input).model_dump())
272+
return messages # type: ignore
273+
274+
def get_brand_new_messages(
275+
self,
276+
input: list[LLMMessage],
277+
) -> ChatMessages:
278+
"""Converts a list of LLMMessage to ChatMessages for Cohere."""
279+
messages: ChatMessages = []
280+
for i in input:
281+
if i["role"] == "system":
282+
messages.append(self.cohere.SystemChatMessageV2(content=i["content"]))
283+
elif i["role"] == "user":
284+
messages.append(self.cohere.UserChatMessageV2(content=i["content"]))
285+
elif i["role"] == "assistant":
286+
messages.append(
287+
self.cohere.AssistantChatMessageV2(content=i["content"])
288+
)
289+
else:
290+
raise ValueError(f"Unknown role: {i['role']}")
291+
return messages

tests/unit/llm/test_cohere_llm.py

Lines changed: 111 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -152,3 +152,114 @@ async def test_cohere_llm_failed_async(mock_cohere: Mock) -> None:
152152
with pytest.raises(LLMGenerationError) as excinfo:
153153
await llm.ainvoke("my text")
154154
assert "ApiError" in str(excinfo)
155+
156+
157+
# V2 Interface Tests
158+
159+
160+
def test_cohere_llm_invoke_v2_happy_path(mock_cohere: Mock) -> None:
161+
"""Test V2 interface invoke method with List[LLMMessage] input."""
162+
chat_response_mock = MagicMock()
163+
chat_response_mock.message.content = [MagicMock(text="cohere v2 response text")]
164+
mock_cohere.ClientV2.return_value.chat.return_value = chat_response_mock
165+
166+
# Mock Cohere message types
167+
mock_cohere.SystemChatMessageV2 = MagicMock()
168+
mock_cohere.UserChatMessageV2 = MagicMock()
169+
mock_cohere.AssistantChatMessageV2 = MagicMock()
170+
171+
messages = [
172+
{"role": "system", "content": "You are a helpful assistant."},
173+
{"role": "user", "content": "What is the capital of France?"},
174+
]
175+
176+
llm = CohereLLM(model_name="something")
177+
response = llm.invoke(messages)
178+
179+
assert isinstance(response, LLMResponse)
180+
assert response.content == "cohere v2 response text"
181+
182+
# Verify the client was called correctly
183+
mock_cohere.ClientV2.return_value.chat.assert_called_once()
184+
call_args = mock_cohere.ClientV2.return_value.chat.call_args[1]
185+
assert call_args["model"] == "something"
186+
187+
188+
@pytest.mark.asyncio
189+
async def test_cohere_llm_ainvoke_v2_happy_path(mock_cohere: Mock) -> None:
190+
"""Test V2 interface async invoke method with List[LLMMessage] input."""
191+
chat_response_mock = MagicMock()
192+
chat_response_mock.message.content = [
193+
MagicMock(text="cohere v2 async response text")
194+
]
195+
mock_cohere.AsyncClientV2.return_value.chat = AsyncMock(
196+
return_value=chat_response_mock
197+
)
198+
199+
# Mock Cohere message types
200+
mock_cohere.SystemChatMessageV2 = MagicMock()
201+
mock_cohere.UserChatMessageV2 = MagicMock()
202+
mock_cohere.AssistantChatMessageV2 = MagicMock()
203+
204+
messages = [
205+
{"role": "system", "content": "You are a helpful assistant."},
206+
{"role": "user", "content": "What is the capital of France?"},
207+
]
208+
209+
llm = CohereLLM(model_name="something")
210+
response = await llm.ainvoke(messages)
211+
212+
assert isinstance(response, LLMResponse)
213+
assert response.content == "cohere v2 async response text"
214+
215+
# Verify the async client was called correctly
216+
mock_cohere.AsyncClientV2.return_value.chat.assert_awaited_once()
217+
218+
219+
def test_cohere_llm_invoke_v2_validation_error(mock_cohere: Mock) -> None:
220+
"""Test V2 interface invoke with invalid message role raises error."""
221+
chat_response_mock = MagicMock()
222+
chat_response_mock.message.content = [MagicMock(text="should not get here")]
223+
mock_cohere.ClientV2.return_value.chat.return_value = chat_response_mock
224+
225+
messages = [
226+
{"role": "invalid_role", "content": "This should fail."},
227+
]
228+
229+
llm = CohereLLM(model_name="something")
230+
231+
with pytest.raises(ValueError) as exc_info:
232+
llm.invoke(messages)
233+
assert "Unknown role: invalid_role" in str(exc_info.value)
234+
235+
236+
def test_cohere_llm_get_brand_new_messages_all_roles(mock_cohere: Mock) -> None:
237+
"""Test get_brand_new_messages method handles all message roles correctly."""
238+
# Mock Cohere message types
239+
mock_system_msg = MagicMock()
240+
mock_user_msg = MagicMock()
241+
mock_assistant_msg = MagicMock()
242+
243+
mock_cohere.SystemChatMessageV2.return_value = mock_system_msg
244+
mock_cohere.UserChatMessageV2.return_value = mock_user_msg
245+
mock_cohere.AssistantChatMessageV2.return_value = mock_assistant_msg
246+
247+
messages = [
248+
{"role": "system", "content": "You are a helpful assistant."},
249+
{"role": "user", "content": "Hello"},
250+
{"role": "assistant", "content": "Hi there!"},
251+
{"role": "user", "content": "How are you?"},
252+
]
253+
254+
llm = CohereLLM(model_name="something")
255+
result_messages = llm.get_brand_new_messages(messages)
256+
257+
# Verify the correct number of messages are returned
258+
assert len(result_messages) == 4
259+
260+
# Verify the correct Cohere message constructors were called
261+
mock_cohere.SystemChatMessageV2.assert_called_once_with(
262+
content="You are a helpful assistant."
263+
)
264+
assert mock_cohere.UserChatMessageV2.call_count == 2
265+
mock_cohere.AssistantChatMessageV2.assert_called_once_with(content="Hi there!")

0 commit comments

Comments
 (0)