-
Notifications
You must be signed in to change notification settings - Fork 46
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
* Added Vertex AI LLM class * Updated docstrings * Updated unit test workflow * Removed duplicate poetry install for pr workflow * Removed --no-root from poetry install in pr.yaml * Fixed typo * Updated docs * Updated CHANGELOG for previous PR * Updated CHANGELOG * Fixed typo
- Loading branch information
1 parent
bf65ddd
commit d1cef28
Showing
9 changed files
with
182 additions
and
14 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,98 @@ | ||
# Neo4j Sweden AB [https://neo4j.com] | ||
# # | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# # | ||
# https://www.apache.org/licenses/LICENSE-2.0 | ||
# # | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
from __future__ import annotations | ||
|
||
from typing import Any, Optional | ||
|
||
from neo4j_graphrag.exceptions import LLMGenerationError | ||
from neo4j_graphrag.llm.base import LLMInterface | ||
from neo4j_graphrag.llm.types import LLMResponse | ||
|
||
try: | ||
from vertexai.generative_models import GenerativeModel, ResponseValidationError | ||
except ImportError: | ||
GenerativeModel = None | ||
ResponseValidationError = None | ||
|
||
|
||
class VertexAILLM(LLMInterface): | ||
"""Interface for large language models on Vertex AI | ||
Args: | ||
model_name (str, optional): Name of the LLM to use. Defaults to "gemini-1.5-flash-001". | ||
model_params (Optional[dict], optional): Additional parameters passed to the model when text is sent to it. Defaults to None. | ||
**kwargs (Any): Arguments passed to the model when for the class is initialised. Defaults to None. | ||
Raises: | ||
LLMGenerationError: If there's an error generating the response from the model. | ||
Example: | ||
.. code-block:: python | ||
from neo4j_graphrag.llm import VertexAILLM | ||
from vertexai.generative_models import GenerationConfig | ||
generation_config = GenerationConfig(temperature=0.0) | ||
llm = VertexAILLM( | ||
model_name="gemini-1.5-flash-001", generation_config=generation_config | ||
) | ||
llm.invoke("Who is the mother of Paul Atreides?") | ||
""" | ||
|
||
def __init__( | ||
self, | ||
model_name: str = "gemini-1.5-flash-001", | ||
model_params: Optional[dict[str, Any]] = None, | ||
**kwargs: Any, | ||
): | ||
if GenerativeModel is None or ResponseValidationError is None: | ||
raise ImportError( | ||
"Could not import Vertex AI Python client. " | ||
"Please install it with `pip install google-cloud-aiplatform`." | ||
) | ||
super().__init__(model_name, model_params) | ||
self.model = GenerativeModel(model_name=model_name, **kwargs) | ||
|
||
def invoke(self, input: str) -> LLMResponse: | ||
"""Sends text to the LLM and returns a response. | ||
Args: | ||
input (str): The text to send to the LLM. | ||
Returns: | ||
LLMResponse: The response from the LLM. | ||
""" | ||
try: | ||
response = self.model.generate_content(input, **self.model_params) | ||
return LLMResponse(content=response.text) | ||
except ResponseValidationError as e: | ||
raise LLMGenerationError(e) | ||
|
||
async def ainvoke(self, input: str) -> LLMResponse: | ||
"""Asynchronously sends text to the LLM and returns a response. | ||
Args: | ||
input (str): The text to send to the LLM. | ||
Returns: | ||
LLMResponse: The response from the LLM. | ||
""" | ||
try: | ||
response = await self.model.generate_content_async( | ||
input, **self.model_params | ||
) | ||
return LLMResponse(content=response.text) | ||
except ResponseValidationError as e: | ||
raise LLMGenerationError(e) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,54 @@ | ||
# Neo4j Sweden AB [https://neo4j.com] | ||
# # | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# # | ||
# https://www.apache.org/licenses/LICENSE-2.0 | ||
# # | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
from __future__ import annotations | ||
|
||
from unittest.mock import AsyncMock, MagicMock, Mock, patch | ||
|
||
import pytest | ||
from neo4j_graphrag.llm.vertexai import VertexAILLM | ||
|
||
|
||
@patch("neo4j_graphrag.llm.vertexai.GenerativeModel", None) | ||
def test_vertexai_llm_missing_dependency() -> None: | ||
with pytest.raises(ImportError): | ||
VertexAILLM(model_name="gemini-1.5-flash-001") | ||
|
||
|
||
@patch("neo4j_graphrag.llm.vertexai.GenerativeModel") | ||
def test_invoke_happy_path(GenerativeModelMock: MagicMock) -> None: | ||
mock_response = Mock() | ||
mock_response.text = "Return text" | ||
mock_model = GenerativeModelMock.return_value | ||
mock_model.generate_content.return_value = mock_response | ||
model_params = {"temperature": 0.5} | ||
llm = VertexAILLM("gemini-1.5-flash-001", model_params) | ||
input_text = "may thy knife chip and shatter" | ||
response = llm.invoke(input_text) | ||
assert response.content == "Return text" | ||
llm.model.generate_content.assert_called_once_with(input_text, **model_params) | ||
|
||
|
||
@pytest.mark.asyncio | ||
@patch("neo4j_graphrag.llm.vertexai.GenerativeModel") | ||
async def test_ainvoke_happy_path(GenerativeModelMock: MagicMock) -> None: | ||
mock_response = AsyncMock() | ||
mock_response.text = "Return text" | ||
mock_model = GenerativeModelMock.return_value | ||
mock_model.generate_content_async = AsyncMock(return_value=mock_response) | ||
model_params = {"temperature": 0.5} | ||
llm = VertexAILLM("gemini-1.5-flash-001", model_params) | ||
input_text = "may thy knife chip and shatter" | ||
response = await llm.ainvoke(input_text) | ||
assert response.content == "Return text" | ||
llm.model.generate_content_async.assert_called_once_with(input_text, **model_params) |