From 321ba1b8e15e40f7e36396856bb27b65ac688d50 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 13:52:06 +0000
Subject: [PATCH 1/9] Added tests for _format_schema helper function

---
 .../langchain_neo4j/graphs/neo4j_graph.py     |   8 +-
 .../integration_tests/graphs/test_neo4j.py    |  48 ++-
 .../unit_tests/graphs/test_neo4j_graph.py     | 384 +++++++++++++++++-
 3 files changed, 434 insertions(+), 6 deletions(-)

diff --git a/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py b/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py
index dd97de0..e6d2428 100644
--- a/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py
+++ b/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py
@@ -191,7 +191,7 @@ def _format_schema(schema: Dict, is_enhanced: bool) -> str:
                     "DATE_TIME",
                     "LOCAL_DATE_TIME",
                 ]:
-                    if prop.get("min") is not None:
+                    if prop.get("min") and prop.get("max"):
                         example = f'Min: {prop["min"]}, Max: {prop["max"]}'
                     else:
                         example = (
@@ -238,8 +238,8 @@ def _format_schema(schema: Dict, is_enhanced: bool) -> str:
                     "DATE_TIME",
                     "LOCAL_DATE_TIME",
                 ]:
-                    if prop.get("min"):  # If we have min/max
-                        example = f'Min: {prop["min"]}, Max:  {prop["max"]}'
+                    if prop.get("min") and prop.get("max"):  # If we have min/max
+                        example = f'Min: {prop["min"]}, Max: {prop["max"]}'
                     else:  # return a single value
                         example = (
                             f'Example: "{prop["values"][0]}"' if prop["values"] else ""
@@ -252,7 +252,7 @@ def _format_schema(schema: Dict, is_enhanced: bool) -> str:
                         f'Min Size: {prop["min_size"]}, Max Size: {prop["max_size"]}'
                     )
                 formatted_rel_props.append(
-                    f"  - `{prop['property']}: {prop['type']}` {example}"
+                    f"  - `{prop['property']}`: {prop['type']} {example}"
                 )
     else:
         # Format node properties
diff --git a/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py b/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py
index 6c27707..3f5c28f 100644
--- a/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py
+++ b/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py
@@ -1,5 +1,7 @@
 import os
+import urllib.parse
 
+import pytest
 from langchain_core.documents import Document
 
 from langchain_neo4j import Neo4jGraph
@@ -130,7 +132,7 @@ def test_neo4j_timeout() -> None:
 
 
 def test_neo4j_sanitize_values() -> None:
-    """Test that neo4j uses the timeout correctly."""
+    """Test that lists with more than 128 elements are removed from the results."""
     url = os.environ.get("NEO4J_URI", "bolt://localhost:7687")
     username = os.environ.get("NEO4J_USERNAME", "neo4j")
     password = os.environ.get("NEO4J_PASSWORD", "pleaseletmein")
@@ -558,3 +560,47 @@ def test_neo4j_multiple_close() -> None:
     # Test that multiple closes don't raise errors
     graph.close()
     graph.close()  # This should not raise an error
+
+
+def test_invalid_url() -> None:
+    """Test initializing with an invalid URL raises ValueError."""
+    url = os.environ.get("NEO4J_URI", "bolt://localhost:7687")
+    username = os.environ.get("NEO4J_USERNAME", "neo4j")
+    password = os.environ.get("NEO4J_PASSWORD", "pleaseletmein")
+    assert url is not None
+    assert username is not None
+    assert password is not None
+
+    # Parse the original URL
+    parsed_url = urllib.parse.urlparse(url)
+    # Increment the port number by 1 and wrap around if necessary
+    original_port = parsed_url.port or 7687
+    new_port = (original_port + 1) % 65535 or 1
+    # Reconstruct the netloc (hostname:port)
+    new_netloc = f"{parsed_url.hostname}:{new_port}"
+    # Rebuild the URL with the new netloc
+    new_url = parsed_url._replace(netloc=new_netloc).geturl()
+
+    with pytest.raises(ValueError) as exc_info:
+        Neo4jGraph(
+            url=new_url,
+            username=username,
+            password=password,
+        )
+    assert "Please ensure that the url is correct" in str(exc_info.value)
+
+
+def test_invalid_credentials() -> None:
+    """Test initializing with invalid credentials raises ValueError."""
+    url = os.environ.get("NEO4J_URI", "bolt://localhost:7687")
+    assert url is not None
+
+    with pytest.raises(ValueError) as exc_info:
+        Neo4jGraph(
+            url=url,
+            username="invalid_username",
+            password="invalid_password",
+        )
+    assert "Please ensure that the username and password are correct" in str(
+        exc_info.value
+    )
diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index 3a617b5..ce1b15c 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -1,8 +1,14 @@
+from types import ModuleType
+from typing import Mapping, Sequence, Union
 from unittest.mock import MagicMock, patch
 
 import pytest
 
-from langchain_neo4j.graphs.neo4j_graph import Neo4jGraph, value_sanitize
+from langchain_neo4j.graphs.neo4j_graph import (
+    Neo4jGraph,
+    _format_schema,
+    value_sanitize,
+)
 
 
 def test_value_sanitize_with_small_list() -> None:
@@ -148,3 +154,379 @@ def test_multiple_close_calls_safe() -> None:
 
         # Second close should not raise an error
         graph.close()  # Should not raise any exception
+
+
+def test_import_error() -> None:
+    """Test that ImportError is raised when neo4j package is not installed."""
+    original_import = __import__
+
+    def mock_import(
+        name: str,
+        globals: Union[Mapping[str, object], None] = None,
+        locals: Union[Mapping[str, object], None] = None,
+        fromlist: Sequence[str] = (),
+        level: int = 0,
+    ) -> ModuleType:
+        if name == "neo4j":
+            raise ImportError()
+        return original_import(name, globals, locals, fromlist, level)
+
+    with patch("builtins.__import__", side_effect=mock_import):
+        with pytest.raises(ImportError) as exc_info:
+            Neo4jGraph()
+        assert "Could not import neo4j python package." in str(exc_info.value)
+
+
+def test_format_schema_string_high_distinct_count() -> None:
+    schema = {
+        "node_props": {
+            "Person": [
+                {
+                    "property": "name",
+                    "type": "STRING",
+                    "values": ["Alice", "Bob", "Charlie"],
+                    "distinct_count": 11,  # Greater than DISTINCT_VALUE_LIMIT (10)
+                }
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Person**\n"
+        '  - `name`: STRING Example: "Alice"\n'
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_string_low_distinct_count() -> None:
+    schema = {
+        "node_props": {
+            "Animal": [
+                {
+                    "property": "species",
+                    "type": "STRING",
+                    "values": ["Cat", "Dog"],
+                    "distinct_count": 2,  # Less than DISTINCT_VALUE_LIMIT (10)
+                }
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Animal**\n"
+        "  - `species`: STRING Available options: ['Cat', 'Dog']\n"
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_numeric_with_min_max() -> None:
+    schema = {
+        "node_props": {
+            "Person": [{"property": "age", "type": "INTEGER", "min": 20, "max": 70}]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Person**\n"
+        "  - `age`: INTEGER Min: 20, Max: 70\n"
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_numeric_with_values() -> None:
+    schema = {
+        "node_props": {
+            "Event": [
+                {
+                    "property": "date",
+                    "type": "DATE",
+                    "values": ["2021-01-01", "2021-01-02"],
+                }
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Event**\n"
+        '  - `date`: DATE Example: "2021-01-01"\n'
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_list_skipped() -> None:
+    schema = {
+        "node_props": {
+            "Document": [
+                {
+                    "property": "embedding",
+                    "type": "LIST",
+                    "min_size": 150,  # Greater than LIST_LIMIT (128)
+                    "max_size": 200,
+                }
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Document**\n"
+        # 'embedding' property should be skipped
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_list_included() -> None:
+    schema = {
+        "node_props": {
+            "Document": [
+                {"property": "keywords", "type": "LIST", "min_size": 2, "max_size": 5}
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Document**\n"
+        "  - `keywords`: LIST Min Size: 2, Max Size: 5\n"
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_rel_string_high_distinct_count() -> None:
+    schema = {
+        "node_props": {},
+        "rel_props": {
+            "KNOWS": [
+                {
+                    "property": "since",
+                    "type": "STRING",
+                    "values": ["2000", "2001", "2002"],
+                    "distinct_count": 15,
+                }
+            ]
+        },
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "\n"
+        "Relationship properties:\n"
+        "- **KNOWS**\n"
+        '  - `since`: STRING Example: "2000"\n'
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_rel_string_low_distinct_count() -> None:
+    schema = {
+        "node_props": {},
+        "rel_props": {
+            "LIKES": [
+                {
+                    "property": "intensity",
+                    "type": "STRING",
+                    "values": ["High", "Medium", "Low"],
+                    "distinct_count": 3,
+                }
+            ]
+        },
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "\n"
+        "Relationship properties:\n"
+        "- **LIKES**\n"
+        "  - `intensity`: STRING Available options: ['High', 'Medium', 'Low']\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_rel_numeric_with_min_max() -> None:
+    schema = {
+        "node_props": {},
+        "rel_props": {
+            "WORKS_WITH": [
+                {"property": "since", "type": "INTEGER", "min": 1995, "max": 2020}
+            ]
+        },
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "\n"
+        "Relationship properties:\n"
+        "- **WORKS_WITH**\n"
+        "  - `since`: INTEGER Min: 1995, Max: 2020\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_rel_list_skipped() -> None:
+    schema = {
+        "node_props": {},
+        "rel_props": {
+            "KNOWS": [
+                {
+                    "property": "embedding",
+                    "type": "LIST",
+                    "min_size": 150,
+                    "max_size": 200,
+                }
+            ]
+        },
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "\n"
+        "Relationship properties:\n"
+        "- **KNOWS**\n"
+        # 'embedding' property should be skipped
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_rel_list_included() -> None:
+    schema = {
+        "node_props": {},
+        "rel_props": {
+            "KNOWS": [
+                {"property": "messages", "type": "LIST", "min_size": 2, "max_size": 5}
+            ]
+        },
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "\n"
+        "Relationship properties:\n"
+        "- **KNOWS**\n"
+        "  - `messages`: LIST Min Size: 2, Max Size: 5\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_rel_numeric_no_min_max() -> None:
+    schema = {
+        "node_props": {},
+        "rel_props": {
+            "OWES": [
+                {
+                    "property": "amount",
+                    "type": "FLOAT",
+                    # 'min' and 'max' are missing
+                    "values": [3.14, 2.71],
+                }
+            ]
+        },
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "\n"
+        "Relationship properties:\n"
+        "- **OWES**\n"
+        '  - `amount`: FLOAT Example: "3.14"\n'
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_values_empty() -> None:
+    schema = {
+        "node_props": {
+            "Person": [
+                {
+                    "property": "name",
+                    "type": "STRING",
+                    "values": [],
+                    "distinct_count": 15,
+                }
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Person**\n"
+        "  - `name`: STRING \n"  # Example should be empty
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output
+
+
+def test_format_schema_values_none() -> None:
+    schema = {
+        "node_props": {
+            "Person": [
+                {
+                    "property": "name",
+                    "type": "STRING",
+                    # 'values' is missing
+                    "distinct_count": 15,
+                }
+            ]
+        },
+        "rel_props": {},
+        "relationships": [],
+    }
+    expected_output = (
+        "Node properties:\n"
+        "- **Person**\n"
+        "  - `name`: STRING \n"  # Example should be empty
+        "Relationship properties:\n"
+        "\n"
+        "The relationships:\n"
+    )
+    result = _format_schema(schema, is_enhanced=True)
+    assert result == expected_output

From 6df56ac7293ca1e1fae1d830f10bf5f628cce201 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 14:20:51 +0000
Subject: [PATCH 2/9] Added mock Neo4j driver to Neo4jGraph tests

---
 .../unit_tests/graphs/test_neo4j_graph.py     | 147 ++++++++----------
 1 file changed, 65 insertions(+), 82 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index ce1b15c..76d32ad 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -11,6 +11,17 @@
 )
 
 
+@pytest.fixture
+def mock_neo4j_driver():
+    with patch("neo4j.GraphDatabase.driver", autospec=True) as mock_driver:
+        mock_driver_instance = MagicMock()
+        mock_driver.return_value = mock_driver_instance
+        mock_driver_instance.verify_connectivity.return_value = None
+        mock_driver_instance.execute_query = MagicMock(return_value=([], None, None))
+        mock_driver_instance._closed = False
+        yield mock_driver_instance
+
+
 def test_value_sanitize_with_small_list() -> None:
     small_list = list(range(15))  # list size > LIST_LIMIT
     input_dict = {"key1": "value1", "small_list": small_list}
@@ -51,109 +62,81 @@ def test_value_sanitize_with_dict_in_nested_list() -> None:
     assert value_sanitize(input_dict) == expected_output
 
 
-def test_driver_state_management() -> None:
+def test_driver_state_management(mock_neo4j_driver: MagicMock) -> None:
     """Comprehensive test for driver state management."""
-    with patch("neo4j.GraphDatabase.driver", autospec=True) as mock_driver:
-        # Setup mock driver
-        mock_driver_instance = MagicMock()
-        mock_driver.return_value = mock_driver_instance
-        mock_driver_instance.execute_query = MagicMock(return_value=([], None, None))
-
-        # Create graph instance
-        graph = Neo4jGraph(
-            url="bolt://localhost:7687", username="neo4j", password="password"
-        )
+    # Create graph instance
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
 
-        # Store original driver
-        original_driver = graph._driver
-        assert isinstance(original_driver.close, MagicMock)
+    # Store original driver
+    original_driver = graph._driver
+    assert isinstance(original_driver.close, MagicMock)
 
-        # Test initial state
-        assert hasattr(graph, "_driver")
+    # Test initial state
+    assert hasattr(graph, "_driver")
 
-        # First close
-        graph.close()
-        original_driver.close.assert_called_once()
-        assert not hasattr(graph, "_driver")
+    # First close
+    graph.close()
+    original_driver.close.assert_called_once()
+    assert not hasattr(graph, "_driver")
 
-        # Verify methods raise error when driver is closed
-        with pytest.raises(
-            RuntimeError,
-            match="Cannot perform operations - Neo4j connection has been closed",
-        ):
-            graph.query("RETURN 1")
+    # Verify methods raise error when driver is closed
+    with pytest.raises(
+        RuntimeError,
+        match="Cannot perform operations - Neo4j connection has been closed",
+    ):
+        graph.query("RETURN 1")
 
-        with pytest.raises(
-            RuntimeError,
-            match="Cannot perform operations - Neo4j connection has been closed",
-        ):
-            graph.refresh_schema()
+    with pytest.raises(
+        RuntimeError,
+        match="Cannot perform operations - Neo4j connection has been closed",
+    ):
+        graph.refresh_schema()
 
 
-def test_close_method_removes_driver() -> None:
+def test_close_method_removes_driver(mock_neo4j_driver: MagicMock) -> None:
     """Test that close method removes the _driver attribute."""
-    with patch("neo4j.GraphDatabase.driver", autospec=True) as mock_driver:
-        # Configure mock to return a mock driver
-        mock_driver_instance = MagicMock()
-        mock_driver.return_value = mock_driver_instance
-
-        # Configure mock execute_query to return empty result
-        mock_driver_instance.execute_query = MagicMock(return_value=([], None, None))
-
-        # Add a _closed attribute to simulate driver state
-        mock_driver_instance._closed = False
-
-        graph = Neo4jGraph(
-            url="bolt://localhost:7687", username="neo4j", password="password"
-        )
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
 
-        # Store a reference to the original driver
-        original_driver = graph._driver
-        assert isinstance(original_driver.close, MagicMock)
+    # Store a reference to the original driver
+    original_driver = graph._driver
+    assert isinstance(original_driver.close, MagicMock)
 
-        # Call close method
-        graph.close()
+    # Call close method
+    graph.close()
 
-        # Verify driver.close was called
-        original_driver.close.assert_called_once()
+    # Verify driver.close was called
+    original_driver.close.assert_called_once()
 
-        # Verify _driver attribute is removed
-        assert not hasattr(graph, "_driver")
+    # Verify _driver attribute is removed
+    assert not hasattr(graph, "_driver")
 
-        # Verify second close does not raise an error
-        graph.close()  # Should not raise any exception
+    # Verify second close does not raise an error
+    graph.close()  # Should not raise any exception
 
 
-def test_multiple_close_calls_safe() -> None:
+def test_multiple_close_calls_safe(mock_neo4j_driver: MagicMock) -> None:
     """Test that multiple close calls do not raise errors."""
-    with patch("neo4j.GraphDatabase.driver", autospec=True) as mock_driver:
-        # Configure mock to return a mock driver
-        mock_driver_instance = MagicMock()
-        mock_driver.return_value = mock_driver_instance
-
-        # Configure mock execute_query to return empty result
-        mock_driver_instance.execute_query = MagicMock(return_value=([], None, None))
-
-        # Add a _closed attribute to simulate driver state
-        mock_driver_instance._closed = False
-
-        graph = Neo4jGraph(
-            url="bolt://localhost:7687", username="neo4j", password="password"
-        )
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
 
-        # Store a reference to the original driver
-        original_driver = graph._driver
-        assert isinstance(original_driver.close, MagicMock)
+    # Store a reference to the original driver
+    original_driver = graph._driver
+    assert isinstance(original_driver.close, MagicMock)
 
-        # First close
-        graph.close()
-        original_driver.close.assert_called_once()
+    # First close
+    graph.close()
+    original_driver.close.assert_called_once()
 
-        # Verify _driver attribute is removed
-        assert not hasattr(graph, "_driver")
+    # Verify _driver attribute is removed
+    assert not hasattr(graph, "_driver")
 
-        # Second close should not raise an error
-        graph.close()  # Should not raise any exception
+    # Second close should not raise an error
+    graph.close()  # Should not raise any exception
 
 
 def test_import_error() -> None:

From fa317aae2b850c7770a26a097eeee8105d99f851 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 16:09:33 +0000
Subject: [PATCH 3/9] Added _enhanced_schema_cypher tests

---
 .../unit_tests/graphs/test_neo4j_graph.py     | 206 +++++++++++++++++-
 1 file changed, 204 insertions(+), 2 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index 76d32ad..f8c4ecf 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -1,5 +1,5 @@
 from types import ModuleType
-from typing import Mapping, Sequence, Union
+from typing import Generator, Mapping, Sequence, Union
 from unittest.mock import MagicMock, patch
 
 import pytest
@@ -12,7 +12,7 @@
 
 
 @pytest.fixture
-def mock_neo4j_driver():
+def mock_neo4j_driver() -> Generator[MagicMock, None, None]:
     with patch("neo4j.GraphDatabase.driver", autospec=True) as mock_driver:
         mock_driver_instance = MagicMock()
         mock_driver.return_value = mock_driver_instance
@@ -160,6 +160,9 @@ def mock_import(
         assert "Could not import neo4j python package." in str(exc_info.value)
 
 
+# _format_schema tests
+
+
 def test_format_schema_string_high_distinct_count() -> None:
     schema = {
         "node_props": {
@@ -513,3 +516,202 @@ def test_format_schema_values_none() -> None:
     )
     result = _format_schema(schema, is_enhanced=True)
     assert result == expected_output
+
+
+# _enhanced_schema_cypher tests
+
+
+def test_enhanced_schema_cypher_integer_exhaustive_true(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+
+    graph.structured_schema = {"metadata": {"index": []}}
+    properties = [{"property": "age", "type": "INTEGER"}]
+    query = graph._enhanced_schema_cypher("Person", properties, exhaustive=True)
+    assert "min(n.`age`) AS `age_min`" in query
+    assert "max(n.`age`) AS `age_max`" in query
+    assert "count(distinct n.`age`) AS `age_distinct`" in query
+    assert (
+        "min: toString(`age_min`), max: toString(`age_max`), "
+        "distinct_count: `age_distinct`" in query
+    )
+
+
+def test_enhanced_schema_cypher_list_exhaustive_true(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    graph.structured_schema = {"metadata": {"index": []}}
+    properties = [{"property": "tags", "type": "LIST"}]
+    query = graph._enhanced_schema_cypher("Article", properties, exhaustive=True)
+    assert "min(size(n.`tags`)) AS `tags_size_min`" in query
+    assert "max(size(n.`tags`)) AS `tags_size_max`" in query
+    assert "min_size: `tags_size_min`, max_size: `tags_size_max`" in query
+
+
+def test_enhanced_schema_cypher_boolean_exhaustive_true(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    properties = [{"property": "active", "type": "BOOLEAN"}]
+    query = graph._enhanced_schema_cypher("User", properties, exhaustive=True)
+    # BOOLEAN types should be skipped, so their properties should not be in the query
+    assert "n.`active`" not in query
+
+
+def test_enhanced_schema_cypher_integer_exhaustive_false_no_index(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    graph.structured_schema = {"metadata": {"index": []}}
+    properties = [{"property": "age", "type": "INTEGER"}]
+    query = graph._enhanced_schema_cypher("Person", properties, exhaustive=False)
+    assert "collect(distinct toString(n.`age`)) AS `age_values`" in query
+    assert "values: `age_values`" in query
+
+
+def test_enhanced_schema_cypher_integer_exhaustive_false_with_index(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    graph.structured_schema = {
+        "metadata": {
+            "index": [
+                {
+                    "label": "Person",
+                    "properties": ["age"],
+                    "type": "RANGE",
+                }
+            ]
+        }
+    }
+    properties = [{"property": "age", "type": "INTEGER"}]
+    query = graph._enhanced_schema_cypher("Person", properties, exhaustive=False)
+    assert "min(n.`age`) AS `age_min`" in query
+    assert "max(n.`age`) AS `age_max`" in query
+    assert "count(distinct n.`age`) AS `age_distinct`" in query
+    assert (
+        "min: toString(`age_min`), max: toString(`age_max`), "
+        "distinct_count: `age_distinct`" in query
+    )
+
+
+def test_enhanced_schema_cypher_list_exhaustive_false(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    properties = [{"property": "tags", "type": "LIST"}]
+    query = graph._enhanced_schema_cypher("Article", properties, exhaustive=False)
+    assert "min(size(n.`tags`)) AS `tags_size_min`" in query
+    assert "max(size(n.`tags`)) AS `tags_size_max`" in query
+    assert "min_size: `tags_size_min`, max_size: `tags_size_max`" in query
+
+
+def test_enhanced_schema_cypher_boolean_exhaustive_false(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    properties = [{"property": "active", "type": "BOOLEAN"}]
+    query = graph._enhanced_schema_cypher("User", properties, exhaustive=False)
+    # BOOLEAN types should be skipped, so their properties should not be in the query
+    assert "n.`active`" not in query
+
+
+def test_enhanced_schema_cypher_string_exhaustive_false_with_index(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    graph.structured_schema = {
+        "metadata": {
+            "index": [
+                {
+                    "label": "Person",
+                    "properties": ["status"],
+                    "type": "RANGE",
+                    "size": 5,
+                    "distinctValues": 5,
+                }
+            ]
+        }
+    }
+    graph.query = MagicMock(return_value=[{"value": ["Single", "Married", "Divorced"]}])
+    properties = [{"property": "status", "type": "STRING"}]
+    query = graph._enhanced_schema_cypher("Person", properties, exhaustive=False)
+    assert "values: ['Single', 'Married', 'Divorced'], distinct_count: 3" in query
+
+
+def test_enhanced_schema_cypher_string_exhaustive_false_no_index(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    graph.structured_schema = {"metadata": {"index": []}}
+    properties = [{"property": "status", "type": "STRING"}]
+    query = graph._enhanced_schema_cypher("Person", properties, exhaustive=False)
+    assert (
+        "collect(distinct substring(toString(n.`status`), 0, 50)) AS `status_values`"
+        in query
+    )
+    assert "values: `status_values`" in query
+
+
+def test_enhanced_schema_cypher_point_type(mock_neo4j_driver: MagicMock) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    properties = [{"property": "location", "type": "POINT"}]
+    query = graph._enhanced_schema_cypher("Place", properties, exhaustive=True)
+    # POINT types should be skipped
+    assert "n.`location`" not in query
+
+
+def test_enhanced_schema_cypher_duration_type(mock_neo4j_driver: MagicMock) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    properties = [{"property": "duration", "type": "DURATION"}]
+    query = graph._enhanced_schema_cypher("Event", properties, exhaustive=False)
+    # DURATION types should be skipped
+    assert "n.`duration`" not in query
+
+
+def test_enhanced_schema_cypher_relationship(mock_neo4j_driver: MagicMock) -> None:
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687", username="neo4j", password="password"
+    )
+    properties = [{"property": "since", "type": "INTEGER"}]
+
+    query = graph._enhanced_schema_cypher(
+        label_or_type="FRIENDS_WITH",
+        properties=properties,
+        exhaustive=True,
+        is_relationship=True,
+    )
+
+    assert query.startswith("MATCH ()-[n:`FRIENDS_WITH`]->()")
+    assert "min(n.`since`) AS `since_min`" in query
+    assert "max(n.`since`) AS `since_max`" in query
+    assert "count(distinct n.`since`) AS `since_distinct`" in query
+    expected_return_clause = (
+        "`since`: {min: toString(`since_min`), max: toString(`since_max`), "
+        "distinct_count: `since_distinct`}"
+    )
+    assert expected_return_clause in query

From 4b73061155679b5c5f6e5db65edb3a2755d8d3a2 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 16:22:38 +0000
Subject: [PATCH 4/9] Parametrised _format_schema tests

---
 .../unit_tests/graphs/test_neo4j_graph.py     | 699 +++++++++---------
 1 file changed, 347 insertions(+), 352 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index f8c4ecf..34e9a52 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -163,359 +163,354 @@ def mock_import(
 # _format_schema tests
 
 
-def test_format_schema_string_high_distinct_count() -> None:
-    schema = {
-        "node_props": {
-            "Person": [
-                {
-                    "property": "name",
-                    "type": "STRING",
-                    "values": ["Alice", "Bob", "Charlie"],
-                    "distinct_count": 11,  # Greater than DISTINCT_VALUE_LIMIT (10)
-                }
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Person**\n"
-        '  - `name`: STRING Example: "Alice"\n'
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_string_low_distinct_count() -> None:
-    schema = {
-        "node_props": {
-            "Animal": [
-                {
-                    "property": "species",
-                    "type": "STRING",
-                    "values": ["Cat", "Dog"],
-                    "distinct_count": 2,  # Less than DISTINCT_VALUE_LIMIT (10)
-                }
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Animal**\n"
-        "  - `species`: STRING Available options: ['Cat', 'Dog']\n"
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_numeric_with_min_max() -> None:
-    schema = {
-        "node_props": {
-            "Person": [{"property": "age", "type": "INTEGER", "min": 20, "max": 70}]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Person**\n"
-        "  - `age`: INTEGER Min: 20, Max: 70\n"
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_numeric_with_values() -> None:
-    schema = {
-        "node_props": {
-            "Event": [
-                {
-                    "property": "date",
-                    "type": "DATE",
-                    "values": ["2021-01-01", "2021-01-02"],
-                }
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Event**\n"
-        '  - `date`: DATE Example: "2021-01-01"\n'
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_list_skipped() -> None:
-    schema = {
-        "node_props": {
-            "Document": [
-                {
-                    "property": "embedding",
-                    "type": "LIST",
-                    "min_size": 150,  # Greater than LIST_LIMIT (128)
-                    "max_size": 200,
-                }
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Document**\n"
-        # 'embedding' property should be skipped
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_list_included() -> None:
-    schema = {
-        "node_props": {
-            "Document": [
-                {"property": "keywords", "type": "LIST", "min_size": 2, "max_size": 5}
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Document**\n"
-        "  - `keywords`: LIST Min Size: 2, Max Size: 5\n"
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_rel_string_high_distinct_count() -> None:
-    schema = {
-        "node_props": {},
-        "rel_props": {
-            "KNOWS": [
-                {
-                    "property": "since",
-                    "type": "STRING",
-                    "values": ["2000", "2001", "2002"],
-                    "distinct_count": 15,
-                }
-            ]
-        },
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "\n"
-        "Relationship properties:\n"
-        "- **KNOWS**\n"
-        '  - `since`: STRING Example: "2000"\n'
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_rel_string_low_distinct_count() -> None:
-    schema = {
-        "node_props": {},
-        "rel_props": {
-            "LIKES": [
-                {
-                    "property": "intensity",
-                    "type": "STRING",
-                    "values": ["High", "Medium", "Low"],
-                    "distinct_count": 3,
-                }
-            ]
-        },
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "\n"
-        "Relationship properties:\n"
-        "- **LIKES**\n"
-        "  - `intensity`: STRING Available options: ['High', 'Medium', 'Low']\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_rel_numeric_with_min_max() -> None:
-    schema = {
-        "node_props": {},
-        "rel_props": {
-            "WORKS_WITH": [
-                {"property": "since", "type": "INTEGER", "min": 1995, "max": 2020}
-            ]
-        },
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "\n"
-        "Relationship properties:\n"
-        "- **WORKS_WITH**\n"
-        "  - `since`: INTEGER Min: 1995, Max: 2020\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_rel_list_skipped() -> None:
-    schema = {
-        "node_props": {},
-        "rel_props": {
-            "KNOWS": [
-                {
-                    "property": "embedding",
-                    "type": "LIST",
-                    "min_size": 150,
-                    "max_size": 200,
-                }
-            ]
-        },
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "\n"
-        "Relationship properties:\n"
-        "- **KNOWS**\n"
-        # 'embedding' property should be skipped
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_rel_list_included() -> None:
-    schema = {
-        "node_props": {},
-        "rel_props": {
-            "KNOWS": [
-                {"property": "messages", "type": "LIST", "min_size": 2, "max_size": 5}
-            ]
-        },
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "\n"
-        "Relationship properties:\n"
-        "- **KNOWS**\n"
-        "  - `messages`: LIST Min Size: 2, Max Size: 5\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_rel_numeric_no_min_max() -> None:
-    schema = {
-        "node_props": {},
-        "rel_props": {
-            "OWES": [
-                {
-                    "property": "amount",
-                    "type": "FLOAT",
-                    # 'min' and 'max' are missing
-                    "values": [3.14, 2.71],
-                }
-            ]
-        },
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "\n"
-        "Relationship properties:\n"
-        "- **OWES**\n"
-        '  - `amount`: FLOAT Example: "3.14"\n'
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_values_empty() -> None:
-    schema = {
-        "node_props": {
-            "Person": [
-                {
-                    "property": "name",
-                    "type": "STRING",
-                    "values": [],
-                    "distinct_count": 15,
-                }
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Person**\n"
-        "  - `name`: STRING \n"  # Example should be empty
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
-    result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
-
-
-def test_format_schema_values_none() -> None:
-    schema = {
-        "node_props": {
-            "Person": [
-                {
-                    "property": "name",
-                    "type": "STRING",
-                    # 'values' is missing
-                    "distinct_count": 15,
-                }
-            ]
-        },
-        "rel_props": {},
-        "relationships": [],
-    }
-    expected_output = (
-        "Node properties:\n"
-        "- **Person**\n"
-        "  - `name`: STRING \n"  # Example should be empty
-        "Relationship properties:\n"
-        "\n"
-        "The relationships:\n"
-    )
+@pytest.mark.parametrize(
+    "description, schema, expected_output",
+    [
+        (
+            "String property with high distinct count",
+            {
+                "node_props": {
+                    "Person": [
+                        {
+                            "property": "name",
+                            "type": "STRING",
+                            "values": ["Alice", "Bob", "Charlie"],
+                            "distinct_count": 11,
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Person**\n"
+                '  - `name`: STRING Example: "Alice"\n'
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "String property with low distinct count",
+            {
+                "node_props": {
+                    "Animal": [
+                        {
+                            "property": "species",
+                            "type": "STRING",
+                            "values": ["Cat", "Dog"],
+                            "distinct_count": 2,
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Animal**\n"
+                "  - `species`: STRING Available options: ['Cat', 'Dog']\n"
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Numeric property with min and max",
+            {
+                "node_props": {
+                    "Person": [
+                        {"property": "age", "type": "INTEGER", "min": 20, "max": 70}
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Person**\n"
+                "  - `age`: INTEGER Min: 20, Max: 70\n"
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Numeric property with values",
+            {
+                "node_props": {
+                    "Event": [
+                        {
+                            "property": "date",
+                            "type": "DATE",
+                            "values": ["2021-01-01", "2021-01-02"],
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Event**\n"
+                '  - `date`: DATE Example: "2021-01-01"\n'
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "List property that should be skipped",
+            {
+                "node_props": {
+                    "Document": [
+                        {
+                            "property": "embedding",
+                            "type": "LIST",
+                            "min_size": 150,
+                            "max_size": 200,
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Document**\n"
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "List property that should be included",
+            {
+                "node_props": {
+                    "Document": [
+                        {
+                            "property": "keywords",
+                            "type": "LIST",
+                            "min_size": 2,
+                            "max_size": 5,
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Document**\n"
+                "  - `keywords`: LIST Min Size: 2, Max Size: 5\n"
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Relationship string property with high distinct count",
+            {
+                "node_props": {},
+                "rel_props": {
+                    "KNOWS": [
+                        {
+                            "property": "since",
+                            "type": "STRING",
+                            "values": ["2000", "2001", "2002"],
+                            "distinct_count": 15,
+                        }
+                    ]
+                },
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "\n"
+                "Relationship properties:\n"
+                "- **KNOWS**\n"
+                '  - `since`: STRING Example: "2000"\n'
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Relationship string property with low distinct count",
+            {
+                "node_props": {},
+                "rel_props": {
+                    "LIKES": [
+                        {
+                            "property": "intensity",
+                            "type": "STRING",
+                            "values": ["High", "Medium", "Low"],
+                            "distinct_count": 3,
+                        }
+                    ]
+                },
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "\n"
+                "Relationship properties:\n"
+                "- **LIKES**\n"
+                "  - `intensity`: STRING Available options: ['High', 'Medium', 'Low']\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Relationship numeric property with min and max",
+            {
+                "node_props": {},
+                "rel_props": {
+                    "WORKS_WITH": [
+                        {
+                            "property": "since",
+                            "type": "INTEGER",
+                            "min": 1995,
+                            "max": 2020,
+                        }
+                    ]
+                },
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "\n"
+                "Relationship properties:\n"
+                "- **WORKS_WITH**\n"
+                "  - `since`: INTEGER Min: 1995, Max: 2020\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Relationship list property that should be skipped",
+            {
+                "node_props": {},
+                "rel_props": {
+                    "KNOWS": [
+                        {
+                            "property": "embedding",
+                            "type": "LIST",
+                            "min_size": 150,
+                            "max_size": 200,
+                        }
+                    ]
+                },
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "\n"
+                "Relationship properties:\n"
+                "- **KNOWS**\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Relationship list property that should be included",
+            {
+                "node_props": {},
+                "rel_props": {
+                    "KNOWS": [
+                        {
+                            "property": "messages",
+                            "type": "LIST",
+                            "min_size": 2,
+                            "max_size": 5,
+                        }
+                    ]
+                },
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "\n"
+                "Relationship properties:\n"
+                "- **KNOWS**\n"
+                "  - `messages`: LIST Min Size: 2, Max Size: 5\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Relationship numeric property without min and max",
+            {
+                "node_props": {},
+                "rel_props": {
+                    "OWES": [
+                        {
+                            "property": "amount",
+                            "type": "FLOAT",
+                            "values": [3.14, 2.71],
+                        }
+                    ]
+                },
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "\n"
+                "Relationship properties:\n"
+                "- **OWES**\n"
+                '  - `amount`: FLOAT Example: "3.14"\n'
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Property with empty values list",
+            {
+                "node_props": {
+                    "Person": [
+                        {
+                            "property": "name",
+                            "type": "STRING",
+                            "values": [],
+                            "distinct_count": 15,
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Person**\n"
+                "  - `name`: STRING \n"
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+        (
+            "Property with missing values",
+            {
+                "node_props": {
+                    "Person": [
+                        {
+                            "property": "name",
+                            "type": "STRING",
+                            "distinct_count": 15,
+                        }
+                    ]
+                },
+                "rel_props": {},
+                "relationships": [],
+            },
+            (
+                "Node properties:\n"
+                "- **Person**\n"
+                "  - `name`: STRING \n"
+                "Relationship properties:\n"
+                "\n"
+                "The relationships:\n"
+            ),
+        ),
+    ],
+)
+def test_format_schema(description, schema, expected_output):
     result = _format_schema(schema, is_enhanced=True)
-    assert result == expected_output
+    assert result == expected_output, f"Failed test case: {description}"
 
 
 # _enhanced_schema_cypher tests

From 5a73219275148e71507fb6dc02ce698ef438be76 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 16:36:55 +0000
Subject: [PATCH 5/9] Parametrised value_sanitize tests

---
 .../unit_tests/graphs/test_neo4j_graph.py     | 84 +++++++++----------
 1 file changed, 42 insertions(+), 42 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index 34e9a52..59e671c 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -22,44 +22,48 @@ def mock_neo4j_driver() -> Generator[MagicMock, None, None]:
         yield mock_driver_instance
 
 
-def test_value_sanitize_with_small_list() -> None:
-    small_list = list(range(15))  # list size > LIST_LIMIT
-    input_dict = {"key1": "value1", "small_list": small_list}
-    expected_output = {"key1": "value1", "small_list": small_list}
-    assert value_sanitize(input_dict) == expected_output
-
-
-def test_value_sanitize_with_oversized_list() -> None:
-    oversized_list = list(range(150))  # list size > LIST_LIMIT
-    input_dict = {"key1": "value1", "oversized_list": oversized_list}
-    expected_output = {
-        "key1": "value1"
-        # oversized_list should not be included
-    }
-    assert value_sanitize(input_dict) == expected_output
-
-
-def test_value_sanitize_with_nested_oversized_list() -> None:
-    oversized_list = list(range(150))  # list size > LIST_LIMIT
-    input_dict = {"key1": "value1", "oversized_list": {"key": oversized_list}}
-    expected_output = {"key1": "value1", "oversized_list": {}}
-    assert value_sanitize(input_dict) == expected_output
-
-
-def test_value_sanitize_with_dict_in_list() -> None:
-    oversized_list = list(range(150))  # list size > LIST_LIMIT
-    input_dict = {"key1": "value1", "oversized_list": [1, 2, {"key": oversized_list}]}
-    expected_output = {"key1": "value1", "oversized_list": [1, 2, {}]}
-    assert value_sanitize(input_dict) == expected_output
-
-
-def test_value_sanitize_with_dict_in_nested_list() -> None:
-    input_dict = {
-        "key1": "value1",
-        "deeply_nested_lists": [[[[{"final_nested_key": list(range(200))}]]]],
-    }
-    expected_output = {"key1": "value1", "deeply_nested_lists": [[[[{}]]]]}
-    assert value_sanitize(input_dict) == expected_output
+@pytest.mark.parametrize(
+    "description, input_value, expected_output",
+    [
+        (
+            "Small list",
+            {"key1": "value1", "small_list": list(range(15))},
+            {"key1": "value1", "small_list": list(range(15))},
+        ),
+        (
+            "Oversized list",
+            {"key1": "value1", "oversized_list": list(range(150))},
+            {"key1": "value1"},
+        ),
+        (
+            "Nested oversized list",
+            {"key1": "value1", "oversized_list": {"key": list(range(150))}},
+            {"key1": "value1", "oversized_list": {}},
+        ),
+        (
+            "Dict in list",
+            {"key1": "value1", "oversized_list": [1, 2, {"key": list(range(150))}]},
+            {"key1": "value1", "oversized_list": [1, 2, {}]},
+        ),
+        (
+            "Dict in nested list",
+            {
+                "key1": "value1",
+                "deeply_nested_lists": [[[[{"final_nested_key": list(range(200))}]]]],
+            },
+            {"key1": "value1", "deeply_nested_lists": [[[[{}]]]]},
+        ),
+        (
+            "None value",
+            None,
+            None,
+        ),
+    ],
+)
+def test_value_sanitize(description, input_value, expected_output):
+    assert (
+        value_sanitize(input_value) == expected_output
+    ), f"Failed test case: {description}"
 
 
 def test_driver_state_management(mock_neo4j_driver: MagicMock) -> None:
@@ -159,10 +163,6 @@ def mock_import(
             Neo4jGraph()
         assert "Could not import neo4j python package." in str(exc_info.value)
 
-
-# _format_schema tests
-
-
 @pytest.mark.parametrize(
     "description, schema, expected_output",
     [

From d68209bfb9cb29eaea25176d0abc8b1d5b72e5ce Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 17:22:36 +0000
Subject: [PATCH 6/9] test_format_schema refactoring

---
 .../unit_tests/graphs/test_neo4j_graph.py     | 49 ++++++++++++-------
 1 file changed, 32 insertions(+), 17 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index 59e671c..02e8dad 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -163,11 +163,12 @@ def mock_import(
             Neo4jGraph()
         assert "Could not import neo4j python package." in str(exc_info.value)
 
+
 @pytest.mark.parametrize(
-    "description, schema, expected_output",
+    "description, schema, is_enhanced, expected_output",
     [
         (
-            "String property with high distinct count",
+            "Enhanced, string property with high distinct count",
             {
                 "node_props": {
                     "Person": [
@@ -182,6 +183,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Person**\n"
@@ -192,7 +194,7 @@ def mock_import(
             ),
         ),
         (
-            "String property with low distinct count",
+            "Enhanced, string property with low distinct count",
             {
                 "node_props": {
                     "Animal": [
@@ -207,6 +209,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Animal**\n"
@@ -217,7 +220,7 @@ def mock_import(
             ),
         ),
         (
-            "Numeric property with min and max",
+            "Enhanced, numeric property with min and max",
             {
                 "node_props": {
                     "Person": [
@@ -227,6 +230,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Person**\n"
@@ -237,7 +241,7 @@ def mock_import(
             ),
         ),
         (
-            "Numeric property with values",
+            "Enhanced, numeric property with values",
             {
                 "node_props": {
                     "Event": [
@@ -251,6 +255,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Event**\n"
@@ -261,7 +266,7 @@ def mock_import(
             ),
         ),
         (
-            "List property that should be skipped",
+            "Enhanced, list property that should be skipped",
             {
                 "node_props": {
                     "Document": [
@@ -276,6 +281,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Document**\n"
@@ -285,7 +291,7 @@ def mock_import(
             ),
         ),
         (
-            "List property that should be included",
+            "Enhanced, list property that should be included",
             {
                 "node_props": {
                     "Document": [
@@ -300,6 +306,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Document**\n"
@@ -310,7 +317,7 @@ def mock_import(
             ),
         ),
         (
-            "Relationship string property with high distinct count",
+            "Enhanced, relationship string property with high distinct count",
             {
                 "node_props": {},
                 "rel_props": {
@@ -325,6 +332,7 @@ def mock_import(
                 },
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "\n"
@@ -335,7 +343,7 @@ def mock_import(
             ),
         ),
         (
-            "Relationship string property with low distinct count",
+            "Enhanced, relationship string property with low distinct count",
             {
                 "node_props": {},
                 "rel_props": {
@@ -350,6 +358,7 @@ def mock_import(
                 },
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "\n"
@@ -360,7 +369,7 @@ def mock_import(
             ),
         ),
         (
-            "Relationship numeric property with min and max",
+            "Enhanced, relationship numeric property with min and max",
             {
                 "node_props": {},
                 "rel_props": {
@@ -375,6 +384,7 @@ def mock_import(
                 },
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "\n"
@@ -385,7 +395,7 @@ def mock_import(
             ),
         ),
         (
-            "Relationship list property that should be skipped",
+            "Enhanced, relationship list property that should be skipped",
             {
                 "node_props": {},
                 "rel_props": {
@@ -400,6 +410,7 @@ def mock_import(
                 },
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "\n"
@@ -409,7 +420,7 @@ def mock_import(
             ),
         ),
         (
-            "Relationship list property that should be included",
+            "Enhanced, relationship list property that should be included",
             {
                 "node_props": {},
                 "rel_props": {
@@ -424,6 +435,7 @@ def mock_import(
                 },
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "\n"
@@ -434,7 +446,7 @@ def mock_import(
             ),
         ),
         (
-            "Relationship numeric property without min and max",
+            "Enhanced, relationship numeric property without min and max",
             {
                 "node_props": {},
                 "rel_props": {
@@ -448,6 +460,7 @@ def mock_import(
                 },
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "\n"
@@ -458,7 +471,7 @@ def mock_import(
             ),
         ),
         (
-            "Property with empty values list",
+            "Enhanced, property with empty values list",
             {
                 "node_props": {
                     "Person": [
@@ -473,6 +486,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Person**\n"
@@ -483,7 +497,7 @@ def mock_import(
             ),
         ),
         (
-            "Property with missing values",
+            "Enhanced, property with missing values",
             {
                 "node_props": {
                     "Person": [
@@ -497,6 +511,7 @@ def mock_import(
                 "rel_props": {},
                 "relationships": [],
             },
+            True,
             (
                 "Node properties:\n"
                 "- **Person**\n"
@@ -508,8 +523,8 @@ def mock_import(
         ),
     ],
 )
-def test_format_schema(description, schema, expected_output):
-    result = _format_schema(schema, is_enhanced=True)
+def test_format_schema(description, schema, is_enhanced, expected_output):
+    result = _format_schema(schema, is_enhanced)
     assert result == expected_output, f"Failed test case: {description}"
 
 

From 9912137356b4295ae06049de05da2877559a7ea1 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Wed, 11 Dec 2024 17:48:14 +0000
Subject: [PATCH 7/9] More refactoring + minor tests added

---
 .../unit_tests/graphs/test_neo4j_graph.py     | 30 +++++++++++++++++--
 1 file changed, 27 insertions(+), 3 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index 02e8dad..7a353bc 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -5,6 +5,7 @@
 import pytest
 
 from langchain_neo4j.graphs.neo4j_graph import (
+    LIST_LIMIT,
     Neo4jGraph,
     _format_schema,
     value_sanitize,
@@ -32,7 +33,7 @@ def mock_neo4j_driver() -> Generator[MagicMock, None, None]:
         ),
         (
             "Oversized list",
-            {"key1": "value1", "oversized_list": list(range(150))},
+            {"key1": "value1", "oversized_list": list(range(LIST_LIMIT + 1))},
             {"key1": "value1"},
         ),
         (
@@ -42,17 +43,27 @@ def mock_neo4j_driver() -> Generator[MagicMock, None, None]:
         ),
         (
             "Dict in list",
-            {"key1": "value1", "oversized_list": [1, 2, {"key": list(range(150))}]},
+            {
+                "key1": "value1",
+                "oversized_list": [1, 2, {"key": list(range(LIST_LIMIT + 1))}],
+            },
             {"key1": "value1", "oversized_list": [1, 2, {}]},
         ),
         (
             "Dict in nested list",
             {
                 "key1": "value1",
-                "deeply_nested_lists": [[[[{"final_nested_key": list(range(200))}]]]],
+                "deeply_nested_lists": [
+                    [[[{"final_nested_key": list(range(LIST_LIMIT + 1))}]]]
+                ],
             },
             {"key1": "value1", "deeply_nested_lists": [[[[{}]]]]},
         ),
+        (
+            "Bare oversized list",
+            list(range(LIST_LIMIT + 1)),
+            None,
+        ),
         (
             "None value",
             None,
@@ -99,6 +110,19 @@ def test_driver_state_management(mock_neo4j_driver: MagicMock) -> None:
         graph.refresh_schema()
 
 
+def test_neo4j_graph_del_method(mock_neo4j_driver: MagicMock) -> None:
+    """Test the __del__ method."""
+    with patch.object(Neo4jGraph, "close") as mock_close:
+        graph = Neo4jGraph(
+            url="bolt://localhost:7687", username="neo4j", password="password"
+        )
+        # Ensure exceptions are suppressed when the graph's destructor is called
+        mock_close.side_effect = Exception()
+        mock_close.assert_not_called()
+        graph.__del__()
+        mock_close.assert_called_once()
+
+
 def test_close_method_removes_driver(mock_neo4j_driver: MagicMock) -> None:
     """Test that close method removes the _driver attribute."""
     graph = Neo4jGraph(

From 551b03f6c6136f69f843ba4c228e64db9fa60ad7 Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Thu, 12 Dec 2024 17:22:36 +0000
Subject: [PATCH 8/9] Neo4jGraph 100% coverage

---
 .../langchain_neo4j/graphs/neo4j_graph.py     |   2 +-
 .../integration_tests/graphs/test_neo4j.py    |  41 ++++-
 .../unit_tests/graphs/test_neo4j_graph.py     | 151 +++++++++++++++++-
 3 files changed, 184 insertions(+), 10 deletions(-)

diff --git a/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py b/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py
index e6d2428..237c5d5 100644
--- a/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py
+++ b/libs/neo4j/langchain_neo4j/graphs/neo4j_graph.py
@@ -215,7 +215,7 @@ def _format_schema(schema: Dict, is_enhanced: bool) -> str:
             formatted_rel_props.append(f"- **{rel_type}**")
             for prop in properties:
                 example = ""
-                if prop["type"] == "STRING":
+                if prop["type"] == "STRING" and prop.get("values"):
                     if prop.get("distinct_count", 11) > DISTINCT_VALUE_LIMIT:
                         example = (
                             f'Example: "{clean_string_values(prop["values"][0])}"'
diff --git a/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py b/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py
index 3f5c28f..bd47454 100644
--- a/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py
+++ b/libs/neo4j/tests/integration_tests/graphs/test_neo4j.py
@@ -21,6 +21,7 @@
                 source=Node(id="foo", type="foo"),
                 target=Node(id="bar", type="bar"),
                 type="REL",
+                properties={"key": "val"},
             )
         ],
         source=Document(page_content="source document"),
@@ -349,7 +350,16 @@ def test_enhanced_schema() -> None:
                 }
             ],
         },
-        "rel_props": {},
+        "rel_props": {
+            "REL": [
+                {
+                    "distinct_count": 1,
+                    "property": "key",
+                    "type": "STRING",
+                    "values": ["val"],
+                }
+            ]
+        },
         "relationships": [{"start": "foo", "type": "REL", "end": "bar"}],
     }
     # remove metadata portion of schema
@@ -367,16 +377,37 @@ def test_enhanced_schema_exception() -> None:
     assert password is not None
 
     graph = Neo4jGraph(
-        url=url, username=username, password=password, enhanced_schema=True
+        url=url,
+        username=username,
+        password=password,
+        enhanced_schema=True,
+        refresh_schema=False,
     )
     graph.query("MATCH (n) DETACH DELETE n")
-    graph.query("CREATE (:Node {foo:'bar'})," "(:Node {foo: 1}), (:Node {foo: [1,2]})")
+    graph.query(
+        "CREATE (:Node {foo: 'bar'}), (:Node {foo: 1}), (:Node {foo: [1,2]}), "
+        "(: EmptyNode)"
+    )
+    graph.query(
+        "MATCH (a:Node {foo: 'bar'}), (b:Node {foo: 1}), "
+        "(c:Node {foo: [1,2]}), (d: EmptyNode) "
+        "CREATE (a)-[:REL {foo: 'bar'}]->(b), (b)-[:REL {foo: 1}]->(c), "
+        "(c)-[:REL {foo: [1,2]}]->(a), (d)-[:EMPTY_REL {}]->(d)"
+    )
     graph.refresh_schema()
     expected_output = {
         "node_props": {"Node": [{"property": "foo", "type": "STRING"}]},
-        "rel_props": {},
-        "relationships": [],
+        "rel_props": {"REL": [{"property": "foo", "type": "STRING"}]},
+        "relationships": [
+            {
+                "end": "Node",
+                "start": "Node",
+                "type": "REL",
+            },
+            {"end": "EmptyNode", "start": "EmptyNode", "type": "EMPTY_REL"},
+        ],
     }
+
     # remove metadata portion of schema
     del graph.structured_schema["metadata"]
     assert graph.structured_schema == expected_output
diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index 7a353bc..c24df53 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -1,8 +1,9 @@
 from types import ModuleType
-from typing import Generator, Mapping, Sequence, Union
+from typing import Any, Dict, Generator, Mapping, Sequence, Union
 from unittest.mock import MagicMock, patch
 
 import pytest
+from neo4j.exceptions import ClientError, Neo4jError
 
 from langchain_neo4j.graphs.neo4j_graph import (
     LIST_LIMIT,
@@ -71,7 +72,10 @@ def mock_neo4j_driver() -> Generator[MagicMock, None, None]:
         ),
     ],
 )
-def test_value_sanitize(description, input_value, expected_output):
+def test_value_sanitize(
+    description: str, input_value: Dict[str, Any], expected_output: Any
+) -> None:
+    """Test the value_sanitize function."""
     assert (
         value_sanitize(input_value) == expected_output
     ), f"Failed test case: {description}"
@@ -188,6 +192,143 @@ def mock_import(
         assert "Could not import neo4j python package." in str(exc_info.value)
 
 
+def test_neo4j_graph_init_with_empty_credentials() -> None:
+    """Test the __init__ method when no credentials have been provided."""
+    with patch("neo4j.GraphDatabase.driver", autospec=True) as mock_driver:
+        mock_driver_instance = MagicMock()
+        mock_driver.return_value = mock_driver_instance
+        mock_driver_instance.verify_connectivity.return_value = None
+        Neo4jGraph(
+            url="bolt://localhost:7687", username="", password="", refresh_schema=False
+        )
+        mock_driver.assert_called_with("bolt://localhost:7687", auth=None)
+
+
+def test_init_apoc_procedure_not_found(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    """Test an error is raised when APOC is not installed."""
+    with patch("langchain_neo4j.Neo4jGraph.refresh_schema") as mock_refresh_schema:
+        err = ClientError()
+        err.code = "Neo.ClientError.Procedure.ProcedureNotFound"
+        mock_refresh_schema.side_effect = err
+        with pytest.raises(ValueError) as exc_info:
+            Neo4jGraph(url="bolt://localhost:7687", username="", password="")
+        assert "Could not use APOC procedures." in str(exc_info.value)
+
+
+def test_init_refresh_schema_other_err(
+    mock_neo4j_driver: MagicMock,
+) -> None:
+    """Test any other ClientErrors raised when calling refresh_schema in __init__ are
+    re-raised."""
+    with patch("langchain_neo4j.Neo4jGraph.refresh_schema") as mock_refresh_schema:
+        err = ClientError()
+        err.code = "other_error"
+        mock_refresh_schema.side_effect = err
+        with pytest.raises(ClientError) as exc_info:
+            Neo4jGraph(url="bolt://localhost:7687", username="", password="")
+        assert exc_info.value == err
+
+
+def test_query_fallback_execution(mock_neo4j_driver: MagicMock) -> None:
+    """Test the fallback to allow for implicit transactions in query."""
+    err = Neo4jError()
+    err.code = "Neo.DatabaseError.Statement.ExecutionFailed"
+    err.message = "in an implicit transaction"
+    mock_neo4j_driver.execute_query.side_effect = err
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687",
+        username="neo4j",
+        password="password",
+        database="test_db",
+        sanitize=True,
+    )
+    mock_session = MagicMock()
+    mock_result = MagicMock()
+    mock_result.data.return_value = {
+        "key1": "value1",
+        "oversized_list": list(range(LIST_LIMIT + 1)),
+    }
+    mock_session.run.return_value = [mock_result]
+    mock_neo4j_driver.session.return_value.__enter__.return_value = mock_session
+    mock_neo4j_driver.session.return_value.__exit__.return_value = None
+    query = "MATCH (n) RETURN n;"
+    params = {"param1": "value1"}
+    json_data = graph.query(query, params)
+    mock_neo4j_driver.session.assert_called_with(database="test_db")
+    called_args, _ = mock_session.run.call_args
+    called_query = called_args[0]
+    assert called_query.text == query
+    assert called_query.timeout == graph.timeout
+    assert called_args[1] == params
+    assert json_data == [{"key1": "value1"}]
+
+
+def test_refresh_schema_handles_client_error(mock_neo4j_driver: MagicMock) -> None:
+    """Test refresh schema handles a client error which might arise due to a user
+    not having access to schema information."""
+
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687",
+        username="neo4j",
+        password="password",
+        database="test_db",
+    )
+    node_properties = [
+        {
+            "output": {
+                "properties": [{"property": "property_a", "type": "STRING"}],
+                "labels": "LabelA",
+            }
+        }
+    ]
+    relationships_properties = [
+        {
+            "output": {
+                "type": "REL_TYPE",
+                "properties": [{"property": "rel_prop", "type": "STRING"}],
+            }
+        }
+    ]
+    relationships = [
+        {"output": {"start": "LabelA", "type": "REL_TYPE", "end": "LabelB"}},
+        {"output": {"start": "LabelA", "type": "REL_TYPE", "end": "LabelC"}},
+    ]
+
+    # Mock the query method to raise ClientError for constraint and index queries
+    graph.query = MagicMock(  # type: ignore[method-assign]
+        side_effect=[
+            node_properties,
+            relationships_properties,
+            relationships,
+            ClientError("Mock ClientError"),
+        ]
+    )
+    graph.refresh_schema()
+
+    # Assertions
+    # Ensure constraints and indexes are empty due to the ClientError
+    assert graph.structured_schema["metadata"]["constraint"] == []
+    assert graph.structured_schema["metadata"]["index"] == []
+
+    # Ensure the query method was called as expected
+    assert graph.query.call_count == 4
+    graph.query.assert_any_call("SHOW CONSTRAINTS")
+
+
+def test_get_schema(mock_neo4j_driver) -> None:
+    """Tests the get_schema property."""
+    graph = Neo4jGraph(
+        url="bolt://localhost:7687",
+        username="neo4j",
+        password="password",
+        refresh_schema=False
+    )
+    graph.schema = "test"
+    assert graph.get_schema == "test"
+
+
 @pytest.mark.parametrize(
     "description, schema, is_enhanced, expected_output",
     [
@@ -547,7 +688,9 @@ def mock_import(
         ),
     ],
 )
-def test_format_schema(description, schema, is_enhanced, expected_output):
+def test_format_schema(
+    description: str, schema: Dict, is_enhanced: bool, expected_output: str
+) -> None:
     result = _format_schema(schema, is_enhanced)
     assert result == expected_output, f"Failed test case: {description}"
 
@@ -685,7 +828,7 @@ def test_enhanced_schema_cypher_string_exhaustive_false_with_index(
             ]
         }
     }
-    graph.query = MagicMock(return_value=[{"value": ["Single", "Married", "Divorced"]}])
+    graph.query = MagicMock(return_value=[{"value": ["Single", "Married", "Divorced"]}])  # type: ignore[method-assign]
     properties = [{"property": "status", "type": "STRING"}]
     query = graph._enhanced_schema_cypher("Person", properties, exhaustive=False)
     assert "values: ['Single', 'Married', 'Divorced'], distinct_count: 3" in query

From 8f30f9492c25ddcb3196ae7d2ef2b47b04256d8c Mon Sep 17 00:00:00 2001
From: Alex Thomas <alexthomas93@users.noreply.github.com>
Date: Fri, 13 Dec 2024 10:41:35 +0000
Subject: [PATCH 9/9] Fixed linting issues

---
 libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
index c24df53..265af31 100644
--- a/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
+++ b/libs/neo4j/tests/unit_tests/graphs/test_neo4j_graph.py
@@ -317,13 +317,13 @@ def test_refresh_schema_handles_client_error(mock_neo4j_driver: MagicMock) -> No
     graph.query.assert_any_call("SHOW CONSTRAINTS")
 
 
-def test_get_schema(mock_neo4j_driver) -> None:
+def test_get_schema(mock_neo4j_driver: MagicMock) -> None:
     """Tests the get_schema property."""
     graph = Neo4jGraph(
         url="bolt://localhost:7687",
         username="neo4j",
         password="password",
-        refresh_schema=False
+        refresh_schema=False,
     )
     graph.schema = "test"
     assert graph.get_schema == "test"