import os from langchain_core.documents import Document from langchain_community.graphs import Neo4jGraph from langchain_community.graphs.graph_document import GraphDocument, Node, Relationship from langchain_community.graphs.neo4j_graph import ( BASE_ENTITY_LABEL, node_properties_query, rel_properties_query, rel_query, ) test_data = [ GraphDocument( nodes=[Node(id="foo", type="foo"), Node(id="bar", type="bar")], relationships=[ Relationship( source=Node(id="foo", type="foo"), target=Node(id="bar", type="bar"), type="REL", ) ], source=Document(page_content="source document"), ) ] def test_cypher_return_correct_schema() -> None: """Test that chain returns direct results.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph( url=url, username=username, password=password, ) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Create two nodes and a relationship graph.query( """ CREATE (la:LabelA {property_a: 'a'}) CREATE (lb:LabelB) CREATE (lc:LabelC) MERGE (la)-[:REL_TYPE]-> (lb) MERGE (la)-[:REL_TYPE {rel_prop: 'abc'}]-> (lc) """ ) # Refresh schema information graph.refresh_schema() node_properties = graph.query( node_properties_query, params={"EXCLUDED_LABELS": [BASE_ENTITY_LABEL]} ) relationships_properties = graph.query( rel_properties_query, params={"EXCLUDED_LABELS": [BASE_ENTITY_LABEL]} ) relationships = graph.query( rel_query, params={"EXCLUDED_LABELS": [BASE_ENTITY_LABEL]} ) expected_node_properties = [ { "output": { "properties": [{"property": "property_a", "type": "STRING"}], "labels": "LabelA", } } ] expected_relationships_properties = [ { "output": { "type": "REL_TYPE", "properties": [{"property": "rel_prop", "type": "STRING"}], } } ] expected_relationships = [ {"output": {"start": "LabelA", "type": "REL_TYPE", "end": "LabelB"}}, {"output": {"start": "LabelA", "type": "REL_TYPE", "end": "LabelC"}}, ] assert node_properties == expected_node_properties assert relationships_properties == expected_relationships_properties # Order is not guaranteed with Neo4j returns assert ( sorted(relationships, key=lambda x: x["output"]["end"]) == expected_relationships ) def test_neo4j_timeout() -> None: """Test that neo4j uses the timeout correctly.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, timeout=0.1) try: graph.query("UNWIND range(0,100000,1) AS i MERGE (:Foo {id:i})") except Exception as e: assert ( e.code # type: ignore[attr-defined] == "Neo.ClientError.Transaction.TransactionTimedOutClientConfiguration" ) def test_neo4j_sanitize_values() -> None: """Test that neo4j uses the timeout correctly.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, sanitize=True) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Create two nodes and a relationship graph.query( """ CREATE (la:LabelA {property_a: 'a'}) CREATE (lb:LabelB) CREATE (lc:LabelC) MERGE (la)-[:REL_TYPE]-> (lb) MERGE (la)-[:REL_TYPE {rel_prop: 'abc'}]-> (lc) """ ) graph.refresh_schema() output = graph.query("RETURN range(0,130,1) AS result") assert output == [{}] def test_neo4j_add_data() -> None: """Test that neo4j correctly import graph document.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, sanitize=True) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Remove all constraints graph.query("CALL apoc.schema.assert({}, {})") graph.refresh_schema() # Create two nodes and a relationship graph.add_graph_documents(test_data) output = graph.query( "MATCH (n) RETURN labels(n) AS label, count(*) AS count ORDER BY label" ) assert output == [{"label": ["bar"], "count": 1}, {"label": ["foo"], "count": 1}] assert graph.structured_schema["metadata"]["constraint"] == [] def test_neo4j_add_data_source() -> None: """Test that neo4j correctly import graph document with source.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, sanitize=True) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Remove all constraints graph.query("CALL apoc.schema.assert({}, {})") graph.refresh_schema() # Create two nodes and a relationship graph.add_graph_documents(test_data, include_source=True) output = graph.query( "MATCH (n) RETURN labels(n) AS label, count(*) AS count ORDER BY label" ) assert output == [ {"label": ["Document"], "count": 1}, {"label": ["bar"], "count": 1}, {"label": ["foo"], "count": 1}, ] assert graph.structured_schema["metadata"]["constraint"] == [] def test_neo4j_add_data_base() -> None: """Test that neo4j correctly import graph document with base_entity.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, sanitize=True) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Remove all constraints graph.query("CALL apoc.schema.assert({}, {})") graph.refresh_schema() # Create two nodes and a relationship graph.add_graph_documents(test_data, baseEntityLabel=True) output = graph.query( "MATCH (n) RETURN apoc.coll.sort(labels(n)) AS label, " "count(*) AS count ORDER BY label" ) assert output == [ {"label": [BASE_ENTITY_LABEL, "bar"], "count": 1}, {"label": [BASE_ENTITY_LABEL, "foo"], "count": 1}, ] assert graph.structured_schema["metadata"]["constraint"] != [] def test_neo4j_add_data_base_source() -> None: """Test that neo4j correctly import graph document with base_entity and source.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, sanitize=True) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Remove all constraints graph.query("CALL apoc.schema.assert({}, {})") graph.refresh_schema() # Create two nodes and a relationship graph.add_graph_documents(test_data, baseEntityLabel=True, include_source=True) output = graph.query( "MATCH (n) RETURN apoc.coll.sort(labels(n)) AS label, " "count(*) AS count ORDER BY label" ) assert output == [ {"label": ["Document"], "count": 1}, {"label": [BASE_ENTITY_LABEL, "bar"], "count": 1}, {"label": [BASE_ENTITY_LABEL, "foo"], "count": 1}, ] assert graph.structured_schema["metadata"]["constraint"] != [] def test_neo4j_filtering_labels() -> None: """Test that neo4j correctly filters excluded labels.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph(url=url, username=username, password=password, sanitize=True) # Delete all nodes in the graph graph.query("MATCH (n) DETACH DELETE n") # Remove all constraints graph.query("CALL apoc.schema.assert({}, {})") graph.query( "CREATE (:`_Bloom_Scene_`)-[:_Bloom_HAS_SCENE_]->(:`_Bloom_Perspective_`)" ) graph.refresh_schema() # Assert both are empty assert graph.structured_schema["node_props"] == {} assert graph.structured_schema["relationships"] == [] def test_driver_config() -> None: """Test that neo4j works with driver config.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph( url=url, username=username, password=password, driver_config={"max_connection_pool_size": 1}, ) graph.query("RETURN 'foo'") def test_enhanced_schema() -> None: """Test that neo4j works with driver config.""" url = os.environ.get("NEO4J_URI") username = os.environ.get("NEO4J_USERNAME") password = os.environ.get("NEO4J_PASSWORD") assert url is not None assert username is not None assert password is not None graph = Neo4jGraph( url=url, username=username, password=password, enhanced_schema=True ) graph.query("MATCH (n) DETACH DELETE n") graph.add_graph_documents(test_data) graph.refresh_schema() expected_output = { "node_props": { "foo": [ { "property": "id", "type": "STRING", "values": ["foo"], "distinct_count": 1, } ], "bar": [ { "property": "id", "type": "STRING", "values": ["bar"], "distinct_count": 1, } ], }, "rel_props": {}, "relationships": [{"start": "foo", "type": "REL", "end": "bar"}], } # remove metadata portion of schema del graph.structured_schema["metadata"] assert graph.structured_schema == expected_output