diff --git a/lightrag/kg/__init__.py b/lightrag/kg/__init__.py
index bbddb2857a..fe3ed9c87b 100644
--- a/lightrag/kg/__init__.py
+++ b/lightrag/kg/__init__.py
@@ -14,6 +14,7 @@
     "NetworkXStorage",
     "Neo4JStorage",
     "PGGraphStorage",
+    "NebulaStorage",
     # "AGEStorage",
     # "MongoGraphStorage",
     # "TiDBGraphStorage",
@@ -55,6 +56,7 @@
     # Graph Storage Implementations
     "NetworkXStorage": [],
     "Neo4JStorage": ["NEO4J_URI", "NEO4J_USERNAME", "NEO4J_PASSWORD"],
+    "NebulaStorage": ["NEBULA_HOSTS", "NEBULA_USER", "NEBULA_PASSWORD", "NEBULA_POOL_SIZE"],
     "MongoGraphStorage": [],
     # "TiDBGraphStorage": ["TIDB_USER", "TIDB_PASSWORD", "TIDB_DATABASE"],
     "AGEStorage": [
@@ -90,6 +92,7 @@
     "NanoVectorDBStorage": ".kg.nano_vector_db_impl",
     "JsonDocStatusStorage": ".kg.json_doc_status_impl",
     "Neo4JStorage": ".kg.neo4j_impl",
+    "NebulaStorage": ".kg.nebula_impl",
     "MilvusVectorDBStorage": ".kg.milvus_impl",
     "MongoKVStorage": ".kg.mongo_impl",
     "MongoDocStatusStorage": ".kg.mongo_impl",
diff --git a/lightrag/kg/nebula_impl.py b/lightrag/kg/nebula_impl.py
new file mode 100644
index 0000000000..57b9716774
--- /dev/null
+++ b/lightrag/kg/nebula_impl.py
@@ -0,0 +1,928 @@
+import asyncio
+import configparser
+import inspect
+import logging
+import os
+import re
+from dataclasses import dataclass
+from typing import final
+
+from tenacity import (
+    retry,
+    stop_after_attempt,
+    wait_exponential,
+    retry_if_exception_type,
+)
+
+from ..utils import logger
+from ..base import BaseGraphStorage
+from ..types import KnowledgeGraph, KnowledgeGraphNode, KnowledgeGraphEdge
+
+import pipmaster as pm
+
+if not pm.is_installed("nebula3-python"):
+    pm.install("nebula3-python")
+
+from nebula3.gclient.net import ConnectionPool  # type: ignore
+from nebula3.Config import Config  # type: ignore
+from nebula3.Exception import IOErrorException, AuthFailedException  # type: ignore
+
+config = configparser.ConfigParser()
+config.read("config.ini", "utf-8")
+
+# Maximum number of graph nodes returned by get_knowledge_graph, default 1000
+MAX_GRAPH_NODES = int(os.getenv("MAX_GRAPH_NODES", 1000))
+
+# Set the nebula3 logger level to ERROR to suppress warning logs
+logging.getLogger("nebula3").setLevel(logging.ERROR)
+
+
+@final
+@dataclass
+class NebulaStorage(BaseGraphStorage):
+    def __init__(self, namespace, global_config, embedding_func):
+        super().__init__(
+            namespace=namespace,
+            global_config=global_config,
+            embedding_func=embedding_func,
+        )
+        self._connection_pool = None
+        self._connection_pool_lock = asyncio.Lock()
+        # Nebula space names may only contain alphanumerics and underscores
+        self._space_name = re.sub(r"[^a-zA-Z0-9_]", "_", namespace)
+
+        # Nebula configuration
+        host, port = os.environ.get(
+            "NEBULA_HOSTS", config.get("nebula", "hosts", fallback="127.0.0.1:9669")
+        ).split(":")
+        self.USERNAME = os.environ.get(
+            "NEBULA_USER", config.get("nebula", "user", fallback="root")
+        )
+        self.PASSWORD = os.environ.get(
+            "NEBULA_PASSWORD", config.get("nebula", "password", fallback="nebula")
+        )
+        pool_size = int(
+            os.environ.get(
+                "NEBULA_POOL_SIZE",
+                config.get("nebula", "pool_size", fallback=10),
+            )
+        )
+
+        # Initialize connection pool
+        pool_config = Config()
+        pool_config.max_connection_pool_size = pool_size
+        self._connection_pool = ConnectionPool()
+
+        # Try to connect to Nebula and make sure the space and schema exist
+        try:
+            self._connection_pool.init([(host, int(port))], pool_config)
+
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                result = session.execute("SHOW SPACES").as_data_frame()
+                spaces = [row[0] for _, row in result.iterrows()]
+
+                if self._space_name not in spaces:
+                    logger.info(f"Space {self._space_name} not found, creating...")
+                    # Create space with a fixed-string vid type; note that a
+                    # newly created space may need a couple of heartbeat
+                    # cycles before it becomes usable
+                    session.execute(
+                        f"CREATE SPACE IF NOT EXISTS {self._space_name} "
+                        f"(vid_type=FIXED_STRING(256))"
+                    )
+                    session.execute(f"USE {self._space_name}")
+                    logger.info(f"Space {self._space_name} created successfully")
+                else:
+                    session.execute(f"USE {self._space_name}")
+                    logger.info(f"Connected to space {self._space_name}")
+
+                # Create the tag and edge types used by LightRAG
+                session.execute(
+                    "CREATE TAG IF NOT EXISTS base ("
+                    "entity_id string, entity_type string, description string, "
+                    "source_id string, file_path string);"
+                )
+                session.execute(
+                    "CREATE EDGE IF NOT EXISTS DIRECTED ("
+                    "weight float, description string, keywords string, "
+                    "source_id string, file_path string)"
+                )
+        except (IOErrorException, AuthFailedException) as e:
+            logger.error(f"Failed to connect to Nebula Graph: {str(e)}")
+            raise
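+
+    # Example configuration (illustrative values only). Each setting can come
+    # from an environment variable or from a [nebula] section in config.ini:
+    #
+    #   NEBULA_HOSTS=127.0.0.1:9669
+    #   NEBULA_USER=root
+    #   NEBULA_PASSWORD=nebula
+    #   NEBULA_POOL_SIZE=10
+    #
+    #   [nebula]
+    #   hosts = 127.0.0.1:9669
+    #   user = root
+    #   password = nebula
+    #   pool_size = 10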
{self._space_name}") + result = session.execute("SHOW SPACES").as_data_frame() + spaces = [row[0] for _,row in result.iterrows()] + + if self._space_name not in spaces: + logger.info(f"Space {self._space_name} not found, creating...") + # Create space with default schema + session.execute(f"CREATE SPACE IF NOT EXISTS {self._space_name} (vid_type=FIXED_STRING(256))") + session.execute(f"USE {self._space_name}") # Create tag and edge types + + logger.info(f"Space {self._space_name} created successfully") + else: + session.execute(f"USE {self._space_name}") + logger.info(f"Connected to space {self._space_name}") + session.execute(" CREATE TAG IF NOT EXISTS base ( entity_id string, entity_type string, description string, source_id string, file_path string);") + session.execute("CREATE EDGE IF NOT EXISTS DIRECTED(weight float, description string,keywords string ,source_id string ,file_path string) ") + + except (IOErrorException, AuthFailedException) as e: + logger.error(f"Failed to connect to Nebula Graph: {str(e)}") + raise + + def __post_init__(self): + self._node_embed_algorithms = { + "node2vec": self._node2vec_embed, + } + + async def close(self): + """Close the Nebula connection pool""" + if self._connection_pool: + self._connection_pool.close() + self._connection_pool = None + + async def __aexit__(self, exc_type, exc, tb): + """Ensure connection pool is closed when context manager exits""" + await self.close() + + async def index_done_callback(self) -> None: + # Nebula handles persistence automatically + pass + + async def has_node(self, node_id: str) -> bool: + """ + Check if a node with the given label exists in the database + + Args: + node_id: Label of the node to check + + Returns: + bool: True if node exists, False otherwise + + Raises: + ValueError: If node_id is invalid + Exception: If there is an error executing the query + """ + async with self._connection_pool_lock: + with self._connection_pool.session_context( + self.USERNAME, self.PASSWORD + ) as session: + try: + session.execute(f"USE {self._space_name}") + query = f""" MATCH (n) + WHERE id(n) == '{node_id}' return count(n) as icount """ + result = session.execute(query) + return result.is_succeeded() and len(result.as_data_frame())> 0 + except Exception as e: + logger.error(f"Error checking node existence for {node_id}: {str(e)}") + raise + + + async def has_edge(self, source_node_id: str, target_node_id: str) -> bool: + """ + Check if an edge exists between two nodes + + Args: + source_node_id: Label of the source node + target_node_id: Label of the target node + + Returns: + bool: True if edge exists, False otherwise + + Raises: + ValueError: If either node_id is invalid + Exception: If there is an error executing the query + """ + async with self._connection_pool_lock: + with self._connection_pool.session_context( + self.USERNAME, self.PASSWORD + ) as session: + try: + session.execute(f"USE {self._space_name}") + query = f''' MATCH (src)-[r]-(neighbor) + WHERE id(src) =='{source_node_id}' AND id(neighbor)=='{target_node_id}' + RETURN count(r) as icount + ''' + result = session.execute(query) + return result.is_succeeded() and len(result.as_data_frame()) > 0 + except Exception as e: + logger.error( + f"Error checking edge existence between {source_node_id} and {target_node_id}: {str(e)}" + ) + raise + + async def get_node(self, node_id: str) -> dict[str, str] | None: + """Get node by its label identifier, return only node properties + + Args: + node_id: The node label to look up + + Returns: + dict: Node properties if 
+
+    async def get_nodes_batch(self, node_ids: list[str]) -> dict[str, dict]:
+        """Retrieve multiple nodes in one query.
+
+        Args:
+            node_ids: List of node entity IDs to fetch.
+
+        Returns:
+            A dictionary mapping each found node_id to its node data.
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                # repr() of a Python list of strings is also a valid nGQL
+                # list literal, e.g. ['node1', 'node2']
+                query = f"""
+                    MATCH (n:base)
+                    WHERE id(n) IN {node_ids}
+                    RETURN id(n) AS entity_id, properties(n) AS props
+                """
+                result = session.execute(query).as_data_frame()
+                nodes = {}
+                for _, record in result.iterrows():
+                    entity_id = record["entity_id"]
+                    node_dict = dict(record["props"])
+                    # Remove the 'base' label if present in a 'labels' property
+                    if "labels" in node_dict:
+                        node_dict["labels"] = [
+                            label for label in node_dict["labels"] if label != "base"
+                        ]
+                    nodes[entity_id] = node_dict
+                return nodes
+
+    async def node_degree(self, node_id: str) -> int:
+        """Get the degree (number of relationships) of a node with the given label.
+        If no node is found, returns 0.
+
+        Args:
+            node_id: The label of the node
+
+        Returns:
+            int: The number of relationships the node has, or 0 if no node found
+
+        Raises:
+            Exception: If there is an error executing the query
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                query = (
+                    f"MATCH (v:base)-[r]-(n) WHERE id(v) == '{node_id}' "
+                    "RETURN count(r) AS degree"
+                )
+                try:
+                    result = session.execute(query).as_data_frame()
+                    return int(result["degree"][0]) if len(result) > 0 else 0
+                except Exception as e:
+                    logger.error(f"Error getting node degree for {node_id}: {str(e)}")
+                    raise
+
+    async def node_degrees_batch(self, node_ids: list[str]) -> dict[str, int]:
+        """Retrieve the degree for multiple nodes in a single query.
+
+        Args:
+            node_ids: List of node labels (entity_id values) to look up.
+
+        Returns:
+            A dictionary mapping each node_id to its degree (number of
+            relationships). If a node is not found, its degree is set to 0.
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                query = f"""
+                    MATCH (v:base)-[r]-(n)
+                    WHERE id(v) IN {node_ids}
+                    RETURN id(v) AS entity_id, count(r) AS degree;
+                """
+                result = session.execute(query).as_data_frame()
+                degrees = {}
+                for _, record in result.iterrows():
+                    degrees[record["entity_id"]] = int(record["degree"])
+
+                # For any node_id that did not return a record, set degree to 0
+                for nid in node_ids:
+                    if nid not in degrees:
+                        logger.warning(f"No node found with label '{nid}'")
+                        degrees[nid] = 0
+
+                logger.debug(f"nebula batch node degree query returned: {degrees}")
+                return degrees
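+
+    # A brief illustration (hypothetical data): for
+    #   await storage.node_degrees_batch(["Alice", "Bob"])
+    # the generated filter is  id(v) IN ['Alice', 'Bob']  and the result is
+    # e.g. {"Alice": 3, "Bob": 0} when "Bob" has no relationships.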
+ """ + async with self._connection_pool_lock: + with self._connection_pool.session_context( + self.USERNAME, self.PASSWORD + ) as session: + session.execute(f"USE {self._space_name}") + query = f""" + + MATCH (v:base)-[r]-(n) + WHERE id(v) in '{node_ids}' + RETURN id(v) AS entity_id,count(r) AS degree; + """ + result = session.execute(query).as_data_frame() + degrees = {} + for _,record in result.iterrows(): + entity_id = record["entity_id"] + degrees[entity_id] = record["degree"] + + + # For any node_id that did not return a record, set degree to 0. + for nid in node_ids: + if nid not in degrees: + logger.warning(f"No node found with label '{nid}'") + degrees[nid] = 0 + + logger.debug(f"nebular batch node degree query returned: {degrees}") + return degrees + + async def edge_degree(self, src_id: str, tgt_id: str) -> int: + """Get the total degree (sum of relationships) of two nodes. + + Args: + src_id: Label of the source node + tgt_id: Label of the target node + + Returns: + int: Sum of the degrees of both nodes + """ + src_degree = await self.node_degree(src_id) + trg_degree = await self.node_degree(tgt_id) + return src_degree + trg_degree + + async def edge_degrees_batch( + self, edge_pairs: list[tuple[str, str]] + ) -> dict[tuple[str, str], int]: + """ + Calculate the combined degree for each edge (sum of the source and target node degrees) + in batch using the already implemented node_degrees_batch. + + Args: + edge_pairs: List of (src, tgt) tuples. + + Returns: + A dictionary mapping each (src, tgt) tuple to the sum of their degrees. + """ + # Collect unique node IDs from all edge pairs. + unique_node_ids = {src for src, _ in edge_pairs} + unique_node_ids.update({tgt for _, tgt in edge_pairs}) + + # Get degrees for all nodes in one go. + degrees = await self.node_degrees_batch(list(unique_node_ids)) + + # Sum up degrees for each edge pair. + edge_degrees = {} + for src, tgt in edge_pairs: + edge_degrees[(src, tgt)] = degrees.get(src, 0) + degrees.get(tgt, 0) + return edge_degrees + + async def get_edge( + self, source_node_id: str, target_node_id: str + ) -> dict[str, str] | None: + """Get edge properties between two nodes. + + Args: + source_node_id: Label of the source node + target_node_id: Label of the target node + + Returns: + dict: Edge properties if found, default properties if not found or on error + + Raises: + ValueError: If either node_id is invalid + Exception: If there is an error executing the query + """ + async with self._connection_pool_lock: + with self._connection_pool.session_context( + self.USERNAME, self.PASSWORD + ) as session: + session.execute(f"USE {self._space_name}") + query = f''' MATCH (src)-[r]-(neighbor) + WHERE id(src) =='{source_node_id}' AND id(neighbor)=='{target_node_id}' + RETURN properties(r) as edge_properties + ''' + result = session.execute(query).as_data_frame() + + if len(result) > 1: + logger.warning( + f"Multiple edges found between '{source_node_id}' and '{target_node_id}'. Using first edge." 
+
+    async def get_edges_batch(
+        self, pairs: list[dict[str, str]]
+    ) -> dict[tuple[str, str], dict]:
+        """Retrieve edge properties for multiple (src, tgt) pairs in one query.
+
+        Args:
+            pairs: List of dictionaries, e.g. [{"src": "node1", "tgt": "node2"}, ...]
+
+        Returns:
+            A dictionary mapping (src, tgt) tuples to their edge properties.
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                # Build one OR-ed condition covering every requested pair;
+                # the base condition must be false, otherwise every edge in
+                # the space would match
+                s_condition = ""
+                for adata in pairs:
+                    asrc = adata["src"]
+                    atgt = adata["tgt"]
+                    s_condition += (
+                        f" or (id(start) == '{asrc}' and id(end) == '{atgt}')"
+                    )
+
+                query = f"""
+                    MATCH (start:base)-[r:DIRECTED]-(end:base)
+                    WHERE 1 == 2 {s_condition}
+                    RETURN id(start) AS src_id, id(end) AS tgt_id, properties(r) AS edge_props
+                """
+                result = session.execute(query).as_data_frame()
+                edges_dict = {}
+                for _, record in result.iterrows():
+                    src = record["src_id"]
+                    tgt = record["tgt_id"]
+                    # properties(r) yields one property map per matched edge;
+                    # if the same pair matches several edges the last one wins
+                    edge_props = dict(record["edge_props"]) if record["edge_props"] else {}
+                    # Ensure required keys exist with defaults
+                    for key, default in {
+                        "weight": 0.0,
+                        "source_id": None,
+                        "description": None,
+                        "keywords": None,
+                    }.items():
+                        edge_props.setdefault(key, default)
+                    edges_dict[(src, tgt)] = edge_props
+
+                # Pairs for which no edge was found get default properties
+                for adata in pairs:
+                    key = (adata["src"], adata["tgt"])
+                    if key not in edges_dict:
+                        edges_dict[key] = {
+                            "weight": 0.0,
+                            "source_id": None,
+                            "description": None,
+                            "keywords": None,
+                        }
+
+                return edges_dict
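+
+    # For pairs=[{"src": "a", "tgt": "b"}] the generated WHERE clause reads
+    # (illustrative):  1 == 2 or (id(start) == 'a' and id(end) == 'b')
+    # i.e. a false base condition OR-ed with one clause per requested pair.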
+
+    async def get_node_edges(self, source_node_id: str) -> list[tuple[str, str]] | None:
+        """Retrieves all edges (relationships) for a particular node identified by its label.
+
+        Args:
+            source_node_id: Label of the node to get edges for
+
+        Returns:
+            list[tuple[str, str]]: List of (source_label, target_label) tuples representing edges
+            None: If no edges found
+
+        Raises:
+            Exception: If there is an error executing the query
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                try:
+                    session.execute(f"USE {self._space_name}")
+                    query = (
+                        f"MATCH (n:base)-[r]-(connected:base) "
+                        f"WHERE id(n) == '{source_node_id}' "
+                        "AND connected.entity_id IS NOT NULL "
+                        "RETURN n, r, connected"
+                    )
+                    results = session.execute(query).as_data_frame()
+
+                    edges = []
+                    for _, record in results.iterrows():
+                        source_node = record["n"]
+                        connected_node = record["connected"]
+
+                        # Skip if either node is None
+                        if not source_node or not connected_node:
+                            continue
+
+                        source_label = source_node.get("entity_id") or None
+                        target_label = connected_node.get("entity_id") or None
+
+                        if source_label and target_label:
+                            edges.append((source_label, target_label))
+
+                    return edges
+                except Exception as e:
+                    logger.error(
+                        f"Error getting edges for node {source_node_id}: {str(e)}"
+                    )
+                    raise
+
+    async def get_nodes_edges_batch(
+        self, node_ids: list[str]
+    ) -> dict[str, list[tuple[str, str]]]:
+        """Batch retrieve edges for multiple nodes in one query.
+        For each node, returns both outgoing and incoming edges to properly
+        represent the undirected graph nature.
+
+        Args:
+            node_ids: List of node IDs (entity_id) for which to retrieve edges.
+
+        Returns:
+            A dictionary mapping each node ID to its list of edge tuples
+            (source, target). For each node, the list includes both:
+            - Outgoing edges: (queried_node, connected_node)
+            - Incoming edges: (connected_node, queried_node)
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                # Query both outgoing and incoming edges in a single pass
+                session.execute(f"USE {self._space_name}")
+                query = f"""
+                    MATCH (n:base)-[r]-(connected:base)
+                    WHERE id(n) IN {node_ids}
+                    RETURN id(n) AS queried_id,
+                           id(connected) AS connected_entity_id,
+                           src(r) AS start_entity_id
+                """
+                result = session.execute(query).as_data_frame()
+
+                # Initialize the dictionary with empty lists for each node ID
+                edges_dict = {node_id: [] for node_id in node_ids}
+
+                # Process results to include both outgoing and incoming edges
+                for _, record in result.iterrows():
+                    queried_id = record["queried_id"]
+                    connected_entity_id = record["connected_entity_id"]
+                    start_entity_id = record["start_entity_id"]
+
+                    # Skip if either node is None
+                    if not queried_id or not connected_entity_id:
+                        continue
+
+                    # If the edge starts at the queried node it is outgoing,
+                    # otherwise it is incoming
+                    if start_entity_id == queried_id:
+                        edges_dict[queried_id].append(
+                            (queried_id, connected_entity_id)
+                        )
+                    else:
+                        edges_dict[queried_id].append(
+                            (connected_entity_id, queried_id)
+                        )
+
+                return edges_dict
+
+    @retry(
+        stop=stop_after_attempt(3),
+        wait=wait_exponential(multiplier=1, min=4, max=10),
+        retry=retry_if_exception_type((IOErrorException,)),
+    )
+    async def upsert_node(self, node_id: str, node_data: dict[str, str]) -> None:
+        """Upsert a node in the Nebula database.
+
+        Args:
+            node_id: The unique identifier for the node (used as vid)
+            node_data: Dictionary of node properties
+        """
+        if "entity_id" not in node_data:
+            raise ValueError("Node properties must contain an 'entity_id' field")
+        # repr() renders Python strings as single-quoted literals, which nGQL accepts
+        fields = ", ".join(f"{k}" for k in node_data)
+        properties = ", ".join(f"{repr(v)}" for v in node_data.values())
+
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                # A plain INSERT VERTEX overwrites the properties of an
+                # existing vertex, giving upsert semantics; IF NOT EXISTS
+                # would skip existing vertices instead of updating them
+                query = (
+                    f"INSERT VERTEX base({fields}) "
+                    f"VALUES '{node_id}':({properties})"
+                )
+                session.execute(query)
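+
+    # For node_data={"entity_id": "Alice", "description": "a person"} the
+    # generated statement is (illustrative):
+    #   INSERT VERTEX base(entity_id, description) VALUES 'Alice':('Alice', 'a person')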
+
+    @retry(
+        stop=stop_after_attempt(3),
+        wait=wait_exponential(multiplier=1, min=4, max=10),
+        retry=retry_if_exception_type((IOErrorException,)),
+    )
+    async def upsert_edge(
+        self, source_node_id: str, target_node_id: str, edge_data: dict[str, str]
+    ) -> None:
+        """Upsert an edge and its properties between two nodes identified by their vids.
+
+        Args:
+            source_node_id (str): Label of the source node (used as identifier)
+            target_node_id (str): Label of the target node (used as identifier)
+            edge_data (dict): Dictionary of properties to set on the edge
+        """
+        fields = ", ".join(f"{k}" for k in edge_data)
+        properties = ", ".join(f"{repr(v)}" for v in edge_data.values())
+
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                # Nebula edges carry a rank (0 by default); as with vertices,
+                # a plain INSERT EDGE overwrites an existing edge's properties
+                query = (
+                    f"INSERT EDGE DIRECTED({fields}) "
+                    f"VALUES '{source_node_id}' -> '{target_node_id}'@0:({properties})"
+                )
+                session.execute(query)
+
+    async def get_knowledge_graph(
+        self,
+        node_label: str,
+        max_depth: int = 3,
+        max_nodes: int = MAX_GRAPH_NODES,
+    ) -> KnowledgeGraph:
+        """Retrieve a connected subgraph of nodes where the label includes the
+        specified `node_label`.
+
+        Args:
+            node_label: Label of the starting node; * means all nodes
+            max_depth: Maximum depth of the subgraph, defaults to 3
+            max_nodes: Maximum number of nodes to return, defaults to 1000
+
+        Returns:
+            KnowledgeGraph object containing nodes and edges, with an
+            is_truncated flag indicating whether the graph was truncated
+            because of the max_nodes limit
+        """
+        result = KnowledgeGraph()
+        seen_nodes = set()
+        seen_edges = set()
+
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+
+                if node_label == "*":
+                    # id(n) >= '' matches every string vid, i.e. all nodes
+                    query = (
+                        f"MATCH (n:base) "
+                        f"WHERE id(n) >= '' "
+                        f"RETURN id(n) AS id, properties(n) AS props "
+                        f"LIMIT {max_nodes}"
+                    )
+                else:
+                    # Start from the specific node
+                    query = (
+                        f"MATCH (n) WHERE id(n) == '{node_label}' "
+                        f"RETURN id(n) AS id, properties(n) AS props "
+                        f"LIMIT {max_nodes}"
+                    )
+
+                try:
+                    result_set = session.execute(query).as_data_frame()
+
+                    # Process nodes from the direct query
+                    matched_ids = []
+                    for _, row in result_set.iterrows():
+                        node_id = row["id"]
+                        props = row["props"]
+                        matched_ids.append(node_id)
+                        if node_id not in seen_nodes:
+                            result.nodes.append(
+                                KnowledgeGraphNode(
+                                    id=node_id,
+                                    labels=[node_id],
+                                    properties=props,
+                                )
+                            )
+                            seen_nodes.add(node_id)
+
+                    # Expand up to max_depth hops around the matched nodes
+                    neighbors_query = f"""
+                        MATCH (src)-[e*1..{max_depth}]-(neighbor)
+                        WHERE id(src) IN {matched_ids}
+                        RETURN DISTINCT id(neighbor) AS id, properties(neighbor) AS props
+                        LIMIT {max_nodes - len(matched_ids)}
+                    """
+                    result_set = session.execute(neighbors_query).as_data_frame()
+
+                    for _, row in result_set.iterrows():
+                        node_id = row["id"]
+                        if node_id not in seen_nodes:
+                            result.nodes.append(
+                                KnowledgeGraphNode(
+                                    id=node_id,
+                                    labels=[node_id],
+                                    properties=row["props"],
+                                )
+                            )
+                            seen_nodes.add(node_id)
+
+                    # Process edges between the collected nodes; a Python set
+                    # would not format as a valid nGQL list, so use a list
+                    edge_query = f"""
+                        MATCH (src)-[e]->(neighbor)
+                        WHERE id(src) IN {list(seen_nodes)} AND id(neighbor) IN {list(seen_nodes)}
+                        RETURN DISTINCT id(src) AS srcId, id(neighbor) AS destId,
+                               properties(e) AS edgeProps, type(e) AS edgeType
+                    """
+                    result_set = session.execute(edge_query).as_data_frame()
+                    for _, row in result_set.iterrows():
+                        edge_id = f"{row['srcId']}-{row['destId']}-{row['edgeType']}"
+                        if edge_id not in seen_edges:
+                            result.edges.append(
+                                KnowledgeGraphEdge(
+                                    id=edge_id,
+                                    type=row["edgeType"],
+                                    source=row["srcId"],
+                                    target=row["destId"],
+                                    properties=row["edgeProps"],
+                                )
+                            )
+                            seen_edges.add(edge_id)
+
+                    # Flag truncation when the node budget was exhausted
+                    if len(result.nodes) >= max_nodes:
+                        result.is_truncated = True
+
+                    logger.info(
+                        f"Graph query return: {len(result.nodes)} nodes, {len(result.edges)} edges"
+                    )
+                except Exception as e:
+                    logger.error(f"Error executing graph query: {str(e)}")
+                    raise
+
+        return result
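+
+    # Shape of the returned object (hypothetical data): node labels carry the
+    # vertex id, and edge ids are "src-dst-type" strings, e.g.
+    #   KnowledgeGraphNode(id="Alice", labels=["Alice"], properties={...})
+    #   KnowledgeGraphEdge(id="Alice-Bob-DIRECTED", type="DIRECTED",
+    #                      source="Alice", target="Bob", properties={...})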
+
+    async def get_all_labels(self) -> list[str]:
+        """Get all existing node labels in the database
+
+        Returns:
+            ["Person", "Company", ...] # Alphabetically sorted label list
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                query = "MATCH (n:base) RETURN id(n) AS label ORDER BY label"
+                result = session.execute(query).as_data_frame()
+                return [row["label"] for _, row in result.iterrows()]
+
+    @retry(
+        stop=stop_after_attempt(3),
+        wait=wait_exponential(multiplier=1, min=4, max=10),
+        retry=retry_if_exception_type((IOErrorException,)),
+    )
+    async def delete_node(self, node_id: str) -> None:
+        """Delete a node with the specified label
+
+        Args:
+            node_id: The label of the node to delete
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                query = f"DELETE VERTEX '{node_id}'"
+                session.execute(query)
+
+    @retry(
+        stop=stop_after_attempt(3),
+        wait=wait_exponential(multiplier=1, min=4, max=10),
+        retry=retry_if_exception_type((IOErrorException,)),
+    )
+    async def remove_nodes(self, nodes: list[str]):
+        """Delete multiple nodes
+
+        Args:
+            nodes: List of node labels to be deleted
+        """
+        # delete_node() takes the pool lock itself; acquiring it here as well
+        # would deadlock, because asyncio.Lock is not reentrant
+        for node in nodes:
+            await self.delete_node(node)
+
+    @retry(
+        stop=stop_after_attempt(3),
+        wait=wait_exponential(multiplier=1, min=4, max=10),
+        retry=retry_if_exception_type((IOErrorException,)),
+    )
+    async def remove_edges(self, edges: list[tuple[str, str]]):
+        """Delete multiple edges
+
+        Args:
+            edges: List of edges to be deleted, each edge is a (source, target) tuple
+        """
+        async with self._connection_pool_lock:
+            with self._connection_pool.session_context(
+                self.USERNAME, self.PASSWORD
+            ) as session:
+                session.execute(f"USE {self._space_name}")
+                for source, target in edges:
+                    # Nebula requires the edge type to delete specific edges
+                    query = f"DELETE EDGE DIRECTED '{source}' -> '{target}'@0"
+                    session.execute(query)
+
+    async def drop(self) -> dict[str, str]:
+        """Drop all data from storage and clean up resources
+
+        This method drops the whole Nebula space, deleting all nodes and
+        relationships in it.
+
+        Returns:
+            dict[str, str]: Operation status and message
+            - On success: {"status": "success", "message": "data dropped"}
+            - On failure: {"status": "error", "message": "<error message>"}
+        """
+        try:
+            async with self._connection_pool_lock:
+                with self._connection_pool.session_context(
+                    self.USERNAME, self.PASSWORD
+                ) as session:
+                    # Drop the space, removing all nodes and relationships
+                    session.execute(f"USE {self._space_name}")
+                    query = f"DROP SPACE {self._space_name}"
+                    session.execute(query)
+                    logger.info(
+                        f"Process {os.getpid()} drop nebula space {self._space_name}"
+                    )
+                    return {"status": "success", "message": "data dropped"}
+        except Exception as e:
+            logger.error(f"Error dropping nebula space {self._space_name}: {e}")
+            return {"status": "error", "message": str(e)}