FalkorDB · gkorland · Mar 10, 2026
diff --git a/api/analyzers/javascript/__init__.py b/api/analyzers/javascript/__init__.py
diff --git a/api/analyzers/javascript/analyzer.py b/api/analyzers/javascript/analyzer.py
@@ -0,0 +1,110 @@
+from pathlib import Path
+from typing import Optional
+
+from multilspy import SyncLanguageServer
+from ...entities.entity import Entity
+from ...entities.file import File
+from ..analyzer import AbstractAnalyzer
+
+import tree_sitter_javascript as tsjs
+from tree_sitter import Language, Node
+
+import logging
+logger = logging.getLogger('code_graph')
+
+
+class JavaScriptAnalyzer(AbstractAnalyzer):
+    """
+    Tree-sitter based analyzer for JavaScript sources.
+
+    Function declarations, class declarations and method definitions are
+    treated as entities. Symbol resolution relies on ``self.resolve`` and
+    ``self.find_parent``, which are not defined in this class and are
+    expected to be provided by ``AbstractAnalyzer``.
+    """
+
+    # tree-sitter node type -> label reported for that entity. Insertion
+    # order is the order returned by get_entity_types().
+    _ENTITY_LABELS = {
+        'function_declaration': "Function",
+        'class_declaration': "Class",
+        'method_definition': "Method",
+    }
+
+    def __init__(self) -> None:
+        """Initialise the base analyzer with the JavaScript grammar."""
+        super().__init__(Language(tsjs.language()))
+
+    def add_dependencies(self, path: Path, files: list[Path]):
+        """Do nothing; this analyzer adds no dependencies."""
+        pass
+
+    def get_entity_label(self, node: Node) -> str:
+        """
+        Return the label ("Function", "Class" or "Method") for an entity node.
+
+        Raises:
+            ValueError: If ``node.type`` is not a supported entity type.
+        """
+        label = self._ENTITY_LABELS.get(node.type)
+        if label is None:
+            raise ValueError(f"Unknown entity type: {node.type}")
+        return label
+
+    def get_entity_name(self, node: Node) -> str:
+        """
+        Return the text of the node's ``name`` field, or '' when it has none.
+
+        Raises:
+            ValueError: If ``node.type`` is not a supported entity type.
+        """
+        if node.type not in self._ENTITY_LABELS:
+            raise ValueError(f"Unknown entity type: {node.type}")
+        name_node = node.child_by_field_name('name')
+        if name_node is None:
+            return ''
+        return name_node.text.decode('utf-8')
+
+    def get_entity_docstring(self, node: Node) -> Optional[str]:
+        """
+        Return the raw text of the comment that directly precedes the entity.
+
+        Only the immediately previous sibling is inspected; ``None`` is
+        returned when it is missing or is not a ``comment`` node.
+
+        Raises:
+            ValueError: If ``node.type`` is not a supported entity type.
+        """
+        if node.type not in self._ENTITY_LABELS:
+            raise ValueError(f"Unknown entity type: {node.type}")
+        previous = node.prev_sibling
+        if previous and previous.type == 'comment':
+            return previous.text.decode('utf-8')
+        return None
+
+    def get_entity_types(self) -> list[str]:
+        """Return a fresh list of the node types extracted as entities."""
+        return list(self._ENTITY_LABELS)
+
+    def add_symbols(self, entity: Entity) -> None:
+        """
+        Record the symbols referenced by ``entity`` on the entity itself.
+
+        * Classes: every ``identifier`` inside a ``class_heritage`` child is
+          added under the key "base_class".
+        * Functions and methods: every captured ``call_expression`` is added
+          under "call", and every identifier captured inside
+          ``formal_parameters`` under "parameters".
+        """
+        node = entity.node
+        if node.type == 'class_declaration':
+            # The `extends` clause is exposed as a `class_heritage` child;
+            # it is independent of the class body, so no body check is done.
+            for child in node.children:
+                if child.type != 'class_heritage':
+                    continue
+                for heritage_child in child.children:
+                    if heritage_child.type == 'identifier':
+                        entity.add_symbol("base_class", heritage_child)
+        elif node.type in ('function_declaration', 'method_definition'):
+            query = self.language.query("(call_expression) @reference.call")
+            captures = query.captures(node)
+            for caller in captures.get('reference.call', []):
+                entity.add_symbol("call", caller)
+            query = self.language.query("(formal_parameters (identifier) @parameter)")
+            captures = query.captures(node)
+            for parameter in captures.get('parameter', []):
+                entity.add_symbol("parameters", parameter)
+
+    def is_dependency(self, file_path: str) -> bool:
+        """Return True when ``file_path`` contains the text "node_modules"."""
+        return "node_modules" in file_path
+
+    def resolve_path(self, file_path: str, path: Path) -> str:
+        """Return ``file_path`` unchanged; ``path`` is not used."""
+        return file_path
+
+    def resolve_type(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, node: Node) -> list[Entity]:
+        """
+        Resolve ``node`` to the class entities that declare it.
+
+        For every ``(file, resolved_node)`` pair produced by ``self.resolve``
+        the ``class_declaration`` found by ``self.find_parent`` is looked up in
+        ``file.entities``; matches are returned in resolution order.
+        """
+        res = []
+        for file, resolved_node in self.resolve(files, lsp, file_path, path, node):
+            type_dec = self.find_parent(resolved_node, ['class_declaration'])
+            if type_dec in file.entities:
+                res.append(file.entities[type_dec])
+        return res
+
+    def resolve_method(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, node: Node) -> list[Entity]:
+        """
+        Resolve a call site to the function/method entities it targets.
+
+        For a ``call_expression`` the lookup is narrowed to the callee: the
+        ``function`` field, or its ``property`` when the callee is a
+        ``member_expression`` (``obj.method()``).
+        """
+        res = []
+        if node.type == 'call_expression':
+            func_node = node.child_by_field_name('function')
+            if func_node and func_node.type == 'member_expression':
+                func_node = func_node.child_by_field_name('property')
+            if func_node:
+                node = func_node
+        for file, resolved_node in self.resolve(files, lsp, file_path, path, node):
+            method_dec = self.find_parent(resolved_node, ['function_declaration', 'method_definition', 'class_declaration'])
+            # A class found first means the target is not a function or method.
+            if method_dec and method_dec.type == 'class_declaration':
+                continue
+            if method_dec in file.entities:
+                res.append(file.entities[method_dec])
+        return res
+
+    def resolve_symbol(self, files: dict[Path, File], lsp: SyncLanguageServer, file_path: Path, path: Path, key: str, symbol: Node) -> list[Entity]:
+        """
+        Dispatch symbol resolution according to the key used in add_symbols.
+
+        "base_class" and "parameters" are resolved as types, "call" as a
+        method.
+
+        Raises:
+            ValueError: If ``key`` is none of the keys above.
+        """
+        if key in ("base_class", "parameters"):
+            return self.resolve_type(files, lsp, file_path, path, symbol)
+        if key == "call":
+            return self.resolve_method(files, lsp, file_path, path, symbol)
+        raise ValueError(f"Unknown key {key}")
diff --git a/api/analyzers/source_analyzer.py b/api/analyzers/source_analyzer.py
@@ -11,6 +11,7 @@
 from .java.analyzer import JavaAnalyzer
 from .python.analyzer import PythonAnalyzer
 from .csharp.analyzer import CSharpAnalyzer
+from .javascript.analyzer import JavaScriptAnalyzer
 
 from multilspy import SyncLanguageServer
 from multilspy.multilspy_config import MultilspyConfig
@@ -26,7 +27,8 @@
     # '.h': CAnalyzer(),
     '.py': PythonAnalyzer(),
     '.java': JavaAnalyzer(),
-    '.cs': CSharpAnalyzer()}
+    '.cs': CSharpAnalyzer(),
+    '.js': JavaScriptAnalyzer()}
 
 class NullLanguageServer:
     def start_server(self):
@@ -143,7 +145,8 @@
             lsps[".cs"] = SyncLanguageServer.create(config, logger, str(path))
         else:
             lsps[".cs"] = NullLanguageServer()
-        with lsps[".java"].start_server(), lsps[".py"].start_server(), lsps[".cs"].start_server():
+        lsps[".js"] = NullLanguageServer()
+        with lsps[".java"].start_server(), lsps[".py"].start_server(), lsps[".cs"].start_server(), lsps[".js"].start_server():
             files_len = len(self.files)
             for i, file_path in enumerate(files):
                 file = self.files[file_path]
@@ -174,7 +177,7 @@
 
     def analyze_sources(self, path: Path, ignore: list[str], graph: Graph) -> None:
         path = path.resolve()
-        files = list(path.rglob("*.java")) + list(path.rglob("*.py")) + list(path.rglob("*.cs"))
+        files = list(path.rglob("*.java")) + list(path.rglob("*.py")) + list(path.rglob("*.cs")) + list(path.rglob("*.js"))
@@ -1,6 +1,7 @@
 from contextlib import nullcontext
 from pathlib import Path
 from typing import Optional
+import os
 from api.entities.entity import Entity
 from api.entities.file import File
@@ -184,6 +185,34 @@
        # Second pass analysis of the source code
        self.second_pass(graph, files, path)
+    def _resolve_and_validate_path(self, user_path: str) -> Path:
+        """
+        Turn a caller-provided path into a resolved path confined to the safe root.
+
+        The safe root comes from the CODE_GRAPH_PROJECTS_ROOT environment
+        variable when it holds a non-empty value, otherwise from the current
+        working directory. Relative paths are interpreted against that root.
+
+        Raises:
+            ValueError: If the resolved path does not lie under the safe root.
+        """
+        configured_root = os.environ.get("CODE_GRAPH_PROJECTS_ROOT")
+        base_dir = (Path(configured_root) if configured_root else Path.cwd()).resolve()
+
+        # Joining an absolute path onto base_dir yields that absolute path
+        # unchanged, so relative and absolute inputs share one expression.
+        candidate = (base_dir / Path(user_path)).resolve()
+
+        try:
+            # relative_to() raises ValueError when candidate escapes base_dir
+            candidate.relative_to(base_dir)
+        except ValueError:
+            logging.error(f"Requested path '{candidate}' is outside of allowed base directory '{base_dir}'")
+            raise ValueError("Requested path is not allowed")
+        else:
+            return candidate
+
    def analyze_local_folder(self, path: str, g: Graph, ignore: Optional[list[str]] = []) -> None:
        """
        Analyze path.
@@ -195,8 +224,11 @@
        logging.info(f"Analyzing local folder {path}")
+        # Resolve and validate the provided path against a safe root
+        safe_path = self._resolve_and_validate_path(path)
+
        # Analyze source files
-        self.analyze_sources(Path(path), ignore, g)
+        self.analyze_sources(safe_path, ignore, g)
        logging.info("Done analyzing path")
@@ -1,6 +1,7 @@
 from contextlib import nullcontext
 from pathlib import Path
 from typing import Optional
+import os
 from api.entities.entity import Entity
 from api.entities.file import File
@@ -21,6 +22,36 @@
 # Configure logging
 logging.basicConfig(level=logging.DEBUG, format='%(filename)s - %(asctime)s - %(levelname)s - %(message)s')
+
+def _get_safe_root() -> Path:
+    """
+    Determine the directory that bounds every analysis request.
+
+    A non-empty CODEGRAPH_ROOT environment variable selects the root; when it
+    is missing or empty the current working directory is used instead. The
+    returned path is always resolved.
+    """
+    configured = os.environ.get("CODEGRAPH_ROOT")
+    root = Path(configured) if configured else Path.cwd()
+    return root.resolve()
+
+
+def _ensure_within_root(requested_path: Path) -> Path:
+    """
+    Resolve the requested path and ensure it resides within the safe root.
+
+    Args:
+        requested_path: Path to validate. It is resolved before the check, so
+            the comparison is made on the final absolute location.
+
+    Returns:
+        The resolved path when it equals the safe root or lies beneath it.
+
+    Raises:
+        ValueError: If the resolved path is outside the allowed root.
+    """
+    safe_root = _get_safe_root()
+    resolved = requested_path.resolve()
+    try:
+        # relative_to() is available on every Python 3 version, so no
+        # AttributeError fallback is required; it raises ValueError when
+        # `resolved` is not located under `safe_root`.
+        resolved.relative_to(safe_root)
+    except ValueError:
+        raise ValueError(f"Path '{resolved}' is outside of the allowed root '{safe_root}'") from None
+    return resolved
+
 # List of available analyzers
 analyzers: dict[str, AbstractAnalyzer] = {
    # '.c': CAnalyzer(),
@@ -195,8 +226,15 @@
        logging.info(f"Analyzing local folder {path}")
+        # Normalize and validate that the path is within the allowed root
+        try:
+            target_path = _ensure_within_root(Path(path))
+        except ValueError as e:
+            logging.error(str(e))
+            raise
+
        # Analyze source files
-        self.analyze_sources(Path(path), ignore, g)
+        self.analyze_sources(target_path, ignore, g)
        logging.info("Done analyzing path")
@@ -213,12 +250,19 @@
        from pygit2.repository import Repository
-        proj_name = Path(path).name
+        # Normalize and validate repository path
+        try:
+            repo_path = _ensure_within_root(Path(path))
+        except ValueError as e:
+            logging.error(str(e))
+            raise
+
+        proj_name = repo_path.name
        graph = Graph(proj_name)
-        self.analyze_local_folder(path, graph, ignore)
+        self.analyze_local_folder(str(repo_path), graph, ignore)
        # Save processed commit hash to the DB
-        repo = Repository(path)
+        repo = Repository(str(repo_path))
        current_commit = repo.walk(repo.head.target).__next__()
        graph.set_graph_commit(current_commit.short_id)
@@ -18,6 +18,7 @@
 from multilspy.multilspy_logger import MultilspyLogger
 import logging
+import os
 # Configure logging
 logging.basicConfig(level=logging.DEBUG, format='%(filename)s - %(asctime)s - %(levelname)s - %(message)s')
@@ -193,10 +194,29 @@
            ignore (List(str)): List of paths to skip
        """
-        logging.info(f"Analyzing local folder {path}")
+        try:
+            base_path = Path(path).resolve(strict=True)
+        except FileNotFoundError:
+            logging.error("Path '%s' does not exist or is not accessible", path)
+            return
+        safe_root = os.environ.get("CODEGRAPH_REPOS_ROOT")
+        if safe_root:
+            try:
+                root_path = Path(safe_root).resolve(strict=True)
+            except FileNotFoundError:
+                logging.error("Configured CODEGRAPH_REPOS_ROOT '%s' does not exist", safe_root)
+                return
+            base_path_str = str(base_path)
+            root_path_str = str(root_path)
+            if not base_path_str.startswith(root_path_str.rstrip(os.sep) + os.sep) and base_path_str != root_path_str:
+                logging.error("Path '%s' is outside of allowed root '%s'", base_path, root_path)
+                return
+
+        logging.info(f"Analyzing local folder {base_path}")
+
        # Analyze source files
-        self.analyze_sources(Path(path), ignore, g)
+        self.analyze_sources(base_path, ignore, g)
        logging.info("Done analyzing path")
@@ -1,6 +1,7 @@
 from contextlib import nullcontext
 from pathlib import Path
 from typing import Optional
+import os
 from api.entities.entity import Entity
 from api.entities.file import File
@@ -176,7 +177,16 @@
        self.second_pass(graph, files, path)
    def analyze_sources(self, path: Path, ignore: list[str], graph: Graph) -> None:
+        # Resolve the target path and enforce that it lies within an allowed base directory.
        path = path.resolve()
+        base_dir_env = os.getenv("CODE_GRAPH_BASE_DIR", ".")
+        base_dir = Path(base_dir_env).resolve()
+        try:
+            # This will raise ValueError if 'path' is not inside 'base_dir'.
+            path.relative_to(base_dir)
+        except ValueError:
+            logging.error("Refusing to analyze path '%s' outside of base directory '%s'", path, base_dir)
+            raise ValueError(f"Path '{path}' is not allowed for analysis")
        files = list(path.rglob("*.java")) + list(path.rglob("*.py")) + list(path.rglob("*.cs")) + list(path.rglob("*.js"))
        # First pass analysis of the source code
        self.first_pass(path, files, ignore, graph)
@@ -1,6 +1,7 @@
 from contextlib import nullcontext
 from pathlib import Path
 from typing import Optional
+import os

 from api.entities.entity import Entity
 from api.entities.file import File
@@ -184,6 +185,34 @@
        # Second pass analysis of the source code
        self.second_pass(graph, files, path)

+    def _resolve_and_validate_path(self, user_path: str) -> Path:
+        """
+        Turn a caller-provided path into a resolved path confined to the safe root.
+
+        The safe root comes from the CODE_GRAPH_PROJECTS_ROOT environment
+        variable when it holds a non-empty value, otherwise from the current
+        working directory. Relative paths are interpreted against that root.
+
+        Raises:
+            ValueError: If the resolved path does not lie under the safe root.
+        """
+        configured_root = os.environ.get("CODE_GRAPH_PROJECTS_ROOT")
+        base_dir = (Path(configured_root) if configured_root else Path.cwd()).resolve()
+
+        # Joining an absolute path onto base_dir yields that absolute path
+        # unchanged, so relative and absolute inputs share one expression.
+        candidate = (base_dir / Path(user_path)).resolve()
+
+        try:
+            # relative_to() raises ValueError when candidate escapes base_dir
+            candidate.relative_to(base_dir)
+        except ValueError:
+            logging.error(f"Requested path '{candidate}' is outside of allowed base directory '{base_dir}'")
+            raise ValueError("Requested path is not allowed")
+        else:
+            return candidate
+
    def analyze_local_folder(self, path: str, g: Graph, ignore: Optional[list[str]] = []) -> None:
        """
        Analyze path.
@@ -195,8 +224,11 @@

        logging.info(f"Analyzing local folder {path}")

+        # Resolve and validate the provided path against a safe root
+        safe_path = self._resolve_and_validate_path(path)
+
        # Analyze source files
-        self.analyze_sources(Path(path), ignore, g)
+        self.analyze_sources(safe_path, ignore, g)

        logging.info("Done analyzing path")

@@ -1,6 +1,7 @@
 from contextlib import nullcontext
 from pathlib import Path
 from typing import Optional
+import os

 from api.entities.entity import Entity
 from api.entities.file import File
@@ -21,6 +22,36 @@
 # Configure logging
 logging.basicConfig(level=logging.DEBUG, format='%(filename)s - %(asctime)s - %(levelname)s - %(message)s')

+
+def _get_safe_root() -> Path:
+    """
+    Determine the directory that bounds every analysis request.
+
+    A non-empty CODEGRAPH_ROOT environment variable selects the root; when it
+    is missing or empty the current working directory is used instead. The
+    returned path is always resolved.
+    """
+    configured = os.environ.get("CODEGRAPH_ROOT")
+    root = Path(configured) if configured else Path.cwd()
+    return root.resolve()
+
+
+def _ensure_within_root(requested_path: Path) -> Path:
+    """
+    Resolve the requested path and ensure it resides within the safe root.
+
+    Args:
+        requested_path: Path to validate. It is resolved before the check, so
+            the comparison is made on the final absolute location.
+
+    Returns:
+        The resolved path when it equals the safe root or lies beneath it.
+
+    Raises:
+        ValueError: If the resolved path is outside the allowed root.
+    """
+    safe_root = _get_safe_root()
+    resolved = requested_path.resolve()
+    try:
+        # relative_to() is available on every Python 3 version, so no
+        # AttributeError fallback is required; it raises ValueError when
+        # `resolved` is not located under `safe_root`.
+        resolved.relative_to(safe_root)
+    except ValueError:
+        raise ValueError(f"Path '{resolved}' is outside of the allowed root '{safe_root}'") from None
+    return resolved
+
 # List of available analyzers
 analyzers: dict[str, AbstractAnalyzer] = {
    # '.c': CAnalyzer(),
@@ -195,8 +226,15 @@

        logging.info(f"Analyzing local folder {path}")

+        # Normalize and validate that the path is within the allowed root
+        try:
+            target_path = _ensure_within_root(Path(path))
+        except ValueError as e:
+            logging.error(str(e))
+            raise
+
        # Analyze source files
-        self.analyze_sources(Path(path), ignore, g)
+        self.analyze_sources(target_path, ignore, g)

        logging.info("Done analyzing path")

@@ -213,12 +250,19 @@

        from pygit2.repository import Repository

-        proj_name = Path(path).name
+        # Normalize and validate repository path
+        try:
+            repo_path = _ensure_within_root(Path(path))
+        except ValueError as e:
+            logging.error(str(e))
+            raise
+
+        proj_name = repo_path.name
        graph = Graph(proj_name)
-        self.analyze_local_folder(path, graph, ignore)
+        self.analyze_local_folder(str(repo_path), graph, ignore)

        # Save processed commit hash to the DB
-        repo = Repository(path)
+        repo = Repository(str(repo_path))
        current_commit = repo.walk(repo.head.target).__next__()
        graph.set_graph_commit(current_commit.short_id)

@@ -18,6 +18,7 @@
 from multilspy.multilspy_logger import MultilspyLogger

 import logging
+import os
 # Configure logging
 logging.basicConfig(level=logging.DEBUG, format='%(filename)s - %(asctime)s - %(levelname)s - %(message)s')

@@ -193,10 +194,29 @@
            ignore (List(str)): List of paths to skip
        """

-        logging.info(f"Analyzing local folder {path}")
+        try:
+            base_path = Path(path).resolve(strict=True)
+        except FileNotFoundError:
+            logging.error("Path '%s' does not exist or is not accessible", path)
+            return

+        safe_root = os.environ.get("CODEGRAPH_REPOS_ROOT")
+        if safe_root:
+            try:
+                root_path = Path(safe_root).resolve(strict=True)
+            except FileNotFoundError:
+                logging.error("Configured CODEGRAPH_REPOS_ROOT '%s' does not exist", safe_root)
+                return
+            base_path_str = str(base_path)
+            root_path_str = str(root_path)
+            if not base_path_str.startswith(root_path_str.rstrip(os.sep) + os.sep) and base_path_str != root_path_str:
+                logging.error("Path '%s' is outside of allowed root '%s'", base_path, root_path)
+                return
+
+        logging.info(f"Analyzing local folder {base_path}")
+
        # Analyze source files
-        self.analyze_sources(Path(path), ignore, g)
+        self.analyze_sources(base_path, ignore, g)

        logging.info("Done analyzing path")

@@ -1,6 +1,7 @@
 from contextlib import nullcontext
 from pathlib import Path
 from typing import Optional
+import os

 from api.entities.entity import Entity
 from api.entities.file import File
@@ -176,7 +177,16 @@
        self.second_pass(graph, files, path)

    def analyze_sources(self, path: Path, ignore: list[str], graph: Graph) -> None:
+        # Resolve the target path and enforce that it lies within an allowed base directory.
        path = path.resolve()
+        base_dir_env = os.getenv("CODE_GRAPH_BASE_DIR", ".")
+        base_dir = Path(base_dir_env).resolve()
+        try:
+            # This will raise ValueError if 'path' is not inside 'base_dir'.
+            path.relative_to(base_dir)
+        except ValueError:
+            logging.error("Refusing to analyze path '%s' outside of base directory '%s'", path, base_dir)
+            raise ValueError(f"Path '{path}' is not allowed for analysis")
        files = list(path.rglob("*.java")) + list(path.rglob("*.py")) + list(path.rglob("*.cs")) + list(path.rglob("*.js"))
        # First pass analysis of the source code
        self.first_pass(path, files, ignore, graph)
         # First pass analysis of the source code
         self.first_pass(path, files, ignore, graph)
 

diff --git a/pyproject.toml b/pyproject.toml
@@ -13,6 +13,7 @@ dependencies = [
     "tree-sitter-c>=0.24.1,<0.25.0",
     "tree-sitter-python>=0.25.0,<0.26.0",
     "tree-sitter-java>=0.23.5,<0.24.0",
+    "tree-sitter-javascript>=0.23.0",
     "tree-sitter-c-sharp>=0.23.1,<0.24.0",
     "flask>=3.1.0,<4.0.0",
     "python-dotenv>=1.0.1,<2.0.0",