From e50476b30a6d3426e50aa9666ed93de9f78e20fb Mon Sep 17 00:00:00 2001
From: Bar Nuri <barnuri@hotmail.com>
Date: Tue, 29 Apr 2025 08:59:00 +0300
Subject: [PATCH] feat: ability to run flow without langflow server (#7507)

* flow-runner

* flow-runner

* flow-runner - fix lint

* Update flow_runner.py

* [autofix.ci] apply automated fixes

* Update flow_runner.py

* [autofix.ci] apply automated fixes

* Update flow_runner.py

* [autofix.ci] apply automated fixes

* Update flow_runner.py

* [autofix.ci] apply automated fixes

* CR

* Add docs and require sessionid

* fix lint

* [autofix.ci] apply automated fixes

* refactor: simplify flow ID handling and update class docstring

* refactor: update flow runner import to experimental version

* removed obsolete test

* remove test that use io

* remove another io test

---------

Co-authored-by: autofix-ci[bot] <114827586+autofix-ci[bot]@users.noreply.github.com>
Co-authored-by: Edwin Jose <edwin.jose@datastax.com>
Co-authored-by: Jordan Frazier <jordan.frazier@datastax.com>
Co-authored-by: Jordan Frazier <122494242+jordanrfrazier@users.noreply.github.com>
Co-authored-by: Gabriel Luiz Freitas Almeida <gabriel@langflow.org>
---
 .../base/langflow/services/flow/__init__.py   |   0
 .../langflow/services/flow/flow_runner.py     | 172 ++++++++++++++++++
 .../tests/unit/services/flow/__init__.py      |   0
 .../unit/services/flow/test_flow_runner.py    |  84 +++++++++
 4 files changed, 256 insertions(+)
 create mode 100644 src/backend/base/langflow/services/flow/__init__.py
 create mode 100644 src/backend/base/langflow/services/flow/flow_runner.py
 create mode 100644 src/backend/tests/unit/services/flow/__init__.py
 create mode 100644 src/backend/tests/unit/services/flow/test_flow_runner.py

diff --git a/src/backend/base/langflow/services/flow/__init__.py b/src/backend/base/langflow/services/flow/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/src/backend/base/langflow/services/flow/flow_runner.py b/src/backend/base/langflow/services/flow/flow_runner.py
new file mode 100644
index 000000000..a578a00cf
--- /dev/null
+++ b/src/backend/base/langflow/services/flow/flow_runner.py
@@ -0,0 +1,236 @@
+import json
+import os
+from collections.abc import Callable
+from pathlib import Path
+from typing import Any
+from uuid import UUID
+
+from aiofile import async_open
+from loguru import logger
+from sqlalchemy import text
+
+from langflow.api.utils import cascade_delete_flow
+from langflow.graph import Graph
+from langflow.load import aload_flow_from_json
+from langflow.processing.process import run_graph
+from langflow.services.cache.service import AsyncBaseCacheService
+from langflow.services.database.models.flow import Flow
+from langflow.services.database.utils import initialize_database
+from langflow.services.deps import get_cache_service, session_scope
+
+
+class LangflowRunnerExperimental:
+    """LangflowRunnerExperimental orchestrates flow execution without a dedicated server.
+
+    .. warning::
+        This class is currently **experimental** and in a **beta phase**.
+        Its API and behavior may change in future releases. Use with caution in production environments.
+
+    Usage:
+    ------
+    Instantiate the class and call the `run` method with the desired flow and input.
+
+    Example:
+        runner = LangflowRunnerExperimental()
+        result = await runner.run(flow="path/to/flow.json", input_value="Hello", session_id=str(uuid.uuid4()))
+
+    """
+
+    # Set to False on the instance after the first database check so later runs skip it.
+    should_initialize_db: bool = True
+
+    async def run(
+        self,
+        session_id: str,  # UUID required currently
+        flow: Path | str | dict,
+        input_value: str,
+        input_type: str = "chat",
+        output_type: str = "chat",
+    ):
+        """Load a flow, execute it once, and remove its temporary state afterwards.
+
+        Args:
+            session_id: UUID string; it is also used as the flow id and the flow name.
+            flow: Path to a flow JSON file, or an already-parsed flow dict. A dict is
+                modified in place (id, session ids and environment-backed values).
+            input_value: Value passed to the graph as input.
+            input_type: Input type forwarded to the graph run.
+            output_type: Output type forwarded to the graph run.
+
+        Returns:
+            Whatever ``run_graph`` returns for the executed graph.
+
+        Raises:
+            ValueError: If ``session_id`` is not a valid UUID or a referenced env var is not set.
+            TypeError: If ``flow`` is neither a path nor a dict.
+        """
+        # Fail fast: the id is parsed as a UUID further down, after the cache has already been cleared.
+        try:
+            UUID(str(session_id))
+        except ValueError as exc:
+            error_msg = f"session_id must be a valid UUID string, got {session_id!r}"
+            raise ValueError(error_msg) from exc
+        logger.info(f"Start Handling {session_id=}")
+        await self.init_db_if_needed()
+        flow_dict = await self.get_flow_dict(flow)
+        self.set_flow_id(session_id, flow_dict)
+        # we must modify the flow schema to set the session_id and for load_from_db=True we load the value from env vars
+        self.modification(flow_dict, lambda obj, parent, key: self.modify_flow_schema(session_id, obj, parent, key))
+        await self.clear_flow_state(session_id, flow_dict)
+        await self.add_flow_to_db(session_id, flow_dict)
+        try:
+            # Build the graph inside the try so the flow row added above is removed even if loading fails.
+            graph = await self.create_graph_from_flow(session_id, flow_dict)
+            result = await self.run_graph(input_value, input_type, output_type, session_id, graph)
+        finally:
+            await self.clear_flow_state(session_id, flow_dict)
+        logger.info(f"Finish Handling {session_id=}")
+        return result
+
+    @staticmethod
+    def set_flow_id(session_id: str, flow_dict: dict) -> None:
+        """Use the session id as the flow id by writing it to ``flow_dict["id"]``."""
+        flow_dict["id"] = session_id
+
+    @staticmethod
+    async def add_flow_to_db(session_id: str, flow_dict: dict):
+        """Insert a ``Flow`` row named after the session, using the id and data of ``flow_dict``."""
+        flow_id = flow_dict["id"]
+        # Same id handling as clear_flow_state: accept a UUID instance or its string form.
+        uuid_obj = flow_id if isinstance(flow_id, UUID) else UUID(str(flow_id))
+        async with session_scope() as session:
+            flow_db = Flow(name=session_id, id=uuid_obj, data=flow_dict.get("data", {}))
+            session.add(flow_db)
+            await session.commit()
+
+    @staticmethod
+    async def run_graph(input_value: str, input_type: str, output_type: str, session_id: str, graph: Graph):
+        """Run ``graph`` through ``run_graph`` with env-var fallback enabled and return its result."""
+        return await run_graph(
+            graph=graph,
+            session_id=session_id,
+            input_value=input_value,
+            fallback_to_env_vars=True,
+            input_type=input_type,
+            output_type=output_type,
+        )
+
+    @staticmethod
+    async def create_graph_from_flow(session_id: str, flow_dict: dict):
+        """Build a graph from ``flow_dict`` and tag it with the flow id and session id."""
+        graph = await aload_flow_from_json(flow=flow_dict, disable_logs=False)
+        graph.flow_id = flow_dict["id"]
+        graph.session_id = session_id
+        return graph
+
+    @staticmethod
+    async def clear_flow_state(_session_id: str, flow_dict: dict):
+        """Clear the cache service and cascade-delete the flow identified by ``flow_dict["id"]``.
+
+        ``clear()`` is called on the cache service without a key; ``_session_id`` is unused.
+        """
+        cache_service = get_cache_service()
+        if isinstance(cache_service, AsyncBaseCacheService):
+            await cache_service.clear()
+        else:
+            cache_service.clear()
+        async with session_scope() as session:
+            flow_id = flow_dict["id"]
+            uuid_obj = flow_id if isinstance(flow_id, UUID) else UUID(str(flow_id))
+            await cascade_delete_flow(session, uuid_obj)
+
+    async def init_db_if_needed(self):
+        """Initialize the database if the existence check fails; done at most once per instance."""
+        # Test the flag first so later runs on this instance do not query the database again.
+        if not self.should_initialize_db:
+            return
+        if not await self.database_exists_check():
+            logger.info("Initializing database...")
+            await initialize_database(fix_migration=True)
+            logger.info("Database initialized.")
+        # Checked (and initialized if it was missing): skip both steps from now on.
+        self.should_initialize_db = False
+
+    @staticmethod
+    async def database_exists_check():
+        """Return True if a row can be read from ``public.alembic_version``, False otherwise.
+
+        Any exception raised by the query is logged at debug level and reported as False.
+        """
+        async with session_scope() as session:
+            try:
+                # NOTE(review): ``public.`` presumably targets PostgreSQL; confirm for other backends.
+                result = await session.exec(text("SELECT version_num FROM public.alembic_version"))
+                return result.first() is not None
+            except Exception as e:  # noqa: BLE001
+                logger.debug(f"Database check failed: {e}")
+                return False
+
+    @staticmethod
+    async def get_flow_dict(flow: Path | str | dict) -> dict:
+        """Return the flow as a dict, reading and parsing the JSON file when given a path.
+
+        Raises:
+            TypeError: If ``flow`` is not a str, Path, or dict.
+        """
+        if isinstance(flow, dict):
+            # Already parsed: returned as-is, not copied.
+            return flow
+        if isinstance(flow, str | Path):
+            async with async_open(Path(flow), encoding="utf-8") as f:
+                content = await f.read()
+                return json.loads(content)
+        error_msg = "Input must be a file path (str or Path object) or a JSON object (dict)."
+        raise TypeError(error_msg)
+
+    @staticmethod
+    def modify_flow_schema(session_id: str, obj: Any, parent: Any | None, _key: str | None):
+        """Patch one flow element: set the session id and resolve ``load_from_db`` values from env vars.
+
+        Dicts containing a ``session_id`` key get the given session id. Dicts with a truthy
+        ``load_from_db`` have it set to False and their ``value`` (used as an environment
+        variable name) replaced by that variable's value. Non-dict elements are ignored.
+
+        Raises:
+            ValueError: If the named environment variable is unset or empty.
+        """
+        if not isinstance(obj, dict):
+            return
+        parent_dict = parent if isinstance(parent, dict) else {}
+        parent_display = parent_dict.get("display_name", parent_dict.get("name", parent_dict.get("id", "unknown")))
+        if "session_id" in obj:
+            obj["session_id"] = session_id
+            logger.info(f"Setting {session_id=} for {parent_display=}")
+        if obj.get("load_from_db"):
+            obj["load_from_db"] = False
+            # .get(): a field flagged load_from_db without a "value" key is treated like an empty name.
+            env_var_name = obj.get("value")
+            if not env_var_name:
+                return
+            env_var_value = os.getenv(env_var_name)
+            if not env_var_value:
+                error_msg = f"Environment variable {env_var_name} not set for {parent_display}"
+                raise ValueError(error_msg)
+            obj["value"] = env_var_value
+            logger.info(f"Loading env var {env_var_name=} for {parent_display=}")
+
+    def modification(self, obj: Any, func: Callable[[Any, Any | None, str | None], None], parent: Any = None) -> None:
+        """Recursively apply a function to all elements in a nested structure (dict or list).
+
+        ``func`` receives the element, a parent, and the key (dict values only, otherwise None).
+        For dict values and list items the parent passed is this call's ``parent`` argument, i.e.
+        the container enclosing ``obj`` rather than ``obj`` itself. Scalar elements are then passed
+        to ``func`` a second time by the recursive call, with ``obj`` as parent and no key.
+        """
+        if isinstance(obj, dict):
+            for key, value in obj.items():
+                func(value, parent, key)
+                self.modification(value, func, obj)
+            return
+        if isinstance(obj, list):
+            for item in obj:
+                func(item, parent, None)
+                self.modification(item, func, obj)
+            return
+        # primitive types (int, float, str, bool, None)
+        func(obj, parent, None)
diff --git a/src/backend/tests/unit/services/flow/__init__.py b/src/backend/tests/unit/services/flow/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/src/backend/tests/unit/services/flow/test_flow_runner.py b/src/backend/tests/unit/services/flow/test_flow_runner.py
new file mode 100644
index 000000000..3d4ae5da4
--- /dev/null
+++ b/src/backend/tests/unit/services/flow/test_flow_runner.py
@@ -0,0 +1,72 @@
+from uuid import uuid4
+
+import pytest
+from langflow.services.flow.flow_runner import LangflowRunnerExperimental
+
+
+@pytest.fixture
+def sample_flow_dict():
+    """Minimal flow payload: a graph without nodes or edges."""
+    empty_graph = {"nodes": [], "edges": []}
+    return {"data": empty_graph}
+
+
+@pytest.fixture
+def flow_runner():
+    """Runner instance under test."""
+    return LangflowRunnerExperimental()
+
+
+@pytest.mark.asyncio
+async def test_database_exists_check(flow_runner):
+    """The database existence check reports a boolean."""
+    exists = await flow_runner.database_exists_check()
+    assert isinstance(exists, bool)
+
+
+@pytest.mark.asyncio
+async def test_get_flow_dict_from_dict(flow_runner, sample_flow_dict):
+    """A dict input is handed back with equal content."""
+    loaded = await flow_runner.get_flow_dict(sample_flow_dict)
+    assert loaded == sample_flow_dict
+
+
+@pytest.mark.asyncio
+async def test_get_flow_dict_invalid_input(flow_runner):
+    """An input that is neither a path nor a dict raises TypeError."""
+    with pytest.raises(TypeError, match=r"Input must be a file path .* or a JSON object .*"):
+        await flow_runner.get_flow_dict(123)
+
+
+@pytest.mark.asyncio
+async def test_run_with_dict_input(flow_runner, sample_flow_dict):
+    """Running a flow supplied as a dict yields a result."""
+    outcome = await flow_runner.run(
+        session_id=str(uuid4()),
+        flow=sample_flow_dict,
+        input_value="test input",
+    )
+    assert outcome is not None
+
+
+@pytest.mark.asyncio
+async def test_run_with_different_input_types(flow_runner, sample_flow_dict):
+    """Each input/output type combination yields a result for the same session."""
+    session_id = str(uuid4())
+    scenarios = (
+        {"input_value": "text input", "input_type": "text", "output_type": "text"},
+        {"input_value": "chat input", "input_type": "chat", "output_type": "chat"},
+        {"input_value": "test input", "input_type": "chat", "output_type": "text"},
+    )
+
+    for scenario in scenarios:
+        outcome = await flow_runner.run(flow=sample_flow_dict, session_id=session_id, **scenario)
+        assert outcome is not None
+
+
+@pytest.mark.asyncio
+async def test_initialize_database(flow_runner):
+    """After ``init_db_if_needed`` the ``should_initialize_db`` flag is cleared."""
+    flow_runner.should_initialize_db = True
+    await flow_runner.init_db_if_needed()
+    assert not flow_runner.should_initialize_db