From a190fd6b4739e038338d23ae4436298b7e638be0 Mon Sep 17 00:00:00 2001
From: Eugene Batalov <eugene@tensorlake.ai>
Date: Mon, 13 Jan 2025 12:13:50 +0000
Subject: [PATCH] Test for Function routing to Executors with function
 allowlists

The test might not catch a routing bug on a single run but will catch
it eventually if it happens.
---
 .../src/tests/test_function_allowlist.py      | 159 ++++++++++++++++++
 indexify/tests/src/tests/testing.py           |  37 ++++
 2 files changed, 196 insertions(+)
 create mode 100644 indexify/tests/src/tests/test_function_allowlist.py
 create mode 100644 indexify/tests/src/tests/testing.py

diff --git a/indexify/tests/src/tests/test_function_allowlist.py b/indexify/tests/src/tests/test_function_allowlist.py
new file mode 100644
index 000000000..dfd8d365b
--- /dev/null
+++ b/indexify/tests/src/tests/test_function_allowlist.py
@@ -0,0 +1,159 @@
+import os
+import subprocess
+import time
+import unittest
+from typing import List, Optional
+
+from indexify import Graph, indexify_function
+from indexify.remote_graph import RemoteGraph
+from tests.testing import ExecutorProcessContextManager, function_uri, test_graph_name
+
+# There's a dev mode executor already running in the testing environment.
+# It's used for all other tests that don't check the function allowlist.
+# This existing Executor can run any function. Its PID is discovered by the test.
+dev_mode_executor_pid: Optional[int] = None
+# PID of the Executor started by the test that can only run function_a.
+function_a_executor_pid: Optional[int] = None
+# PID of the Executor started by the test that can only run function_b.
+function_b_executor_pid: Optional[int] = None
+
+
+def get_executor_pid() -> int:
+    # The parent process is the Executor, assuming Subprocess Function Executors (OSS).
+    return os.getppid()
+
+
+@indexify_function()
+def get_dev_mode_executor_pid() -> int:  # start node of the PID discovery graph
+    return get_executor_pid()
+
+
+@indexify_function()
+def function_a() -> str:
+    # Returns "success" only when run by Executor A or by the dev mode Executor,
+    # otherwise raises an Exception that names the unexpected Executor PID.
+    # The PID globals are only read here, so no `global` statement is needed;
+    # the test assigns them before deploying the graph that uses this function.
+    executor_pid: int = get_executor_pid()
+    allowed_pids: List[Optional[int]] = [function_a_executor_pid, dev_mode_executor_pid]
+    if executor_pid not in allowed_pids:
+        raise Exception(
+            f"function_a Executor PID {executor_pid} is not in the allowlist: {allowed_pids}"
+        )
+    return "success"
+
+
+@indexify_function()
+def function_b(_: str) -> str:
+    # Returns "success" only when run by Executor B or by the dev mode Executor,
+    # otherwise raises an Exception that names the unexpected Executor PID.
+    # The PID globals are only read here, so no `global` statement is needed;
+    # the test assigns them before deploying the graph that uses this function.
+    executor_pid: int = get_executor_pid()
+    allowed_pids: List[Optional[int]] = [function_b_executor_pid, dev_mode_executor_pid]
+    if executor_pid not in allowed_pids:
+        raise Exception(
+            f"function_b Executor PID {executor_pid} is not in the allowlist: {allowed_pids}"
+        )
+    return "success"
+
+
+@indexify_function()
+def function_dev(_: str) -> str:  # expected to run on the dev mode Executor only
+    current_executor_pid: int = get_executor_pid()
+    allowed_executor_pids: List[Optional[int]] = [dev_mode_executor_pid]
+    if current_executor_pid not in allowed_executor_pids:
+        raise Exception(
+            f"function_dev Executor PID {current_executor_pid} is not in the allowlist: {allowed_executor_pids}"
+        )
+    return "success"
+
+
+class TestFunctionAllowlist(unittest.TestCase):
+    def test_function_routing(self):
+        # Version 1.0 of the graph only discovers the PID of the dev mode Executor.
+        global dev_mode_executor_pid, function_a_executor_pid, function_b_executor_pid
+        graph = Graph(
+            name=test_graph_name(self),
+            description="test",
+            start_node=get_dev_mode_executor_pid,
+            version="1.0",
+        )
+        graph = RemoteGraph.deploy(graph)
+
+        invocation_id = graph.run(block_until_done=True)
+        output = graph.output(invocation_id, "get_dev_mode_executor_pid")
+        self.assertEqual(len(output), 1)
+        dev_mode_executor_pid = output[0]
+        print(f"Found dev mode Executor PID: {dev_mode_executor_pid}")
+
+        # Allowlist URIs must name the graph deployed below: test_graph_name(self).
+        with ExecutorProcessContextManager(
+            [
+                "--function",
+                function_uri(
+                    "default",
+                    test_graph_name(self),
+                    "function_a",
+                    "2.0",
+                ),
+                "--ports",
+                "60000",
+                "60001",
+            ]
+        ) as executor_a:
+            executor_a: subprocess.Popen
+            function_a_executor_pid = executor_a.pid
+            print(f"Started Executor A with PID: {function_a_executor_pid}")
+
+            with ExecutorProcessContextManager(
+                [
+                    "--function",
+                    function_uri(
+                        "default",
+                        test_graph_name(self),
+                        "function_b",
+                        "2.0",
+                    ),
+                    "--ports",
+                    "60001",
+                    "60002",
+                ]
+            ) as executor_b:
+                executor_b: subprocess.Popen
+                function_b_executor_pid = executor_b.pid
+                print(f"Started Executor B with PID: {function_b_executor_pid}")
+
+                print(
+                    "Waiting 5 secs for Executors A and B to start and join the Server."
+                )
+                time.sleep(5)
+
+                graph = Graph(
+                    name=test_graph_name(self),
+                    description="test",
+                    start_node=function_a,
+                    version="2.0",
+                )
+                graph.add_edge(function_a, function_b)
+                graph.add_edge(function_b, function_dev)
+                graph = RemoteGraph.deploy(graph)
+                # As invocations might land on dev Executor, we need to run the graph multiple times
+                # to ensure that we catch wrong routing to Executor A or B if it ever happens.
+                for _ in range(10):
+                    invocation_id = graph.run(block_until_done=True)
+                    output = graph.output(invocation_id, "function_a")
+                    self.assertEqual(len(output), 1)
+                    self.assertEqual(output[0], "success")
+
+                    output = graph.output(invocation_id, "function_b")
+                    self.assertEqual(len(output), 1)
+                    self.assertEqual(output[0], "success")
+
+                    output = graph.output(invocation_id, "function_dev")
+                    self.assertEqual(len(output), 1)
+                    self.assertEqual(output[0], "success")
+
+
+if __name__ == "__main__":  # allow running this test module directly
+    unittest.main()
diff --git a/indexify/tests/src/tests/testing.py b/indexify/tests/src/tests/testing.py
new file mode 100644
index 000000000..00851bcdf
--- /dev/null
+++ b/indexify/tests/src/tests/testing.py
@@ -0,0 +1,37 @@
+import subprocess
+import unittest
+from typing import List, Optional
+
+
+def test_graph_name(test_case: unittest.TestCase) -> str:
+    """Converts a test case to a unique graph name.
+
+    Example:
+    >>> class TestGraphReduce(unittest.TestCase):
+    ...     def test_simple(self):
+    ...         g = Graph(name=test_graph_name(self), start_node=generate_seq)
+    ...         # ...
+    ...         print(g.name)
+    ...         # e.g. test_graph_reduce_TestGraphReduce_test_simple
+    """
+    return unittest.TestCase.id(test_case).replace(".", "_")
+
+
+def function_uri(namespace: str, graph: str, function: str, version: str) -> str:
+    return ":".join([namespace, graph, function, version])  # "ns:graph:fn:version"
+
+
+class ExecutorProcessContextManager:
+    # Runs `indexify-cli executor <args>` as a child process for the `with` body.
+    def __init__(self, args: List[str]):
+        self._args = ["indexify-cli", "executor", *args]
+        self._process: Optional[subprocess.Popen] = None
+
+    def __enter__(self) -> subprocess.Popen:
+        self._process = subprocess.Popen(self._args)
+        return self._process
+
+    def __exit__(self, exc_type, exc_value, traceback):
+        if self._process is not None:
+            self._process.terminate()
+            self._process.wait()