From 2abe076336bf9d2d892b3455fddc62e7a005e1de Mon Sep 17 00:00:00 2001 From: Dekel Reches Date: Tue, 24 Sep 2024 01:00:28 +0300 Subject: [PATCH] rework complex files to use granulate-utils --- gprofiler/profilers/java.py | 670 +----------------------------------- gprofiler/utils/__init__.py | 525 +++------------------------- 2 files changed, 64 insertions(+), 1131 deletions(-) diff --git a/gprofiler/profilers/java.py b/gprofiler/profilers/java.py index a5737541f..1ad08be77 100644 --- a/gprofiler/profilers/java.py +++ b/gprofiler/profilers/java.py @@ -13,21 +13,13 @@ # See the License for the specific language governing permissions and # limitations under the License. # -import errno import functools import json import os -import re -import secrets -import signal -from enum import Enum from pathlib import Path -from subprocess import CompletedProcess -from threading import Event, Lock -from types import TracebackType -from typing import Any, Dict, Iterable, List, Optional, Set, Type, TypeVar, Union, cast +from threading import Event +from typing import Any, Dict, Iterable, List, Optional, Set, Union -import psutil from granulate_utils.java import ( CONTAINER_INFO_REGEX, DETECTED_JAVA_PROCESSES_REGEX, @@ -38,34 +30,28 @@ JvmVersion, is_java_fatal_signal, java_exit_code_to_signo, - locate_hotspot_error_file, parse_jvm_flags, parse_jvm_version, ) -from gprofiler.platform import is_linux +from granulate_utils.gprofiler.platform import is_linux from gprofiler.utils.collapsed_format import parse_one_collapsed if is_linux(): from granulate_utils.linux import proc_events from granulate_utils.linux.kernel_messages import KernelMessage - from granulate_utils.linux.ns import get_proc_root_path, get_process_nspid, resolve_proc_root_links, run_in_ns from granulate_utils.linux.oom import get_oom_entry from granulate_utils.linux.process import ( get_mapped_dso_elf_id, - is_musl, - is_process_basename_matching, is_process_running, process_exe, - read_proc_file, ) from granulate_utils.linux.signals import get_signal_entry from packaging.version import Version -from psutil import NoSuchProcess, Process +from psutil import Process from gprofiler.diagnostics import is_diagnostics -from gprofiler.exceptions import CalledProcessError, CalledProcessTimeoutError, NoRwExecDirectoryFoundError from gprofiler.gprofiler_types import ( ProcessToProfileData, ProfileData, @@ -85,21 +71,15 @@ GPROFILER_DIRECTORY_NAME, TEMPORARY_STORAGE_PATH, pgrep_maps, - remove_path, - remove_prefix, resource_path, - run_process, - touch_path, wait_event, ) -from gprofiler.utils.fs import is_owned_by_root, is_rw_exec_dir, mkdir_owned_root, safe_copy from gprofiler.utils.perf import can_i_use_perf_events from gprofiler.utils.process import process_comm, search_proc_maps +from granulate_utils.gprofiler.java import * logger = get_logger_adapter(__name__) -libap_copy_lock = Lock() - # directories we check for rw,exec as candidates for libasyncProfiler.so placement. POSSIBLE_AP_DIRS = ( TEMPORARY_STORAGE_PATH, @@ -108,261 +88,6 @@ f"/dev/{GPROFILER_DIRECTORY_NAME}", # unfortunately, we encoundered some systems that left us no other option ) - -def frequency_to_ap_interval(frequency: int) -> int: - # async-profiler accepts interval between samples (nanoseconds) - return int((1 / frequency) * 1_000_000_000) - - -@functools.lru_cache(maxsize=1024) -def needs_musl_ap_cached(process: Process) -> bool: - """ - AP needs musl build if the JVM itself is built against musl. If the JVM is built against glibc, - we need the glibc build of AP. 
For this reason we also check for glibc-compat, which is an indicator - for glibc-based JVM despite having musl loaded. - """ - maps = process.memory_maps() - return is_musl(process, maps) and not any("glibc-compat" in m.path for m in maps) - - -class JavaSafemodeOptions(str, Enum): - # a profiled process was OOM-killed and we saw it in the kernel log - PROFILED_OOM = "profiled-oom" - # a profiled process was signaled: - # * fatally signaled and we saw it in the kernel log - # * we saw an exit code of signal in a proc_events event. - PROFILED_SIGNALED = "profiled-signaled" - # hs_err file was written for a profiled process - HSERR = "hserr" - # a process was OOM-killed and we saw it in the kernel log - GENERAL_OOM = "general-oom" - # a process was fatally signaled and we saw it in the kernel log - GENERAL_SIGNALED = "general-signaled" - # we saw the PID of a profiled process in the kernel logs - PID_IN_KERNEL_MESSAGES = "pid-in-kernel-messages" - # employ extended version checks before deciding to profile - # see _is_jvm_profiling_supported() docs for more information - JAVA_EXTENDED_VERSION_CHECKS = "java-extended-version-checks" - # refuse profiling if async-profiler is already loaded (and not by gProfiler) - # in the target process - AP_LOADED_CHECK = "ap-loaded-check" - - -JAVA_SAFEMODE_ALL = "all" # magic value for *all* options from JavaSafemodeOptions -JAVA_SAFEMODE_ALL_OPTIONS = [o.value for o in JavaSafemodeOptions] -JAVA_SAFEMODE_DEFAULT_OPTIONS = [ - JavaSafemodeOptions.PROFILED_OOM.value, - JavaSafemodeOptions.PROFILED_SIGNALED.value, - JavaSafemodeOptions.HSERR.value, -] - - -SUPPORTED_AP_MODES = ["cpu", "itimer", "alloc"] - - -# see StackWalkFeatures -# https://github.com/async-profiler/async-profiler/blob/a17529378b47e6700d84f89d74ca5e6284ffd1a6/src/arguments.h#L95-L112 -class AsyncProfilerFeatures(str, Enum): - # these will be controllable via "features" in a future AP release: - # - # unknown_java - # unwind_stub - # unwind_comp - # unwind_native - # java_anchor - # gc_traces - - # these are controllable via "features" in AP 3.0 - probe_sp = "probesp" - vtable_target = "vtable" - comp_task = "comptask" - # as of AP 3.0 - - -SUPPORTED_AP_FEATURES = [o.value for o in AsyncProfilerFeatures] -DEFAULT_AP_FEATURES = [AsyncProfilerFeatures.probe_sp.value, AsyncProfilerFeatures.vtable_target.value] - -# see options still here and not in "features": -# https://github.com/async-profiler/async-profiler/blob/a17529378b47e6700d84f89d74ca5e6284ffd1a6/src/arguments.cpp#L262 -# we don't want any of them disabled by default. -JAVA_ASYNC_PROFILER_DEFAULT_SAFEMODE = 0 - -PROBLEMATIC_FRAME_REGEX = re.compile(r"^# Problematic frame:\n# (.*?)\n#\n", re.MULTILINE | re.DOTALL) -""" -See VMError::report. 
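(Editor's aside - illustrative, not part of the patch: given hs_err_text, the contents of an
hs_err file (name hypothetical), PROBLEMATIC_FRAME_REGEX.search(hs_err_text).group(1) yields
the frame text after the "# " prefix, e.g. "C  [libasyncProfiler.so+0x218a0]  Profiler::getJavaTraceAsync...")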
-Example: - # Problematic frame: - # C [libasyncProfiler.so+0x218a0] Profiler::getJavaTraceAsync(void*, ASGCT_CallFrame*, int)+0xe0 -""" - - -class JavaFlagCollectionOptions(str, Enum): - ALL = "all" - DEFAULT = "default" - NONE = "none" - - -class JattachExceptionBase(CalledProcessError): - def __init__( - self, returncode: int, cmd: Any, stdout: Any, stderr: Any, target_pid: int, ap_log: str, ap_loaded: str - ): - super().__init__(returncode, cmd, stdout, stderr) - self._target_pid = target_pid - self._ap_log = ap_log - self._ap_loaded = ap_loaded - - def __str__(self) -> str: - ap_log = self._ap_log.strip() - if not ap_log: - ap_log = "(empty)" - loaded_msg = f"async-profiler DSO loaded: {self._ap_loaded}" - return super().__str__() + f"\nJava PID: {self._target_pid}\n{loaded_msg}\nasync-profiler log:\n{ap_log}" - - def get_ap_log(self) -> str: - return self._ap_log - - @property - def is_ap_loaded(self) -> bool: - return self._ap_loaded == "yes" - - -class JattachException(JattachExceptionBase): - pass - - -# doesn't extend JattachException itself, we're not just a jattach error, we're -# specifically the timeout one. -class JattachTimeout(JattachExceptionBase): - def __init__( - self, - returncode: int, - cmd: Any, - stdout: Any, - stderr: Any, - target_pid: int, - ap_log: str, - ap_loaded: str, - timeout: int, - ): - super().__init__(returncode, cmd, stdout, stderr, target_pid, ap_log, ap_loaded) - self._timeout = timeout - - def __str__(self) -> str: - return super().__str__() + ( - f"\njattach timed out (timeout was {self._timeout} seconds);" - " you can increase it with the --java-jattach-timeout parameter." - ) - - -class JattachSocketMissingException(JattachExceptionBase): - def __str__(self) -> str: - # the attach listener is initialized once, then it is marked as initialized: - # (https://github.com/openjdk/jdk/blob/3d07b3c7f01b60ff4dc38f62407c212b48883dbf/src/hotspot/share/services/attachListener.cpp#L388) - # and will not be initialized again: - # https://github.com/openjdk/jdk/blob/3d07b3c7f01b60ff4dc38f62407c212b48883dbf/src/hotspot/os/linux/attachListener_linux.cpp#L509 - # since openjdk 2870c9d55efe, the attach socket will be recreated even when removed (and this exception - # won't happen). - return super().__str__() + ( - "\nJVM attach socket is missing and jattach could not create it. It has most" - " likely been removed; the process has to be restarted for a new socket to be created." - ) - - -class JattachJcmdRunner: - def __init__(self, stop_event: Event, jattach_timeout: int): - self.stop_event = stop_event - self.jattach_timeout = jattach_timeout - - def run(self, process: Process, cmd: str) -> str: - try: - return run_process( - [asprof_path(), "jcmd", str(process.pid), cmd], - stop_event=self.stop_event, - timeout=self.jattach_timeout, - ).stdout.decode() - except CalledProcessError as e: - if f"Process {process.pid} not found" in str(e): - raise NoSuchProcess(process.pid) - raise e - - -def is_java_basename(process: Process) -> bool: - return is_process_basename_matching(process, r"^java$") - - -_JAVA_VERSION_TIMEOUT = 5 - -_JAVA_VERSION_CACHE_MAX = 1024 - - -def _get_process_ns_java_path(process: Process) -> Optional[str]: - """ - Look up path to java executable installed together with this process' libjvm. - """ - # This has the benefit of working even if the Java binary was replaced, e.g due to an upgrade. 
-    # in that case, the libraries would have been replaced as well, and therefore we're actually checking
-    # the version of the now installed Java, and not the running one.
-    # but since this is used for the "JDK type" check, it's good enough - we don't expect that to change.
-    # this whole check, however, is growing to be too complex, and we should consider other approaches
-    # for it:
-    # 1. purely in async-profiler - before calling any APIs that might harm blacklisted JDKs, we can
-    #    check the JDK type in async-profiler itself.
-    # 2. assume JDK type by the path, e.g. the "java" Docker image has
-    #    "/usr/lib/jvm/java-8-openjdk-amd64/jre/bin/java" which means "OpenJDK". Needs to be checked for
-    #    other JDK types.
-    if is_java_basename(process):
-        nspid = get_process_nspid(process.pid)
-        return f"/proc/{nspid}/exe"  # it's a symlink and will be resolvable under process' mnt ns
-    libjvm_path: Optional[str] = None
-    for m in process.memory_maps():
-        if re.match(DETECTED_JAVA_PROCESSES_REGEX, m.path):
-            libjvm_path = m.path
-            break
-    if libjvm_path is not None:
-        libjvm_dir = os.path.dirname(libjvm_path)
-        # support two java layouts - it's either lib/server/../../bin/java or lib/{arch}/server/../../../bin/java:
-        java_candidate_paths = [
-            Path(libjvm_dir, "../../bin/java").resolve(),
-            Path(libjvm_dir, "../../../bin/java").resolve(),
-        ]
-        for java_path in java_candidate_paths:
-            # don't need resolve_proc_root_links here - paths in /proc/pid/maps are normalized.
-            proc_relative_path = Path(f"/proc/{process.pid}/root", java_path.relative_to("/"))
-            if proc_relative_path.exists():
-                if os.access(proc_relative_path, os.X_OK):
-                    return str(java_path)
-    return None
-
-
-# process is hashable and the same process instance compares equal
-@functools.lru_cache(maxsize=_JAVA_VERSION_CACHE_MAX)
-def get_java_version(process: Process, stop_event: Event) -> Optional[str]:
-    # make sure we're able to find "java" binary bundled with process libjvm
-    process_java_path = _get_process_ns_java_path(process)
-    if process_java_path is None:
-        return None
-
-    def _run_java_version() -> "CompletedProcess[bytes]":
-        return run_process(
-            [
-                cast(str, process_java_path),
-                "-version",
-            ],
-            stop_event=stop_event,
-            timeout=_JAVA_VERSION_TIMEOUT,
-        )
-
-    # doesn't work without changing PID NS as well (I'm getting ENOENT for libjli.so)
-    # Version is printed to stderr
-    return run_in_ns(["pid", "mnt"], _run_java_version, process.pid).stderr.decode().strip()
-
-
-def get_java_version_logged(process: Process, stop_event: Event) -> Optional[str]:
-    java_version = get_java_version(process, stop_event)
-    logger.debug("java -version output", java_version_output=java_version, pid=process.pid)
-    return java_version
-
-
 class JavaMetadata(ApplicationMetadata):
     def __init__(
         self,
@@ -375,7 +100,7 @@ def __init__(
         self.java_collect_jvm_flags = java_collect_jvm_flags
 
     def make_application_metadata(self, process: Process) -> Dict[str, Any]:
-        version = get_java_version(process, self._stop_event) or "/java not found"
+        version = get_java_version(process, self._stop_event, logger) or "/java not found"
        # libjvm elfid - we care only about libjvm, not about the java exe itself which is just a small program
        # that loads other libs.
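        # --- editor's sketch (hypothetical helper, not part of this patch): conceptually,
        # the libjvm DSO is located by scanning the process' memory maps, e.g.:
        #
        #     def _find_libjvm(process: Process) -> Optional[str]:
        #         for m in process.memory_maps():  # psutil mappings, each with a .path
        #             if "/libjvm" in m.path:
        #                 return m.path
        #         return None
        #
        # the get_mapped_dso_elf_id() call below derives a stable ELF ID from that mapping.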
libjvm_elfid = get_mapped_dso_elf_id(process, "/libjvm") @@ -470,372 +195,6 @@ def fdtransfer_path() -> str: def get_ap_version() -> str: return Path(resource_path("java/async-profiler-version")).read_text() - -T = TypeVar("T", bound="AsyncProfiledProcess") - -# Format is defined by async-profiler here: (Granulate's fork logs the output to logger, hence the `INFO` prefix) -# https://github.com/jvm-profiling-tools/async-profiler/blob/7eaefdb18f331962dc4c78c82322aec257e95c6c/src/profiler.cpp#L1204 - -_MEM_INFO_LOG_RE = re.compile( - r"\[INFO\] Call trace storage:\s*(\d+) " - r"KB\n\s*Dictionaries:\s*(\d+) KB\n\s*Code cache:\s*(\d+) KB\n-*\n\s*Total:\s*(\d+) " - r"KB\n\n" -) - - -class AsyncProfiledProcess: - """ - Represents a process profiled with async-profiler. - """ - - FORMAT_PARAMS = "ann,sig" - OUTPUT_FORMAT = "collapsed" - OUTPUTS_MODE = 0o622 # readable by root, writable by all - - # timeouts in seconds - _FDTRANSFER_TIMEOUT = 10 - _DEFAULT_JATTACH_TIMEOUT = 30 # higher than jattach's timeout - - _DEFAULT_MCACHE = 30 # arbitrarily chosen, not too high & not too low. - - def __init__( - self, - process: Process, - profiler_state: ProfilerState, - mode: str, - ap_safemode: int, - ap_features: List[str], - ap_args: str, - jattach_timeout: int = _DEFAULT_JATTACH_TIMEOUT, - mcache: int = 0, - collect_meminfo: bool = True, - include_method_modifiers: bool = False, - java_line_numbers: str = "none", - ): - self.process = process - self._profiler_state = profiler_state - # access the process' root via its topmost parent/ancestor which uses the same mount namespace. - # this allows us to access the files after the process exits: - # * for processes that run in host mount NS - their ancestor is always available (it's going to be PID 1) - # * for processes that run in a container, and the container remains running after they exit - hence, the - # ancestor is still alive. - # there is a hidden assumption here that neither the ancestor nor the process will change their mount - # namespace. I think it's okay to assume that. - self._process_root = get_proc_root_path(process) - self._cmdline = process.cmdline() - self._cwd = process.cwd() - self._nspid = get_process_nspid(self.process.pid) - - # not using storage_dir for AP itself on purpose: this path should remain constant for the lifetime - # of the target process, so AP is loaded exactly once (if we have multiple paths, AP can be loaded - # multiple times into the process) - # without depending on storage_dir here, we maintain the same path even if gProfiler is re-run, - # because storage_dir changes between runs. - # we embed the async-profiler version in the path, so future gprofiler versions which use another version - # of AP case use it (will be loaded as a different DSO) - self._ap_dir_base = self._find_rw_exec_dir() - self._ap_dir_versioned = os.path.join(self._ap_dir_base, f"async-profiler-{get_ap_version()}") - self._ap_dir_host = os.path.join( - self._ap_dir_versioned, - "musl" if self._needs_musl_ap() else "glibc", - ) - - self._libap_path_host = os.path.join(self._ap_dir_host, "libasyncProfiler.so") - self._libap_path_process = remove_prefix(self._libap_path_host, self._process_root) - - # for other purposes - we can use storage_dir. 
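        # --- editor's illustration (concrete values assumed, not from the patch): with the
        # first candidate dir and a glibc JVM, the layout built above resolves to e.g.
        #
        #     /tmp/gprofiler_tmp/async-profiler-<AP version>/glibc/libasyncProfiler.so
        #
        # which stays constant per AP version, so each JVM loads the DSO at most once.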
- self._storage_dir_host = resolve_proc_root_links(self._process_root, self._profiler_state.storage_dir) - - self._output_path_host = os.path.join(self._storage_dir_host, f"async-profiler-{self.process.pid}.output") - self._output_path_process = remove_prefix(self._output_path_host, self._process_root) - self._log_path_host = os.path.join(self._storage_dir_host, f"async-profiler-{self.process.pid}.log") - self._log_path_process = remove_prefix(self._log_path_host, self._process_root) - - assert mode in ("cpu", "itimer", "alloc"), f"unexpected mode: {mode}" - self._mode = mode - self._fdtransfer_path = f"@async-profiler-{process.pid}-{secrets.token_hex(10)}" if mode == "cpu" else None - self._ap_safemode = ap_safemode - self._ap_features = ap_features - self._ap_args = ap_args - self._jattach_timeout = jattach_timeout - self._mcache = mcache - self._collect_meminfo = collect_meminfo - self._include_method_modifiers = ",includemm" if include_method_modifiers else "" - self._include_line_numbers = ",includeln" if java_line_numbers == "line-of-function" else "" - - def _find_rw_exec_dir(self) -> str: - """ - Find a rw & executable directory (in the context of the process) where we can place libasyncProfiler.so - and the target process will be able to load it. - This function creates the gprofiler_tmp directory as a directory owned by root, if it doesn't exist under the - chosen rwx directory. - It does not create the parent directory itself, if it doesn't exist (e.g /run). - The chosen rwx directory needs to be owned by root. - """ - for d in POSSIBLE_AP_DIRS: - full_dir = Path(resolve_proc_root_links(self._process_root, d)) - if not full_dir.parent.exists(): - continue # we do not create the parent. - - if not is_owned_by_root(full_dir.parent): - continue # the parent needs to be owned by root - - try: - mkdir_owned_root(full_dir) - except OSError as e: - # dir is not r/w, try next one - if e.errno == errno.EROFS: - continue - raise - - if is_rw_exec_dir(full_dir): - return str(full_dir) - else: - raise NoRwExecDirectoryFoundError( - f"Could not find a rw & exec directory out of {POSSIBLE_AP_DIRS} for {self._process_root}!" - ) - - def __enter__(self: T) -> T: - # create the directory structure for executable libap, make sure it's owned by root - # for sanity & simplicity, mkdir_owned_root() does not support creating parent directories, as this allows - # the caller to absentmindedly ignore the check of the parents ownership. - # hence we create the structure here part by part. - assert is_owned_by_root( - Path(self._ap_dir_base) - ), f"expected {self._ap_dir_base} to be owned by root at this point" - mkdir_owned_root(self._ap_dir_versioned) - mkdir_owned_root(self._ap_dir_host) - os.makedirs(self._storage_dir_host, 0o755, exist_ok=True) - - self._check_disk_requirements() - - # make out & log paths writable for all, so target process can write to them. - # see comment on TemporaryDirectoryWithMode in GProfiler.__init__. - touch_path(self._output_path_host, self.OUTPUTS_MODE) - self._recreate_log() - # copy libasyncProfiler.so if needed - self._copy_libap() - - return self - - def __exit__( - self, - exc_type: Optional[Type[BaseException]], - exc_val: Optional[BaseException], - exc_ctb: Optional[TracebackType], - ) -> None: - # ignore_errors because we are deleting paths via /proc/pid/root - and the pid - # we're using might have gone down already. - # remove them as best effort. 
- remove_path(self._output_path_host, missing_ok=True) - remove_path(self._log_path_host, missing_ok=True) - - def _existing_realpath(self, path: str) -> Optional[str]: - """ - Return path relative to process working directory if it exists. Otherwise return None. - """ - if not path.startswith("/"): - # relative path - path = f"{self._cwd}/{path}" - path = resolve_proc_root_links(self._process_root, path) - return path if os.path.exists(path) else None - - def locate_hotspot_error_file(self) -> Optional[str]: - for path in locate_hotspot_error_file(self._nspid, self._cmdline): - realpath = self._existing_realpath(path) - if realpath is not None: - return realpath - return None - - def _needs_musl_ap(self) -> bool: - """ - Should we use the musl build of AP for this process? - """ - return needs_musl_ap_cached(self.process) - - def _copy_libap(self) -> None: - # copy *is* racy with respect to other processes running in the same namespace, because they all use - # the same directory for libasyncProfiler.so. - # therefore, we need to synchronize copies from different threads that profile different processes. - if os.path.exists(self._libap_path_host): - # all good - return - - with libap_copy_lock: - if not os.path.exists(self._libap_path_host): - # atomically copy it - libap_resource = resource_path( - os.path.join("java", "musl" if self._needs_musl_ap() else "glibc", "libasyncProfiler.so") - ) - os.chmod( - libap_resource, 0o755 - ) # make it accessible for all; needed with PyInstaller, which extracts files as 0700 - safe_copy(libap_resource, self._libap_path_host) - - def _recreate_log(self) -> None: - touch_path(self._log_path_host, self.OUTPUTS_MODE) - - def _check_disk_requirements(self) -> None: - """ - Avoid running if disk space is low, so we don't reach out-of-disk space situation because of profiling data. - """ - free_disk = psutil.disk_usage(self._storage_dir_host).free - required = 250 * 1024 - if free_disk < required: - raise Exception( - f"Not enough free disk space: {free_disk}kb left, {250 * 1024}kb" - f" required (on path: {self._output_path_host!r}" - ) - - def _get_base_cmd(self) -> List[str]: - return [ - asprof_path(), - str(self.process.pid), - "load", - self._libap_path_process, - "true", # 'true' means the given path ^^ is absolute. 
- ] - - def _get_extra_ap_args(self) -> str: - return f",{self._ap_args}" if self._ap_args else "" - - def _get_ap_output_args(self) -> str: - return ( - f",file={self._output_path_process},{self.OUTPUT_FORMAT}," - + f"{self.FORMAT_PARAMS}{self._include_method_modifiers}{self._include_line_numbers}" - ) - - def _get_interval_arg(self, interval: int) -> str: - if self._mode == "alloc": - return f",alloc={interval}" - return f",interval={interval}" - - def _get_start_cmd(self, interval: int, ap_timeout: int) -> List[str]: - return self._get_base_cmd() + [ - f"start,event={self._mode}" - f"{self._get_ap_output_args()}{self._get_interval_arg(interval)}," - f"log={self._log_path_process}" - f"{f',fdtransfer={self._fdtransfer_path}' if self._mode == 'cpu' else ''}" - f",safemode={self._ap_safemode}," - f",features={'+'.join(self._ap_features)}," # asprof uses '+' as a separator: https://github.com/async-profiler/async-profiler/blob/a17529378b47e6700d84f89d74ca5e6284ffd1a6/src/launcher/main.cpp#L441 # noqa - f"timeout={ap_timeout}" - f"{',lib' if self._profiler_state.insert_dso_name else ''}{self._get_extra_ap_args()}" - ] - - def _get_stop_cmd(self, with_output: bool) -> List[str]: - return self._get_base_cmd() + [ - f"stop,log={self._log_path_process},mcache={self._mcache}" - f"{self._get_ap_output_args() if with_output else ''}" - f"{',lib' if self._profiler_state.insert_dso_name else ''}{',meminfolog' if self._collect_meminfo else ''}" - f"{self._get_extra_ap_args()}" - ] - - def _read_ap_log(self) -> str: - if not os.path.exists(self._log_path_host): - return "(log file doesn't exist)" - - log = Path(self._log_path_host) - ap_log = log.read_text() - # clean immediately so we don't mix log messages from multiple invocations. - # this is also what AP's profiler.sh does. - log.unlink() - self._recreate_log() - return ap_log - - def _run_async_profiler(self, cmd: List[str]) -> str: - try: - # kill jattach with SIGTERM if it hangs. it will go down - run_process( - cmd, - stop_event=self._profiler_state.stop_event, - timeout=self._jattach_timeout, - kill_signal=signal.SIGTERM, - ) - except CalledProcessError as e: # catches CalledProcessTimeoutError as well - assert isinstance(e.stderr, str), f"unexpected type {type(e.stderr)}" - - ap_log = self._read_ap_log() - try: - ap_loaded = ( - "yes" if f" {self._libap_path_process}\n" in read_proc_file(self.process, "maps").decode() else "no" - ) - except NoSuchProcess: - ap_loaded = "not sure, process exited" - - args = e.returncode, e.cmd, e.stdout, e.stderr, self.process.pid, ap_log, ap_loaded - if isinstance(e, CalledProcessTimeoutError): - raise JattachTimeout(*args, timeout=self._jattach_timeout) from None - elif e.stderr == "Could not start attach mechanism: No such file or directory\n": - # this is true for jattach_hotspot - raise JattachSocketMissingException(*args) from None - else: - raise JattachException(*args) from None - else: - ap_log = self._read_ap_log() - ap_log_stripped = _MEM_INFO_LOG_RE.sub("", ap_log) # strip out mem info log only when for gProfiler log - logger.debug("async-profiler log", jattach_cmd=cmd, ap_log=ap_log_stripped) - return ap_log - - def _run_fdtransfer(self) -> None: - """ - Start fdtransfer; it will fork & exit once ready, so we can continue with jattach. 
- """ - assert self._fdtransfer_path is not None # should be set if fdntransfer is invoked - run_process( - # run fdtransfer with accept timeout that's slightly greater than the jattach timeout - to make - # sure that fdtransfer is still around for the full duration of jattach, in case the application - # takes a while to accept & handle the connection. - [ - asprof_path(), - "fdtransfer", - "--fd-path", - self._fdtransfer_path, - "--fdtransfer-timeout", - str(self._jattach_timeout + 5), - str(self.process.pid), - ], - stop_event=self._profiler_state.stop_event, - timeout=self._FDTRANSFER_TIMEOUT, - ) - - def start_async_profiler(self, interval: int, second_try: bool = False, ap_timeout: int = 0) -> bool: - """ - Returns True if profiling was started; False if it was already started. - ap_timeout defaults to 0, which means "no timeout" for AP (see call to startTimer() in profiler.cpp) - """ - if self._mode == "cpu" and not second_try: - self._run_fdtransfer() - - start_cmd = self._get_start_cmd(interval, ap_timeout) - try: - self._run_async_profiler(start_cmd) - return True - except JattachException as e: - if e.is_ap_loaded: - if ( - e.returncode == 200 # 200 == AP's COMMAND_ERROR - # this is the error we get when we try to start AP on a process that already has it loaded. - # check with "in" and not "==" in case other warnings/infos are printed alongside it, - # but generally, we expect it to be the only output in this case. - and "[ERROR] Profiler already started\n" in e.get_ap_log() - ): - # profiler was already running - return False - raise - - def stop_async_profiler(self, with_output: bool) -> str: - return self._run_async_profiler(self._get_stop_cmd(with_output)) - - def read_output(self) -> Optional[str]: - try: - return Path(self._output_path_host).read_text() - except FileNotFoundError: - # perhaps it has exited? - if not is_process_running(self.process): - return None - raise - - @register_profiler( "Java", possible_modes=["ap", "disabled"], @@ -1031,7 +390,9 @@ def __init__( self._enabled_proc_events_java = False self._collect_jvm_flags = self._init_collect_jvm_flags(java_collect_jvm_flags) self._jattach_jcmd_runner = JattachJcmdRunner( - stop_event=self._profiler_state.stop_event, jattach_timeout=self._jattach_timeout + stop_event=self._profiler_state.stop_event, + jattach_timeout=self._jattach_timeout, + logger=logger, ) self._ap_timeout = self._duration + self._AP_EXTRA_TIMEOUT_S application_identifiers.ApplicationIdentifiers.init_java(self._jattach_jcmd_runner) @@ -1235,7 +596,7 @@ def _profile_process(self, process: Process, duration: int, spawned: bool) -> Pr self._want_to_profile_pids.add(process.pid) # there's no reliable way to get the underlying cache of get_java_version, otherwise # I'd just use it. 
- if len(self._pid_to_java_version) > _JAVA_VERSION_CACHE_MAX: + if len(self._pid_to_java_version) > JAVA_VERSION_CACHE_MAX: self._pid_to_java_version.clear() # This Java version might be used in _proc_exit_callback @@ -1269,11 +630,18 @@ def _profile_process(self, process: Process, duration: int, spawned: bool) -> Pr with AsyncProfiledProcess( process, - self._profiler_state, + self._profiler_state.stop_event, + self._profiler_state.storage_dir, + self._profiler_state.insert_dso_name, + asprof_path(), + get_ap_version(), + os.path.join("java", "glibc", "libasyncProfiler.so"), + os.path.join("java", "musl", "libasyncProfiler.so"), self._mode, self._ap_safemode, self._ap_features, self._ap_args, + logger, self._jattach_timeout, self._ap_mcache, self._report_meminfo, @@ -1286,7 +654,7 @@ def _profile_process(self, process: Process, duration: int, spawned: bool) -> Pr @staticmethod def _log_mem_usage(ap_log: str, pid: int) -> None: - match = _MEM_INFO_LOG_RE.search(ap_log) + match = MEM_INFO_LOG_RE.search(ap_log) if match is None: logger.warning("Couldn't extract mem usage from ap log", log=ap_log, pid=pid) return diff --git a/gprofiler/utils/__init__.py b/gprofiler/utils/__init__.py index e93483c6b..e38142dea 100644 --- a/gprofiler/utils/__init__.py +++ b/gprofiler/utils/__init__.py @@ -13,64 +13,28 @@ # See the License for the specific language governing permissions and # limitations under the License. # -import ctypes -import datetime -import glob -import logging import os -import random import re -import shutil -import signal -import socket -import string -import subprocess -import sys -import time -from contextlib import contextmanager from functools import lru_cache -from pathlib import Path -from subprocess import CompletedProcess, Popen, TimeoutExpired -from tempfile import TemporaryDirectory -from threading import Event -from typing import Any, Callable, Dict, Iterator, List, Optional, Tuple, Union, cast +from typing import List import importlib_resources import psutil -from granulate_utils.exceptions import CouldNotAcquireMutex -from granulate_utils.linux.mutex import try_acquire_mutex -from granulate_utils.linux.ns import run_in_ns from granulate_utils.linux.process import is_kernel_thread, process_exe from psutil import Process -from gprofiler.consts import CPU_PROFILING_MODE -from gprofiler.platform import is_linux, is_windows +from granulate_utils.gprofiler.platform import is_windows +import granulate_utils.gprofiler.utils as _utils +from granulate_utils.gprofiler.utils import * if is_windows(): import pythoncom import wmi -from gprofiler.exceptions import ( - CalledProcessError, - CalledProcessTimeoutError, - ProcessStoppedException, - ProgramMissingException, - StopEventSetException, -) from gprofiler.log import get_logger_adapter logger = get_logger_adapter(__name__) -GPROFILER_DIRECTORY_NAME = "gprofiler_tmp" -TEMPORARY_STORAGE_PATH = ( - f"/tmp/{GPROFILER_DIRECTORY_NAME}" - if is_linux() - else os.getenv("USERPROFILE", default=os.getcwd()) + f"\\AppData\\Local\\Temp\\{GPROFILER_DIRECTORY_NAME}" -) - -gprofiler_mutex: Optional[socket.socket] = None - - @lru_cache(maxsize=None) def resource_path(relative_path: str = "") -> str: *relative_directory, basename = relative_path.split("/") @@ -81,242 +45,6 @@ def resource_path(relative_path: str = "") -> str: except ImportError as e: raise Exception(f"Resource {relative_path!r} not found!") from e - -@lru_cache(maxsize=None) -def is_root() -> bool: - if is_windows(): - return cast(int, ctypes.windll.shell32.IsUserAnAdmin()) == 1 # 
type: ignore
-    else:
-        return os.geteuid() == 0
-
-
-libc: Optional[ctypes.CDLL] = None
-
-
-def prctl(*argv: Any) -> int:
-    global libc
-    if libc is None:
-        libc = ctypes.CDLL("libc.so.6", use_errno=True)
-    return cast(int, libc.prctl(*argv))
-
-
-PR_SET_PDEATHSIG = 1
-
-
-def set_child_termination_on_parent_death() -> int:
-    ret = prctl(PR_SET_PDEATHSIG, signal.SIGTERM)
-    if ret != 0:
-        errno = ctypes.get_errno()
-        logger.warning(
-            f"Failed to set parent-death signal on child process. errno: {errno}, strerror: {os.strerror(errno)}"
-        )
-    return ret
-
-
-def wrap_callbacks(callbacks: List[Callable]) -> Callable:
-    # Expects an array of callbacks.
-    # Returns one callback that calls each one of them, and returns the retval of the last callback.
-    def wrapper() -> Any:
-        ret = None
-        for cb in callbacks:
-            ret = cb()
-
-        return ret
-
-    return wrapper
-
-
-def start_process(
-    cmd: Union[str, List[str]], via_staticx: bool = False, term_on_parent_death: bool = True, **kwargs: Any
-) -> Popen:
-    if isinstance(cmd, str):
-        cmd = [cmd]
-
-    logger.debug("Running command", command=cmd)
-
-    env = kwargs.pop("env", None)
-    staticx_dir = get_staticx_dir()
-    # are we running under staticx?
-    if staticx_dir is not None:
-        # if so, if "via_staticx" was requested, then run the binary with the staticx ld.so
-        # because it's supposed to be run with it.
-        if via_staticx:
-            # staticx_dir (from STATICX_BUNDLE_DIR) is where staticx has extracted all of the
-            # libraries it had collected earlier.
-            # see https://github.com/JonathonReinhart/staticx#run-time-information
-            cmd = [f"{staticx_dir}/.staticx.interp", "--library-path", staticx_dir] + cmd
-        else:
-            env = env if env is not None else os.environ.copy()
-            # ensure `TMPDIR` env is propagated to the child processes (used by staticx)
-            if "TMPDIR" not in env and "TMPDIR" in os.environ:
-                env["TMPDIR"] = os.environ["TMPDIR"]
-            # explicitly remove our directory from LD_LIBRARY_PATH
-            env["LD_LIBRARY_PATH"] = ""
-
-    if is_windows():
-        cur_preexec_fn = None  # preexec_fn is not supported on Windows platforms. subprocess.py reports this.
-    else:
-        cur_preexec_fn = kwargs.pop("preexec_fn", os.setpgrp)
-        if term_on_parent_death:
-            cur_preexec_fn = wrap_callbacks([set_child_termination_on_parent_death, cur_preexec_fn])
-
-    popen = Popen(
-        cmd,
-        stdout=kwargs.pop("stdout", subprocess.PIPE),
-        stderr=kwargs.pop("stderr", subprocess.PIPE),
-        stdin=subprocess.PIPE,
-        preexec_fn=cur_preexec_fn,
-        env=env,
-        **kwargs,
-    )
-    return popen
-
-
-def wait_event(timeout: float, stop_event: Event, condition: Callable[[], bool], interval: float = 0.1) -> None:
-    end_time = time.monotonic() + timeout
-    while True:
-        if condition():
-            break
-
-        if stop_event.wait(interval):
-            raise StopEventSetException()
-
-        if time.monotonic() > end_time:
-            raise TimeoutError()
-
-
-def poll_process(process: Popen, timeout: float, stop_event: Event) -> None:
-    try:
-        wait_event(timeout, stop_event, lambda: process.poll() is not None)
-    except StopEventSetException:
-        process.kill()
-        raise
-
-
-def remove_files_by_prefix(prefix: str) -> None:
-    for f in glob.glob(f"{prefix}*"):
-        os.unlink(f)
-
-
-def wait_for_file_by_prefix(prefix: str, timeout: float, stop_event: Event) -> Path:
-    glob_pattern = f"{prefix}*"
-    wait_event(timeout, stop_event, lambda: len(glob.glob(glob_pattern)) > 0)
-
-    output_files = glob.glob(glob_pattern)
-    # All the snapshot samples should be in one file
-    if len(output_files) != 1:
-        # this can happen if:
-        # * the profiler generating those files is erroneous
-        # * the profiler received many signals (and it generated files based on signals)
-        # * errors in gProfiler left previous output files in place, not removed
-        # in any case, we remove all old files, and assume the last one (after sorting by timestamp)
-        # is the one we want.
-        logger.warning(
-            f"One output file expected, but found {len(output_files)}."
-            f" Removing all and using the last one. {output_files}"
-        )
-        # timestamp format guarantees alphabetical order == chronological order.
-        output_files.sort()
-        for f in output_files[:-1]:
-            os.unlink(f)
-        output_files = output_files[-1:]
-
-    return Path(output_files[0])
-
-
-def reap_process(process: Popen) -> Tuple[int, bytes, bytes]:
-    """
-    Safely reap a process. This function expects the process to be exited or exiting.
-    It uses communicate() instead of wait() to avoid the possible deadlock in wait()
-    (see https://docs.python.org/3/library/subprocess.html#subprocess.Popen.wait, and see
-    ticket https://github.com/Granulate/gprofiler/issues/744).
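    Illustrative usage (editor's sketch, not from the original code):

        proc = Popen(["true"], stdout=subprocess.PIPE, stderr=subprocess.PIPE)
        returncode, stdout, stderr = reap_process(proc)  # waits for exit, then reaps safely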
- """ - stdout, stderr = process.communicate() - returncode = process.poll() - assert returncode is not None # only None if child has not terminated - return returncode, stdout, stderr - - -def _kill_and_reap_process(process: Popen, kill_signal: signal.Signals) -> Tuple[int, bytes, bytes]: - process.send_signal(kill_signal) - logger.debug( - f"({process.args!r}) was killed by us with signal {kill_signal} due to timeout or stop request, reaping it" - ) - return reap_process(process) - - -def run_process( - cmd: Union[str, List[str]], - *, - stop_event: Event = None, - suppress_log: bool = False, - via_staticx: bool = False, - check: bool = True, - timeout: int = None, - kill_signal: signal.Signals = signal.SIGTERM if is_windows() else signal.SIGKILL, - stdin: bytes = None, - **kwargs: Any, -) -> "CompletedProcess[bytes]": - stdout: bytes - stderr: bytes - - reraise_exc: Optional[BaseException] = None - with start_process(cmd, via_staticx, **kwargs) as process: - assert isinstance(process.args, str) or ( - isinstance(process.args, list) and all(isinstance(s, str) for s in process.args) - ), process.args # mypy - - try: - if stdin is not None: - assert process.stdin is not None - process.stdin.write(stdin) - if stop_event is None: - assert timeout is None, f"expected no timeout, got {timeout!r}" - # wait for stderr & stdout to be closed - stdout, stderr = process.communicate() - else: - end_time = (time.monotonic() + timeout) if timeout is not None else None - while True: - try: - stdout, stderr = process.communicate(timeout=1) - break - except TimeoutExpired: - if stop_event.is_set(): - raise ProcessStoppedException from None - if end_time is not None and time.monotonic() > end_time: - assert timeout is not None - raise - except TimeoutExpired: - returncode, stdout, stderr = _kill_and_reap_process(process, kill_signal) - assert timeout is not None - reraise_exc = CalledProcessTimeoutError( - timeout, returncode, cmd, stdout.decode("latin-1"), stderr.decode("latin-1") - ) - except BaseException as e: # noqa - returncode, stdout, stderr = _kill_and_reap_process(process, kill_signal) - reraise_exc = e - retcode = process.poll() - assert retcode is not None # only None if child has not terminated - - result: CompletedProcess[bytes] = CompletedProcess(process.args, retcode, stdout, stderr) - - # decoding stdout/stderr as latin-1 which should never raise UnicodeDecodeError. - extra: Dict[str, Any] = {"exit_code": result.returncode} - if not suppress_log: - if result.stdout: - extra["stdout"] = result.stdout.decode("latin-1") - if result.stderr: - extra["stderr"] = result.stderr.decode("latin-1") - logger.debug("Command exited", command=process.args, **extra) - if reraise_exc is not None: - raise reraise_exc - elif check and retcode != 0: - raise CalledProcessError( - retcode, process.args, output=stdout.decode("latin-1"), stderr=stderr.decode("latin-1") - ) - return result - - if is_windows(): def pgrep_exe(match: str) -> List[Process]: @@ -343,215 +71,52 @@ def pgrep_exe(match: str) -> List[Process]: return procs -def pgrep_maps(match: str) -> List[Process]: - # this is much faster than iterating over processes' maps with psutil. 
- # We use flag -E in grep to support systems where grep is not PCRE - result = run_process( - f"grep -lE '{match}' /proc/*/maps", - stdout=subprocess.PIPE, - stderr=subprocess.PIPE, - shell=True, - suppress_log=True, - check=False, - ) - # 0 - found - # 1 - not found - # 2 - error (which we might get for a missing /proc/pid/maps file of a process which just exited) - # so this ensures grep wasn't killed by a signal - assert result.returncode in ( - 0, - 1, - 2, - ), f"unexpected 'grep' exit code: {result.returncode}, stdout {result.stdout!r} stderr {result.stderr!r}" - - error_lines = [] - for line in result.stderr.splitlines(): - if not ( - line.startswith(b"grep: /proc/") - and (line.endswith(b"/maps: No such file or directory") or line.endswith(b"/maps: No such process")) - ): - error_lines.append(line) - if error_lines: - logger.error(f"Unexpected 'grep' error output (first 10 lines): {error_lines[:10]}") - - processes: List[Process] = [] - for line in result.stdout.splitlines(): - assert line.startswith(b"/proc/") and line.endswith(b"/maps"), f"unexpected 'grep' line: {line!r}" - pid = int(line[len(b"/proc/") : -len(b"/maps")]) - try: - processes.append(Process(pid)) - except psutil.NoSuchProcess: - continue # process might have died meanwhile - - return processes - - -def get_iso8601_format_time_from_epoch_time(time: float) -> str: - return get_iso8601_format_time(datetime.datetime.utcfromtimestamp(time)) - - -def get_iso8601_format_time(time: datetime.datetime) -> str: - return time.replace(microsecond=0).isoformat() - - -def remove_prefix(s: str, prefix: str) -> str: - # like str.removeprefix of Python 3.9, but this also ensures the prefix exists. - assert s.startswith(prefix), f"{s} doesn't start with {prefix}" - return s[len(prefix) :] - - -def touch_path(path: str, mode: int) -> None: - Path(path).touch() - # chmod() afterwards (can't use 'mode' in touch(), because it's affected by umask) - os.chmod(path, mode) - - -def remove_path(path: Union[str, Path], missing_ok: bool = False) -> None: - # backporting missing_ok, available only from 3.8 - try: - Path(path).unlink() - except FileNotFoundError: - if not missing_ok: - raise - - -@contextmanager -def removed_path(path: str) -> Iterator[None]: - try: - yield - finally: - remove_path(path, missing_ok=True) - - -_INSTALLED_PROGRAMS_CACHE: List[str] = [] - - -def assert_program_installed(program: str) -> None: - if program in _INSTALLED_PROGRAMS_CACHE: - return - - if shutil.which(program) is not None: - _INSTALLED_PROGRAMS_CACHE.append(program) - else: - raise ProgramMissingException(program) - - -def grab_gprofiler_mutex() -> bool: - """ - Implements a basic, system-wide mutex for gProfiler, to make sure we don't run 2 instances simultaneously. - The mutex is implemented by a Unix domain socket bound to an address in the abstract namespace of the init - network namespace. This provides automatic cleanup when the process goes down, and does not make any assumption - on filesystem structure (as happens with file-based locks). - In order to see who's holding the lock now, you can run "sudo netstat -xp | grep gprofiler". - """ - GPROFILER_LOCK = "\x00gprofiler_lock" - - try: - run_in_ns(["net"], lambda: try_acquire_mutex(GPROFILER_LOCK)) - except CouldNotAcquireMutex: - print( - "Could not acquire gProfiler's lock. Is it already running?" 
- " Try 'sudo netstat -xp | grep gprofiler' to see which process holds the lock.", - file=sys.stderr, - ) - return False - else: - # success - return True - - -def atomically_symlink(target: str, link_node: str) -> None: - """ - Create a symlink file at 'link_node' pointing to 'target'. - If a file already exists at 'link_node', it is replaced atomically. - Would be obsoloted by https://bugs.python.org/issue36656, which covers this as well. - """ - tmp_path = link_node + ".tmp" - os.symlink(target, tmp_path) - os.rename(tmp_path, link_node) - - -class TemporaryDirectoryWithMode(TemporaryDirectory): - def __init__(self, *args: Any, mode: int = None, **kwargs: Any): - super().__init__(*args, **kwargs) - if mode is not None: - os.chmod(self.name, mode) - - -def reset_umask() -> None: - """ - Resets our umask back to a sane value. - """ - os.umask(0o022) - - -def limit_frequency( - limit: Optional[int], - requested: int, - msg_header: str, - runtime_logger: logging.LoggerAdapter, - profiling_mode: str, -) -> int: - if profiling_mode != CPU_PROFILING_MODE: - return requested - - if limit is not None and requested > limit: - runtime_logger.warning( - f"{msg_header}: Requested frequency ({requested}) is higher than the limit {limit}, " - f"limiting the frequency to the limit ({limit})" - ) - return limit - - return requested - - -def random_prefix() -> str: - return "".join(random.choice(string.ascii_letters) for _ in range(16)) - - -PERF_EVENT_MLOCK_KB = "/proc/sys/kernel/perf_event_mlock_kb" - - -def read_perf_event_mlock_kb() -> int: - return int(Path(PERF_EVENT_MLOCK_KB).read_text()) - - -def write_perf_event_mlock_kb(value: int) -> None: - Path(PERF_EVENT_MLOCK_KB).write_text(str(value)) - - -def is_pyinstaller() -> bool: - """ - Are we running in PyInstaller? 
- """ - # https://pyinstaller.readthedocs.io/en/stable/runtime-information.html#run-time-information - return getattr(sys, "frozen", False) and hasattr(sys, "_MEIPASS") +def set_child_termination_on_parent_death() -> int: + return _utils.set_child_termination_on_parent_death(logger) -def get_staticx_dir() -> Optional[str]: - return os.getenv("STATICX_BUNDLE_DIR") +def start_process( + cmd: Union[str, List[str]], + via_staticx: bool = False, + term_on_parent_death: bool = True, + **kwargs: Any, +) -> Popen: + return _utils.start_process(cmd, via_staticx, term_on_parent_death, **kwargs) -def add_permission_dir(path: str, permission_for_file: int, permission_for_dir: int) -> None: - os.chmod(path, os.stat(path).st_mode | permission_for_dir) - for subpath in os.listdir(path): - absolute_subpath = os.path.join(path, subpath) - if os.path.isdir(absolute_subpath): - add_permission_dir(absolute_subpath, permission_for_file, permission_for_dir) - else: - os.chmod(absolute_subpath, os.stat(absolute_subpath).st_mode | permission_for_file) +def wait_for_file_by_prefix( + prefix: str, + timeout: float, + stop_event: Event, +) -> Path: + return _utils.wait_for_file_by_prefix(prefix, timeout, stop_event, logger) -def merge_dicts(source: Dict[str, Any], dest: Dict[str, Any]) -> Dict[str, Any]: - for key, value in source.items(): - # in case value is a dict itself - if isinstance(value, dict): - node = dest.setdefault(key, {}) - merge_dicts(value, node) - else: - dest[key] = value - return dest +def run_process( + cmd: Union[str, List[str]], + *, + stop_event: Event = None, + suppress_log: bool = False, + via_staticx: bool = False, + check: bool = True, + timeout: int = None, + kill_signal: signal.Signals = signal.SIGTERM if is_windows() else signal.SIGKILL, + stdin: bytes = None, + **kwargs: Any, +) -> "CompletedProcess[bytes]": + return _utils.run_process( + cmd, + logger, + stop_event=stop_event, + suppress_log=suppress_log, + via_staticx=via_staticx, + check=check, + timeout=timeout, + kill_signal=kill_signal, + stdin=stdin, + **kwargs, + ) -def is_profiler_disabled(profile_mode: str) -> bool: - return profile_mode in ("none", "disabled") +def pgrep_maps(match: str) -> List[Process]: + return _utils.pgrep_maps(match, logger)