Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat(interactive): Implement a c++ wrapper for compiler's GraphPlanner #4310

Merged
merged 33 commits into from
Jan 14, 2025
Merged
Show file tree
Hide file tree
Changes from 4 commits
Commits
Show all changes
33 commits
Select commit Hold shift + click to select a range
87e948a
add impl
zhanglei1949 Nov 4, 2024
dbde861
merge
zhanglei1949 Nov 4, 2024
ba68cb5
call-compiler-via-jni
zhanglei1949 Nov 4, 2024
ef312c9
fixing ci
zhanglei1949 Nov 4, 2024
ee687ec
add guard to control jni or subprocess
zhanglei1949 Nov 8, 2024
65b049e
support jni or pip3
zhanglei1949 Nov 11, 2024
bc71bf6
introduce c++ wrapper for graph planner
shirly121 Dec 10, 2024
0198fe8
Merge remote-tracking branch 'origin/main' into call-compiler-via-jni
shirly121 Dec 10, 2024
93b43fa
fix compilation
zhanglei1949 Dec 11, 2024
837a07e
set cxx_standard 17 to use filesystem
zhanglei1949 Dec 11, 2024
ad49402
add graph-planner-jni in root pom
shirly121 Dec 11, 2024
f55eed6
remove the cargo build phase from mvn build
shirly121 Dec 11, 2024
ce0bbc4
fix compiling errors in mac os
shirly121 Dec 11, 2024
8e3cb54
minor fix
shirly121 Dec 11, 2024
7ffc2e4
fix bugs of jni building and add readme
shirly121 Dec 11, 2024
8617793
refine jni interface, accept graph schema and statistics in string
shirly121 Dec 11, 2024
e217d75
expose 'compilePlan' interface by restful api
shirly121 Dec 12, 2024
f23b478
impl GraphPlanner as single instance to avoid creation overhead in ea…
shirly121 Dec 12, 2024
0c6f3fd
add function uri in yaml configs
shirly121 Jan 8, 2025
85855b9
minor fix
shirly121 Jan 8, 2025
6b0c2d9
Merge remote-tracking branch 'origin/main' into call-compiler-via-jni
shirly121 Jan 9, 2025
e34049a
add docs for graph planner interface
shirly121 Jan 9, 2025
f8e2140
revert changes to parent pom
shirly121 Jan 9, 2025
eb4edc3
revert changes to compiler conf
shirly121 Jan 10, 2025
f251452
fix hiactor config used for graph planner jni examples
shirly121 Jan 10, 2025
3737edc
Merge remote-tracking branch 'origin/main' into call-compiler-via-jni
shirly121 Jan 10, 2025
f8b406a
revert space
zhanglei1949 Jan 10, 2025
8e7fcdc
fix ci bugs of gs interactive
shirly121 Jan 10, 2025
6834ac9
Merge branch 'call-compiler-via-jni' of https://github.com/zhanglei19…
shirly121 Jan 10, 2025
ecfacd4
add basic type proto in CMakeLists
shirly121 Jan 10, 2025
cc6dfc1
fix bugs of reading query in graph planner
shirly121 Jan 10, 2025
4347546
fixing workflow
zhanglei1949 Jan 13, 2025
8cb0b05
Merge remote-tracking branch 'upstream/main' into call-compiler-via-jni
liulx20 Jan 13, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
21 changes: 21 additions & 0 deletions .github/workflows/interactive.yml
Original file line number Diff line number Diff line change
Expand Up @@ -317,6 +317,27 @@ jobs:
cd ${GITHUB_WORKSPACE}/interactive_engine/
mvn clean install -Pexperimental -DskipTests -q

- name: Test physical plan generation
run: |
cd ${GITHUB_WORKSPACE}/flex/build
cat > /tmp/physical_plan_gen_config.yaml <<EOF
compiler:
planner:
is_on: true
opt: CBO
rules:
- FilterIntoJoinRule
- FilterMatchRule
- NotMatchToAntiJoinRule
physical.opt.config: proto
EOF
echo " meta.reader.schema.uri: ${GITHUB_WORKSPACE}/flex/interactive/examples/modern_graph/graph.yaml" >> /tmp/physical_plan_gen_config.yaml
echo " meta.reader.statistics.uri: ${GITHUB_WORKSPACE}/interactive_engine/compiler/src/test/resources/statistics/modern_statistics.json" >> /tmp/physical_plan_gen_config.yaml

./tests/planner/graph_planner_test ${GITHUB_WORKSPACE}/interactive_engine/compiler/target/compiler-0.0.1-SNAPSHOT.jar:${GITHUB_WORKSPACE}/interactive_engine/compiler/target/libs/ \
${GITHUB_WORKSPACE}/interactive_engine/executor/ir/target/release/ ${GITHUB_WORKSPACE}/flex/interactive/examples/modern_graph/graph.yaml \
/tmp/physical_plan_gen_config.yaml "MATCH(n) return count(n);"

- name: Run End-to-End cypher adhoc ldbc query test
env:
GS_TEST_DIR: ${{ github.workspace }}/gstest
Expand Down
10 changes: 10 additions & 0 deletions flex/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -93,6 +93,15 @@ find_package(libgrapelite REQUIRED)
include_directories(SYSTEM ${LIBGRAPELITE_INCLUDE_DIRS})
include_directories(SYSTEM ${LIBGRAPELITE_INCLUDE_DIRS}/grape/analytical_apps)

# find JNI-----------------------------------------------------------------------
find_package(JNI REQUIRED)
if (JNI_FOUND)
include_directories(SYSTEM ${JAVA_INCLUDE_PATH})
include_directories(SYSTEM ${JAVA_INCLUDE_PATH2})
else()
message(FATAL_ERROR "JNI not found")
endif()

# find Threads------------------------------------------------------------------
set(CMAKE_THREAD_PREFER_PTHREAD ON)
find_package(Threads REQUIRED)
Expand Down Expand Up @@ -233,6 +242,7 @@ endif()
if (BUILD_TEST)
add_subdirectory(tests)
endif()
add_subdirectory(planner)


configure_file(${CMAKE_CURRENT_SOURCE_DIR}/flex-config.in.cmake
Expand Down
5 changes: 5 additions & 0 deletions flex/planner/CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
file(GLOB_RECURSE PLANNER_SRC_FILES "${CMAKE_CURRENT_SOURCE_DIR}/*.cc")

add_library(graph_planner SHARED ${PLANNER_SRC_FILES})
target_link_libraries(graph_planner PUBLIC flex_plan_proto ${CMAKE_JNI_LINKER_FLAGS} ${JAVA_JVM_LIBRARY} ${JNI_LIBRARIES})
target_include_directories(graph_planner PUBLIC $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}>)
3 changes: 3 additions & 0 deletions flex/planner/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
# GraphScope Interactive Query Planner

This directory contains the c++ wrapper of Interactive Query Planner, which is implemented in [java](https://github.com/alibaba/GraphScope/tree/main/interactive_engine/compiler).
235 changes: 235 additions & 0 deletions flex/planner/graph_planner.cc
Original file line number Diff line number Diff line change
@@ -0,0 +1,235 @@
/** Copyright 2020 Alibaba Group Holding Limited.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

#include <flex/planner/graph_planner.h>

namespace gs {
namespace jni {

static JavaVM* _jvm = NULL;

JavaVM* CreateJavaVM(const std::string& jvm_options) {
const char *p, *q;
const char* jvm_opts;
if (jvm_options.empty()) {
jvm_opts = getenv("FLEX_JVM_OPTS");
} else {
jvm_opts = jvm_options.c_str();
}
if (jvm_opts == NULL) {
LOG(FATAL) << "Expect FLEX_JVM_OPTS set before initiate jvm";
return NULL;
}
VLOG(1) << "Jvm opts str: " << jvm_opts;

if (*jvm_opts == '\0')
return NULL;

int num_of_opts = 1;
for (const char* p = jvm_opts; *p; p++) {
if (*p == ' ')
num_of_opts++;
}

if (num_of_opts == 0)
return NULL;

JavaVM* jvm = NULL;
JNIEnv* env = NULL;
int i = 0;
int status = 1;
JavaVMInitArgs vm_args;

JavaVMOption* options = new JavaVMOption[num_of_opts];
memset(options, 0, sizeof(JavaVMOption) * num_of_opts);

for (p = q = jvm_opts;; p++) {
if (*p == ' ' || *p == '\0') {
if (q >= p) {
goto ret;
}
char* opt = new char[p - q + 1];
memcpy(opt, q, p - q);
opt[p - q] = '\0';
options[i++].optionString = opt;
q = p + 1; // assume opts are separated by single space
if (*p == '\0')
break;
}
}

memset(&vm_args, 0, sizeof(vm_args));
vm_args.version = JNI_VERSION_1_8;
vm_args.nOptions = num_of_opts;
vm_args.options = options;

status = JNI_CreateJavaVM(&jvm, reinterpret_cast<void**>(&env), &vm_args);
if (status == JNI_OK) {
LOG(INFO) << "Create java virtual machine successfully.";
} else if (status == JNI_EEXIST) {
VLOG(1) << "JNI evn already exists.";
} else {
LOG(ERROR) << "Error, create java virtual machine failed. return JNI_CODE ("
<< status << ")\n";
}

ret:
for (int i = 0; i < num_of_opts; i++) {
delete[] options[i].optionString;
}
delete[] options;
return jvm;
}

// One process can only create jvm for once.

Check notice on line 96 in flex/planner/graph_planner.cc

View check run for this annotation

codefactor.io / CodeFactor

flex/planner/graph_planner.cc#L23-L96

Complex Method
JavaVM* GetJavaVM(const std::string jvm_options = "") {
if (_jvm == NULL) {
// Try to find whether there exists one javaVM
jsize nVMs;
JNI_GetCreatedJavaVMs(NULL, 0,
&nVMs); // 1. just get the required array length
VLOG(1) << "Found " << nVMs << " VMs existing in this process.";
JavaVM** buffer = new JavaVM*[nVMs];
JNI_GetCreatedJavaVMs(buffer, nVMs, &nVMs); // 2. get the data
for (auto i = 0; i < nVMs; ++i) {
if (buffer[i] != NULL) {
_jvm = buffer[i];
VLOG(1) << "Found index " << i << " VM non null "
<< reinterpret_cast<jlong>(_jvm);
return _jvm;
}
}
_jvm = CreateJavaVM(jvm_options);
VLOG(1) << "Created JVM " << reinterpret_cast<jlong>(_jvm);
}
return _jvm;
}

JNIEnvMark::JNIEnvMark() : JNIEnvMark::JNIEnvMark("") {}

JNIEnvMark::JNIEnvMark(const std::string& jvm_options) : _env(NULL) {
if (!GetJavaVM(jvm_options)) {
return;
}
int status =
GetJavaVM(jvm_options)
->AttachCurrentThread(reinterpret_cast<void**>(&_env), nullptr);
if (status != JNI_OK) {
LOG(ERROR) << "Error attach current thread: " << status;
}
}

JNIEnvMark::~JNIEnvMark() {
if (_env) {
GetJavaVM()->DetachCurrentThread();
}
}

JNIEnv* JNIEnvMark::env() { return _env; }

physical::PhysicalPlan GraphPlannerWrapper::CompilePlan(
const std::string& compiler_config_path,
const std::string& cypher_query_string) {
physical::PhysicalPlan physical_plan;
if (!is_valid()) {
LOG(ERROR) << "Invalid GraphPlannerWrapper.";
return physical_plan;
}
jstring param1 =
jni_wrapper_.env()->NewStringUTF(compiler_config_path.c_str());
jstring param2 =
jni_wrapper_.env()->NewStringUTF(cypher_query_string.c_str());

jbyteArray res = (jbyteArray) jni_wrapper_.env()->CallStaticObjectMethod(
graph_planner_clz_, graph_planner_method_id_, param1, param2);
if (jni_wrapper_.env()->ExceptionCheck()) {
jni_wrapper_.env()->ExceptionDescribe();
jni_wrapper_.env()->ExceptionClear();
LOG(ERROR) << "Error in calling GraphPlanner.";
return physical_plan;
}
if (res == NULL) {
LOG(ERROR) << "Fail to generate plan.";
return physical_plan;
}
jbyte* str = jni_wrapper_.env()->GetByteArrayElements(res, NULL);
jsize len = jni_wrapper_.env()->GetArrayLength(res);
LOG(INFO) << "Physical plan size: " << len;

physical_plan.ParseFromArray(str, len);
jni_wrapper_.env()->ReleaseByteArrayElements(res, str, 0);
jni_wrapper_.env()->DeleteLocalRef(param1);
jni_wrapper_.env()->DeleteLocalRef(param2);
jni_wrapper_.env()->DeleteLocalRef(res);

return physical_plan;
}

std::string GraphPlannerWrapper::generate_jvm_options(
const std::string java_path, const std::string& jna_path,
const std::string& graph_schema_yaml,
const std::string& graph_statistic_json) {
auto expanded_java_path = expand_directory(java_path);
VLOG(10) << "Expanded java path: " << expanded_java_path;
std::string jvm_options = "-Djava.class.path=" + expanded_java_path;
jvm_options += " -Djna.library.path=" + jna_path;
jvm_options += " -Dgraph.schema=" + graph_schema_yaml;
if (!graph_statistic_json.empty()) {
jvm_options += " -Dgraph.statistic=" + graph_statistic_json;
}
return jvm_options;
}

std::string GraphPlannerWrapper::expand_directory(const std::string& path) {
std::vector<std::string> paths;
std::string::size_type start = 0;
std::string::size_type end = path.find(':');
while (end != std::string::npos) {
auto sub_path = path.substr(start, end - start);
if (!sub_path.empty()) {
if (std::filesystem::is_directory(sub_path)) {
auto files = list_files(sub_path);
paths.insert(paths.end(), files.begin(), files.end());
} else {
paths.push_back(sub_path);
}
}
start = end + 1;
end = path.find(':', start);
}
auto sub_path = path.substr(start);
if (!sub_path.empty()) {
auto files = list_files(sub_path);
paths.insert(paths.end(), files.begin(), files.end());
}
std::stringstream ss;
for (const auto& p : paths) {
ss << p << ":";
}
return ss.str();
}

std::vector<std::string> GraphPlannerWrapper::list_files(
const std::string& path) {
// list all files in the directory
std::vector<std::string> files;
for (const auto& entry : std::filesystem::directory_iterator(path)) {
files.push_back(entry.path().string());
}
return files;
}

} // namespace jni
} // namespace gs
Loading
Loading