Skip to content

Commit

Permalink
Merge branch 'main' into refactor
Browse files Browse the repository at this point in the history
  • Loading branch information
liulx20 authored Jan 16, 2025
2 parents 81c0fae + a60e912 commit 6843a29
Show file tree
Hide file tree
Showing 49 changed files with 3,596 additions and 121 deletions.
23 changes: 23 additions & 0 deletions .github/workflows/interactive.yml
Original file line number Diff line number Diff line change
Expand Up @@ -218,6 +218,7 @@ jobs:



- name: Sample Query test
env:
GS_TEST_DIR: ${{ github.workspace }}/gstest
Expand Down Expand Up @@ -309,6 +310,28 @@ jobs:
cd ${GITHUB_WORKSPACE}/interactive_engine/
mvn clean install -Pexperimental -DskipTests -q
- name: Test physical plan generation
run: |
cd ${GITHUB_WORKSPACE}/interactive_engine
cat > /tmp/physical_plan_gen_config.yaml <<EOF
compiler:
planner:
is_on: true
opt: CBO
rules:
- FilterIntoJoinRule
- FilterMatchRule
- NotMatchToAntiJoinRule
physical.opt.config: proto
EOF
echo " meta.reader.schema.uri: ${GITHUB_WORKSPACE}/flex/interactive/examples/modern_graph/graph.yaml" >> /tmp/physical_plan_gen_config.yaml
echo " meta.reader.statistics.uri: ${GITHUB_WORKSPACE}/interactive_engine/compiler/src/test/resources/statistics/modern_statistics.json" >> /tmp/physical_plan_gen_config.yaml
mvn clean install -DskipTests -Pgraph-planner-jni
INTERACTIVE_ENGINE_HOME=${GITHUB_WORKSPACE}/interactive_engine
./target/native/test_graph_planner ${INTERACTIVE_ENGINE_HOME}/compiler/target/compiler-0.0.1-SNAPSHOT.jar:${INTERACTIVE_ENGINE_HOME}/compiler/target/libs/ ${INTERACTIVE_ENGINE_HOME}/executor/ir/target/release/libir_core.so \
${GITHUB_WORKSPACE}/flex/interactive/examples/modern_graph/graph.yaml ${INTERACTIVE_ENGINE_HOME}/compiler/src/test/resources/statistics/modern_statistics.json \
"MATCH(n) return count(n);" /tmp/physical_plan_gen_config.yaml
- name: Run End-to-End cypher adhoc ldbc query test
env:
GS_TEST_DIR: ${{ github.workspace }}/gstest
Expand Down
4 changes: 2 additions & 2 deletions analytical_engine/apps/pregel/louvain/louvain_app_base.h
Original file line number Diff line number Diff line change
Expand Up @@ -223,11 +223,11 @@ class LouvainAppBase
auto actual_quality =
ctx.compute_context().template get_aggregated_value<double>(
actual_quality_aggregator);
assert(actual_quality <= 1.0);
// after one pass if already decided halt, that means the pass yield no
// changes, so we halt computation.
if (current_super_step <= 14 ||
std::fabs(actual_quality - ctx.prev_quality()) <
min_quality_improvement) {
(actual_quality - ctx.prev_quality()) <= min_quality_improvement) {
// turn to sync community result
ctx.compute_context().set_superstep(sync_result_step);
syncCommunity(frag, ctx, messages);
Expand Down
13 changes: 1 addition & 12 deletions analytical_engine/apps/pregel/louvain/louvain_vertex.h
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,7 @@ class LouvainVertex : public PregelVertex<FRAG_T, VD_T, MD_T> {

size_t edge_size() {
if (!this->use_fake_edges()) {
return this->incoming_edges().Size() + this->outgoing_edges().Size();
return this->outgoing_edges().Size();
} else {
return this->fake_edges().size();
}
Expand All @@ -88,11 +88,6 @@ class LouvainVertex : public PregelVertex<FRAG_T, VD_T, MD_T> {

edata_t get_edge_value(const vid_t& dst_id) {
if (!this->use_fake_edges()) {
for (auto& edge : this->incoming_edges()) {
if (this->fragment_->Vertex2Gid(edge.get_neighbor()) == dst_id) {
return static_cast<edata_t>(edge.get_data());
}
}
for (auto& edge : this->outgoing_edges()) {
if (this->fragment_->Vertex2Gid(edge.get_neighbor()) == dst_id) {
return static_cast<edata_t>(edge.get_data());
Expand All @@ -117,12 +112,6 @@ class LouvainVertex : public PregelVertex<FRAG_T, VD_T, MD_T> {
edata_t get_edge_values(const std::set<vid_t>& dst_ids) {
edata_t ret = 0;
if (!this->use_fake_edges()) {
for (auto& edge : this->incoming_edges()) {
auto gid = this->fragment_->Vertex2Gid(edge.get_neighbor());
if (dst_ids.find(gid) != dst_ids.end()) {
ret += static_cast<edata_t>(edge.get_data());
}
}
for (auto& edge : this->outgoing_edges()) {
auto gid = this->fragment_->Vertex2Gid(edge.get_neighbor());
if (dst_ids.find(gid) != dst_ids.end()) {
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -113,11 +113,11 @@ public void receiveMessages() {
///////////////////////////////////////////
bytesOfReceivedMsg += tmpVector.size();
}
tmpVector.delete();
logger.info(
"Frag [{}] totally Received [{}] bytes from others starting deserialization",
fragId,
bytesOfReceivedMsg);
tmpVector.delete();
}

/**
Expand Down Expand Up @@ -256,5 +256,9 @@ public void postSuperstep() {
}

@Override
public void postApplication() {}
public void postApplication() {
for (int i = 0; i < fragNum; ++i) {
cacheOut[i].close();
}
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,11 @@ public FFIByteVectorOutputStream(FFIByteVector vector) {
offset = 0;
}

@Override
public void close() {
vector.delete();
}

public void resize(long size) {
vector.resize(size);
}
Expand Down Expand Up @@ -412,9 +417,4 @@ public void write(int b) throws IOException {
vector.setRawByte(offset, (byte) b);
offset += 1;
}

@Override
public void close() throws IOException {
vector.delete();
}
}
1 change: 1 addition & 0 deletions docs/index.rst
Original file line number Diff line number Diff line change
Expand Up @@ -74,6 +74,7 @@ and the vineyard store that offers efficient in-memory data transfers.
interactive_engine/tinkerpop_eco
interactive_engine/neo4j_eco
interactive_engine/gopt
interactive_engine/graph_planner
interactive_engine/benchmark_tool
.. interactive_engine/guide_and_examples
interactive_engine/design_of_gie
Expand Down
234 changes: 234 additions & 0 deletions docs/interactive_engine/graph_planner.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,234 @@
# Graph Planner Interface by JNI and RESTful API

`GraphPlanner` is the primary entry point for GOpt’s query optimization and physical plan generation. Originally, it was tightly integrated into the Frontend service, where it optimized Cypher queries received via the Bolt protocol and generated execution plans for various backend engines.

To enhance its flexibility and ease of integration, `GraphPlanner` is now available as a standalone module, free from any dependencies on other Frontend modules. It supports both JNI and RESTful API interfaces, enabling lightweight and straightforward integration into diverse systems. Whether you are working on a native application or web-based services, `GraphPlanner` can seamlessly integrate into your architecture, providing efficient query optimization and physical plan generation across a wide range of use cases.


## JNI API

### Interface Overview

We provide a c++ wrapper implementation `GraphPlannerWrapper` for the JNI interface. Here is a brief explanation of the logical interface provided by the `c++` class.

Constructor:

```cpp
/**
* @brief Constructs a new GraphPlannerWrapper object
* @param java_path Java class path
* @param jna_path JNA library path
* @param graph_schema_yaml Path to the graph schema file in YAML format (optional)
* @param graph_statistic_json Path to the graph statistics file in JSON format (optional)
*/
GraphPlannerWrapper(const std::string &java_path,
const std::string &jna_path,
const std::string &graph_schema_yaml = "",
const std::string &graph_statistic_json = "");
```
Method:
```cpp
/**
* @brief Compile a cypher query to a physical plan by JNI invocation.
* @param compiler_config_path The path of compiler config file.
* @param cypher_query_string The cypher query string.
* @param graph_schema_yaml Content of the graph schema in YAML format
* @param graph_statistic_json Content of the graph statistics in JSON format
* @return The physical plan in bytes and result schema in yaml.
*/
Plan GraphPlannerWrapper::CompilePlan(const std::string &compiler_config_path,
const std::string &cypher_query_string,
const std::string &graph_schema_yaml,
const std::string &graph_statistic_json)
```

### Getting Started
Follow the steps below to get started with the Graph Planner interface for c++ invocation.

#### Step 1: Build the Project

Navigate to the project directory and build the package using Maven:
```bash
cd interactive_engine
mvn clean package -DskipTests -Pgraph-planner-jni
```

#### Step 2: Locate and Extract the Package

After the build completes, a tarball named `graph-planner-jni.tar.gz` will be available in the `assembly/target` directory. Extract the contents of the tarball:

```bash
cd assembly/target
tar xvzf graph-planner-jni.tar.gz
cd graph-planner-jni
```

#### Step 3: Run the Example Binary

To demonstrate the usage of the JNI interface, an example binary `test_graph_planner` is provided. Use the following command to execute it:

```bash
# bin/test_graph_planner <java class path> <jna lib path> <graph schema path> <graph statistics path> <query> <config path>
bin/test_graph_planner libs native ./conf/graph.yaml ./conf/modern_statistics.json "MATCH (n) RETURN n, COUNT(n);" ./conf/gs_interactive_hiactor.yaml
```

The output consists of the physical plan (in byte format) and the result schema (in YAML format). The physical plan adheres to the specifications defined in the [protobuf]().

Below is an example of a result schema:

```yaml
schema:
name: default
description: default desc
mode: READ
extension: .so
library: libdefault.so
params: []
returns:
- name: n
type: {primitive_type: DT_UNKNOWN}
- name: $f1
type: {primitive_type: DT_SIGNED_INT64}
type: UNKNOWN
query: MATCH (n) RETURN n, COUNT(n);
```
The `returns` field defines the structure of the data returned by backend engines. Each nested entry in the returns field includes three components:
- the column name, which specifies the name of the result column;
- the entry’s ordinal position, which determines the column ID;
- the type, which enforces the data type constraint for the column.

## Restful API

We provide an alternative method to expose the interface as a RESTful API. Follow the steps below to access the interface via REST.

### Getting Started

#### Step 1: Build the Project

To build the project, run the following command:
```bash
cd interactive_engine
# Use '-Dskip.native=true' to skip compiling C++ native code
mvn clean package -DskipTests -Pgraph-planner-jni -Dskip.native=true
```

#### Step 2: Locate and Extract the Package

Once the build completes, a tarball named graph-planner-jni.tar.gz will be available in the assembly/target directory. Extract the contents as follows:

```bash
cd assembly/target
tar xvzf graph-planner-jni.tar.gz
cd graph-planner-jni
```

#### Step 3: Start the Graph Planner RESTful Service

To start the service, run the following command:

```bash
java -cp ".:./libs/*" com.alibaba.graphscope.sdk.restful.GraphPlannerService --spring.config.location=./conf/application.yaml
```

#### Step 4: Access the RESTful API by `Curl`

To send a request to the RESTful API, use the following `curl` command:

```bash
curl -X POST http://localhost:8080/api/compilePlan \
-H "Content-Type: application/json" \
-d "{
\"configPath\": \"$configPath\",
\"query\": \"$query\",
\"schemaYaml\": \"$schemaYaml\",
\"statsJson\": \"$statsJson\"
}"
```

Replace `$configPath`, `$query`, `$schemaYaml`, and `$statsJson` with the appropriate values.

The response will be in JSON format, similar to:

```json
{
"graphPlan": {
"physicalBytes": "",
"resultSchemaYaml": ""
}
}
```

The response contains two fields:
1. physicalBytes: A Base64-encoded string representing the physical plan bytes.
2. resultSchemaYaml: A string representing the YAML schema.

You can decode these values into the required structures.

#### Step 4: Access the RESTful API by `Java` Sdk

Alternatively, if you are a java-side user, we provide a java sdk example to guide you how to access the restful API and decode the response :

```java
public static void main(String[] args) throws Exception {
if (args.length < 4) {
System.out.println("Usage: <configPath> <query> <schemaPath> <statsPath>");
System.exit(1);
}
// set request body in json format
String jsonPayLoad = createParameters(args[0], args[1], args[2], args[3]).toString();
HttpClient client = HttpClient.newBuilder().build();
// create http request, set header and body content
HttpRequest request =
HttpRequest.newBuilder()
.uri(URI.create("http://localhost:8080/api/compilePlan"))
.setHeader("Content-Type", "application/json")
.POST(
HttpRequest.BodyPublishers.ofString(
jsonPayLoad, StandardCharsets.UTF_8))
.build();
// send request and get response
HttpResponse<String> response = client.send(request, HttpResponse.BodyHandlers.ofString());
String body = response.body();
// parse response body as json
JsonNode planNode = (new ObjectMapper()).readTree(body).get("graphPlan");
// print result
System.out.println(getPhysicalPlan(planNode));
System.out.println(getResultSchemaYaml(planNode));
}
private static JsonNode createParameters(
String configPath, String query, String schemaPath, String statsPath) throws Exception {
Map<String, String> params =
ImmutableMap.of(
"configPath",
configPath,
"query",
query,
"schemaYaml",
FileUtils.readFileToString(new File(schemaPath), StandardCharsets.UTF_8),
"statsJson",
FileUtils.readFileToString(new File(statsPath), StandardCharsets.UTF_8));
return (new ObjectMapper()).valueToTree(params);
}
// get base64 string from json, convert it to physical bytes , then parse it to PhysicalPlan
private static GraphAlgebraPhysical.PhysicalPlan getPhysicalPlan(JsonNode planNode)
throws Exception {
String base64Str = planNode.get("physicalBytes").asText();
byte[] bytes = java.util.Base64.getDecoder().decode(base64Str);
return GraphAlgebraPhysical.PhysicalPlan.parseFrom(bytes);
}
// get result schema yaml from json
private static String getResultSchemaYaml(JsonNode planNode) {
return planNode.get("resultSchemaYaml").asText();
}
```

Run the java sdk example with the following command:
```bash
java -cp ".:./libs/*" com.alibaba.graphscope.sdk.examples.TestGraphPlanner ./conf/gs_interactive_hiactor.yaml "Match (n) Return n;" ./conf/graph.yaml ./conf/modern_statistics.json
```
Loading

0 comments on commit 6843a29

Please sign in to comment.