From bc1aac650fe8498cb0186e67800ebb4760ecb578 Mon Sep 17 00:00:00 2001 From: Shylock Hg <33566796+Shylock-Hg@users.noreply.github.com> Date: Thu, 9 Dec 2021 15:44:44 +0800 Subject: [PATCH] Feature/view vertices edges (#3320) * Scan multiple parts. * Add multiple parts test case. * Add limit test. * Remove unused include. * Support multiple tags. * Fix license header. * Optimize the extra read operations. * Fix compile error. * Skip invalid tag in one loop. * Avoid extra logical. * Add scan executors. * Add scan entry of match. * Format. * Push filter down to ScanVertices. * Push filter over AppendVertices. * Remove unused code. * Support push limit down to scan vertices. * Fix vfilter push down. * Transforme traverse to get edges. * Push limit to scan edges. * Check limit for scan. * Revert test cases. * Resolve conflict. * Remove redundant line. Co-authored-by: cpw <13495049+CPWstatic@users.noreply.github.com> --- src/clients/storage/StorageClient.cpp | 10 +- src/clients/storage/StorageClient.h | 10 +- src/common/meta/SchemaManager.cpp | 12 ++ src/common/meta/SchemaManager.h | 2 + src/graph/context/ast/CypherAstContext.h | 2 + src/graph/executor/CMakeLists.txt | 2 + src/graph/executor/Executor.cpp | 8 + src/graph/executor/query/GetPropExecutor.h | 3 +- .../executor/query/ScanEdgesExecutor.cpp | 50 ++++++ src/graph/executor/query/ScanEdgesExecutor.h | 22 +++ .../executor/query/ScanVerticesExecutor.cpp | 50 ++++++ .../executor/query/ScanVerticesExecutor.h | 26 +++ src/graph/optimizer/CMakeLists.txt | 5 + .../optimizer/rule/GetEdgesTransformRule.cpp | 129 ++++++++++++++ .../optimizer/rule/GetEdgesTransformRule.h | 45 +++++ .../rule/PushFilterDownScanVerticesRule.cpp | 99 +++++++++++ .../rule/PushFilterDownScanVerticesRule.h | 30 ++++ .../PushLimitDownScanAppendVerticesRule.cpp | 104 ++++++++++++ .../PushLimitDownScanAppendVerticesRule.h | 30 ++++ ...shLimitDownScanEdgesAppendVerticesRule.cpp | 113 +++++++++++++ ...PushLimitDownScanEdgesAppendVerticesRule.h | 30 ++++ .../rule/PushVFilterDownScanVerticesRule.cpp | 126 ++++++++++++++ .../rule/PushVFilterDownScanVerticesRule.h | 31 ++++ src/graph/planner/CMakeLists.txt | 1 + src/graph/planner/PlannersRegister.cpp | 6 + src/graph/planner/match/ScanSeek.cpp | 103 ++++++++++++ src/graph/planner/match/ScanSeek.h | 33 ++++ src/graph/planner/plan/PlanNode.cpp | 4 + src/graph/planner/plan/PlanNode.h | 2 + src/graph/planner/plan/Query.cpp | 64 ++++++- src/graph/planner/plan/Query.h | 118 +++++++++++++ .../validator/test/MatchValidatorTest.cpp | 8 +- .../visitor/ExtractFilterExprVisitor.cpp | 86 +++++++++- src/graph/visitor/ExtractFilterExprVisitor.h | 25 +++ src/interface/storage.thrift | 25 +-- src/storage/GraphStorageServiceHandler.cpp | 4 +- src/storage/GraphStorageServiceHandler.h | 5 +- src/storage/query/ScanEdgeProcessor.cpp | 7 +- src/storage/query/ScanEdgeProcessor.h | 5 +- src/storage/query/ScanVertexProcessor.cpp | 7 +- src/storage/query/ScanVertexProcessor.h | 6 +- src/storage/test/ScanEdgeTest.cpp | 67 ++++---- src/storage/test/ScanVertexTest.cpp | 24 ++- tests/tck/features/match/Base.IntVid.feature | 14 +- tests/tck/features/match/Base.feature | 14 +- tests/tck/features/match/Scan.feature | 157 ++++++++++++++++++ tests/tck/features/match/SeekByEdge.feature | 8 +- tests/tck/features/match/SeekById.feature | 16 +- .../features/match/SeekById.intVid.feature | 16 +- .../PushLimitDownScanEdgesRule.feature | 47 ++++++ .../PushLimitDownScanVerticesRule.feature | 45 +++++ 51 files changed, 1724 insertions(+), 132 deletions(-) create mode 100644 src/graph/executor/query/ScanEdgesExecutor.cpp create mode 100644 src/graph/executor/query/ScanEdgesExecutor.h create mode 100644 src/graph/executor/query/ScanVerticesExecutor.cpp create mode 100644 src/graph/executor/query/ScanVerticesExecutor.h create mode 100644 src/graph/optimizer/rule/GetEdgesTransformRule.cpp create mode 100644 src/graph/optimizer/rule/GetEdgesTransformRule.h create mode 100644 src/graph/optimizer/rule/PushFilterDownScanVerticesRule.cpp create mode 100644 src/graph/optimizer/rule/PushFilterDownScanVerticesRule.h create mode 100644 src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.cpp create mode 100644 src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.h create mode 100644 src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.cpp create mode 100644 src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.h create mode 100644 src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.cpp create mode 100644 src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.h create mode 100644 src/graph/planner/match/ScanSeek.cpp create mode 100644 src/graph/planner/match/ScanSeek.h create mode 100644 tests/tck/features/match/Scan.feature create mode 100644 tests/tck/features/optimizer/PushLimitDownScanEdgesRule.feature create mode 100644 tests/tck/features/optimizer/PushLimitDownScanVerticesRule.feature diff --git a/src/clients/storage/StorageClient.cpp b/src/clients/storage/StorageClient.cpp index 462dcefc367..5cc70ecde01 100644 --- a/src/clients/storage/StorageClient.cpp +++ b/src/clients/storage/StorageClient.cpp @@ -558,15 +558,15 @@ StorageRpcRespFuture StorageClient::lookupAndTravers }); } -StorageRpcRespFuture StorageClient::scanEdge( +StorageRpcRespFuture StorageClient::scanEdge( const CommonRequestParam& param, - const cpp2::EdgeProp& edgeProp, + const std::vector& edgeProp, int64_t limit, const Expression* filter) { std::unordered_map requests; auto status = getHostPartsWithCursor(param.space); if (!status.ok()) { - return folly::makeFuture>( + return folly::makeFuture>( std::runtime_error(status.status().toString())); } auto& clusters = status.value(); @@ -589,7 +589,7 @@ StorageRpcRespFuture StorageClient::scanEdge( const cpp2::ScanEdgeRequest& r) { return client->future_scanEdge(r); }); } -StorageRpcRespFuture StorageClient::scanVertex( +StorageRpcRespFuture StorageClient::scanVertex( const CommonRequestParam& param, const std::vector& vertexProp, int64_t limit, @@ -597,7 +597,7 @@ StorageRpcRespFuture StorageClient::scanVertex( std::unordered_map requests; auto status = getHostPartsWithCursor(param.space); if (!status.ok()) { - return folly::makeFuture>( + return folly::makeFuture>( std::runtime_error(status.status().toString())); } auto& clusters = status.value(); diff --git a/src/clients/storage/StorageClient.h b/src/clients/storage/StorageClient.h index 2261f548b53..49c333fe715 100644 --- a/src/clients/storage/StorageClient.h +++ b/src/clients/storage/StorageClient.h @@ -129,12 +129,12 @@ class StorageClient : public StorageClientBase lookupAndTraverse( const CommonRequestParam& param, cpp2::IndexSpec indexSpec, cpp2::TraverseSpec traverseSpec); - StorageRpcRespFuture scanEdge(const CommonRequestParam& param, - const cpp2::EdgeProp& vertexProp, - int64_t limit, - const Expression* filter); + StorageRpcRespFuture scanEdge(const CommonRequestParam& param, + const std::vector& vertexProp, + int64_t limit, + const Expression* filter); - StorageRpcRespFuture scanVertex( + StorageRpcRespFuture scanVertex( const CommonRequestParam& param, const std::vector& vertexProp, int64_t limit, diff --git a/src/common/meta/SchemaManager.cpp b/src/common/meta/SchemaManager.cpp index f50642b60cc..1252e418d51 100644 --- a/src/common/meta/SchemaManager.cpp +++ b/src/common/meta/SchemaManager.cpp @@ -23,5 +23,17 @@ StatusOr> SchemaManager::getSchemaIDByName(GraphSpaceID return Status::Error("Schema not exist: %s", schemaName.str().c_str()); } +StatusOr> SchemaManager::getAllTags(GraphSpaceID space) { + std::unordered_map tags; + auto tagSchemas = getAllLatestVerTagSchema(space); + NG_RETURN_IF_ERROR(tagSchemas); + for (auto& tagSchema : tagSchemas.value()) { + auto tagName = toTagName(space, tagSchema.first); + NG_RETURN_IF_ERROR(tagName); + tags.emplace(tagSchema.first, tagName.value()); + } + return tags; +} + } // namespace meta } // namespace nebula diff --git a/src/common/meta/SchemaManager.h b/src/common/meta/SchemaManager.h index ab7fe7fea3e..23fa8c68dec 100644 --- a/src/common/meta/SchemaManager.h +++ b/src/common/meta/SchemaManager.h @@ -68,6 +68,8 @@ class SchemaManager { virtual StatusOr> getAllEdge(GraphSpaceID space) = 0; + StatusOr> getAllTags(GraphSpaceID space); + // get all version of all tag schema virtual StatusOr getAllVerTagSchema(GraphSpaceID space) = 0; diff --git a/src/graph/context/ast/CypherAstContext.h b/src/graph/context/ast/CypherAstContext.h index f6d4e775a57..31b2bde72b1 100644 --- a/src/graph/context/ast/CypherAstContext.h +++ b/src/graph/context/ast/CypherAstContext.h @@ -63,6 +63,8 @@ struct ScanInfo { std::vector indexIds; // use for seek by edge only MatchEdge::Direction direction{MatchEdge::Direction::OUT_EDGE}; + // use for scan seek + bool anyLabel{false}; }; struct CypherClauseContextBase : AstContext { diff --git a/src/graph/executor/CMakeLists.txt b/src/graph/executor/CMakeLists.txt index 5bb8064ce3c..4be67ba0c25 100644 --- a/src/graph/executor/CMakeLists.txt +++ b/src/graph/executor/CMakeLists.txt @@ -34,6 +34,8 @@ nebula_add_library( query/InnerJoinExecutor.cpp query/IndexScanExecutor.cpp query/AssignExecutor.cpp + query/ScanVerticesExecutor.cpp + query/ScanEdgesExecutor.cpp query/TraverseExecutor.cpp query/AppendVerticesExecutor.cpp algo/ConjunctPathExecutor.cpp diff --git a/src/graph/executor/Executor.cpp b/src/graph/executor/Executor.cpp index 447e25acb31..78cbaf24573 100644 --- a/src/graph/executor/Executor.cpp +++ b/src/graph/executor/Executor.cpp @@ -81,6 +81,8 @@ #include "graph/executor/query/MinusExecutor.h" #include "graph/executor/query/ProjectExecutor.h" #include "graph/executor/query/SampleExecutor.h" +#include "graph/executor/query/ScanEdgesExecutor.h" +#include "graph/executor/query/ScanVerticesExecutor.h" #include "graph/executor/query/SortExecutor.h" #include "graph/executor/query/TopNExecutor.h" #include "graph/executor/query/TraverseExecutor.h" @@ -170,6 +172,12 @@ Executor *Executor::makeExecutor(QueryContext *qctx, const PlanNode *node) { case PlanNode::Kind::kGetVertices: { return pool->add(new GetVerticesExecutor(node, qctx)); } + case PlanNode::Kind::kScanEdges: { + return pool->add(new ScanEdgesExecutor(node, qctx)); + } + case PlanNode::Kind::kScanVertices: { + return pool->add(new ScanVerticesExecutor(node, qctx)); + } case PlanNode::Kind::kGetNeighbors: { return pool->add(new GetNeighborsExecutor(node, qctx)); } diff --git a/src/graph/executor/query/GetPropExecutor.h b/src/graph/executor/query/GetPropExecutor.h index 9db3be0d20c..313e3f2bef2 100644 --- a/src/graph/executor/query/GetPropExecutor.h +++ b/src/graph/executor/query/GetPropExecutor.h @@ -18,7 +18,8 @@ class GetPropExecutor : public StorageAccessExecutor { GetPropExecutor(const std::string &name, const PlanNode *node, QueryContext *qctx) : StorageAccessExecutor(name, node, qctx) {} - Status handleResp(storage::StorageRpcResponse &&rpcResp, + template + Status handleResp(storage::StorageRpcResponse &&rpcResp, const std::vector &colNames) { auto result = handleCompleteness(rpcResp, FLAGS_accept_partial_success); NG_RETURN_IF_ERROR(result); diff --git a/src/graph/executor/query/ScanEdgesExecutor.cpp b/src/graph/executor/query/ScanEdgesExecutor.cpp new file mode 100644 index 00000000000..fd70ad6e86b --- /dev/null +++ b/src/graph/executor/query/ScanEdgesExecutor.cpp @@ -0,0 +1,50 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/executor/query/ScanEdgesExecutor.h" + +#include "common/time/ScopedTimer.h" +#include "graph/context/QueryContext.h" +#include "graph/planner/plan/Query.h" +#include "graph/util/SchemaUtil.h" + +using nebula::storage::StorageClient; +using nebula::storage::StorageRpcResponse; +using nebula::storage::cpp2::ScanResponse; + +namespace nebula { +namespace graph { + +folly::Future ScanEdgesExecutor::execute() { return scanEdges(); } + +folly::Future ScanEdgesExecutor::scanEdges() { + SCOPED_TIMER(&execTime_); + StorageClient *client = qctx()->getStorageClient(); + auto *se = asNode(node()); + if (se->limit() < 0) { + return Status::Error("Scan edges must specify limit number."); + } + + time::Duration scanEdgesTime; + StorageClient::CommonRequestParam param(se->space(), + qctx()->rctx()->session()->id(), + qctx()->plan()->id(), + qctx()->plan()->isProfileEnabled()); + return DCHECK_NOTNULL(client) + ->scanEdge(param, *DCHECK_NOTNULL(se->props()), se->limit(), se->filter()) + .via(runner()) + .ensure([this, scanEdgesTime]() { + SCOPED_TIMER(&execTime_); + otherStats_.emplace("total_rpc", folly::sformat("{}(us)", scanEdgesTime.elapsedInUSec())); + }) + .thenValue([this, se](StorageRpcResponse &&rpcResp) { + SCOPED_TIMER(&execTime_); + addStats(rpcResp, otherStats_); + return handleResp(std::move(rpcResp), se->colNames()); + }); +} + +} // namespace graph +} // namespace nebula diff --git a/src/graph/executor/query/ScanEdgesExecutor.h b/src/graph/executor/query/ScanEdgesExecutor.h new file mode 100644 index 00000000000..c2385182e29 --- /dev/null +++ b/src/graph/executor/query/ScanEdgesExecutor.h @@ -0,0 +1,22 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/executor/query/GetPropExecutor.h" + +namespace nebula { +namespace graph { +class ScanEdgesExecutor final : public GetPropExecutor { + public: + ScanEdgesExecutor(const PlanNode *node, QueryContext *qctx) + : GetPropExecutor("ScanEdgesExecutor", node, qctx) {} + + folly::Future execute() override; + + private: + folly::Future scanEdges(); +}; + +} // namespace graph +} // namespace nebula diff --git a/src/graph/executor/query/ScanVerticesExecutor.cpp b/src/graph/executor/query/ScanVerticesExecutor.cpp new file mode 100644 index 00000000000..2ff896002b2 --- /dev/null +++ b/src/graph/executor/query/ScanVerticesExecutor.cpp @@ -0,0 +1,50 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/executor/query/ScanVerticesExecutor.h" + +#include "common/time/ScopedTimer.h" +#include "graph/context/QueryContext.h" +#include "graph/util/SchemaUtil.h" + +using nebula::storage::StorageClient; +using nebula::storage::StorageRpcResponse; +using nebula::storage::cpp2::ScanResponse; + +namespace nebula { +namespace graph { + +folly::Future ScanVerticesExecutor::execute() { return scanVertices(); } + +folly::Future ScanVerticesExecutor::scanVertices() { + SCOPED_TIMER(&execTime_); + + auto *sv = asNode(node()); + if (sv->limit() < 0) { + return Status::Error("Scan vertices must specify limit number."); + } + StorageClient *storageClient = qctx()->getStorageClient(); + + time::Duration scanVertexTime; + StorageClient::CommonRequestParam param(sv->space(), + qctx()->rctx()->session()->id(), + qctx()->plan()->id(), + qctx()->plan()->isProfileEnabled()); + return DCHECK_NOTNULL(storageClient) + ->scanVertex(param, *DCHECK_NOTNULL(sv->props()), sv->limit(), sv->filter()) + .via(runner()) + .ensure([this, scanVertexTime]() { + SCOPED_TIMER(&execTime_); + otherStats_.emplace("total_rpc", folly::sformat("{}(us)", scanVertexTime.elapsedInUSec())); + }) + .thenValue([this, sv](StorageRpcResponse &&rpcResp) { + SCOPED_TIMER(&execTime_); + addStats(rpcResp, otherStats_); + return handleResp(std::move(rpcResp), sv->colNames()); + }); +} + +} // namespace graph +} // namespace nebula diff --git a/src/graph/executor/query/ScanVerticesExecutor.h b/src/graph/executor/query/ScanVerticesExecutor.h new file mode 100644 index 00000000000..1b46cc84549 --- /dev/null +++ b/src/graph/executor/query/ScanVerticesExecutor.h @@ -0,0 +1,26 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include "graph/executor/query/GetPropExecutor.h" +#include "graph/planner/plan/Query.h" + +namespace nebula { +namespace graph { + +class ScanVerticesExecutor final : public GetPropExecutor { + public: + ScanVerticesExecutor(const PlanNode *node, QueryContext *qctx) + : GetPropExecutor("ScanVerticesExecutor", node, qctx) {} + + folly::Future execute() override; + + private: + folly::Future scanVertices(); +}; + +} // namespace graph +} // namespace nebula diff --git a/src/graph/optimizer/CMakeLists.txt b/src/graph/optimizer/CMakeLists.txt index 0329f9c60b7..d7326f5bb01 100644 --- a/src/graph/optimizer/CMakeLists.txt +++ b/src/graph/optimizer/CMakeLists.txt @@ -26,6 +26,8 @@ nebula_add_library( rule/PushFilterDownAggregateRule.cpp rule/PushFilterDownProjectRule.cpp rule/PushFilterDownLeftJoinRule.cpp + rule/PushFilterDownScanVerticesRule.cpp + rule/PushVFilterDownScanVerticesRule.cpp rule/OptimizeEdgeIndexScanByFilterRule.cpp rule/OptimizeTagIndexScanByFilterRule.cpp rule/UnionAllIndexScanBaseRule.cpp @@ -45,6 +47,9 @@ nebula_add_library( rule/PushLimitDownEdgeIndexPrefixScanRule.cpp rule/PushLimitDownEdgeIndexRangeScanRule.cpp rule/PushLimitDownProjectRule.cpp + rule/PushLimitDownScanAppendVerticesRule.cpp + rule/GetEdgesTransformRule.cpp + rule/PushLimitDownScanEdgesAppendVerticesRule.cpp ) nebula_add_subdirectory(test) diff --git a/src/graph/optimizer/rule/GetEdgesTransformRule.cpp b/src/graph/optimizer/rule/GetEdgesTransformRule.cpp new file mode 100644 index 00000000000..bfa8456c57a --- /dev/null +++ b/src/graph/optimizer/rule/GetEdgesTransformRule.cpp @@ -0,0 +1,129 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/optimizer/rule/GetEdgesTransformRule.h" + +#include "common/expression/Expression.h" +#include "graph/optimizer/OptContext.h" +#include "graph/optimizer/OptGroup.h" +#include "graph/planner/plan/PlanNode.h" +#include "graph/planner/plan/Query.h" +#include "graph/visitor/ExtractFilterExprVisitor.h" + +using nebula::Expression; +using nebula::graph::AppendVertices; +using nebula::graph::PlanNode; +using nebula::graph::Project; +using nebula::graph::QueryContext; +using nebula::graph::ScanEdges; +using nebula::graph::ScanVertices; +using nebula::graph::Traverse; + +namespace nebula { +namespace opt { + +std::unique_ptr GetEdgesTransformRule::kInstance = + std::unique_ptr(new GetEdgesTransformRule()); + +GetEdgesTransformRule::GetEdgesTransformRule() { RuleSet::QueryRules().addRule(this); } + +const Pattern &GetEdgesTransformRule::pattern() const { + static Pattern pattern = + Pattern::create(PlanNode::Kind::kAppendVertices, + {Pattern::create(PlanNode::Kind::kTraverse, + {Pattern::create(PlanNode::Kind::kScanVertices)})}); + return pattern; +} + +bool GetEdgesTransformRule::match(OptContext *ctx, const MatchedResult &matched) const { + if (!OptRule::match(ctx, matched)) { + return false; + } + auto traverse = static_cast(matched.planNode({0, 0})); + const auto &colNames = traverse->colNames(); + auto colSize = colNames.size(); + DCHECK_GE(colSize, 2); + if (colNames[colSize - 2][0] != '_') { // src + return false; + } + if (traverse->stepRange() != nullptr) { + return false; + } + return true; +} + +StatusOr GetEdgesTransformRule::transform( + OptContext *ctx, const MatchedResult &matched) const { + auto appendVerticesGroupNode = matched.node; + auto appendVertices = static_cast(appendVerticesGroupNode->node()); + auto traverseGroupNode = matched.dependencies.front().node; + auto traverse = static_cast(traverseGroupNode->node()); + auto scanVerticesGroupNode = matched.dependencies.front().dependencies.front().node; + auto qctx = ctx->qctx(); + + auto newAppendVertices = appendVertices->clone(); + auto colSize = appendVertices->colNames().size(); + newAppendVertices->setColNames( + {appendVertices->colNames()[colSize - 2], appendVertices->colNames()[colSize - 1]}); + auto newAppendVerticesGroupNode = + OptGroupNode::create(ctx, newAppendVertices, appendVerticesGroupNode->group()); + + auto *newScanEdges = traverseToScanEdges(traverse); + auto newScanEdgesGroup = OptGroup::create(ctx); + auto newScanEdgesGroupNode = newScanEdgesGroup->makeGroupNode(newScanEdges); + + auto *newProj = projectEdges(qctx, newScanEdges, traverse->colNames().back()); + newProj->setInputVar(newScanEdges->outputVar()); + newProj->setOutputVar(traverse->outputVar()); + newProj->setColNames({traverse->colNames().back()}); + auto newProjGroup = OptGroup::create(ctx); + auto newProjGroupNode = newProjGroup->makeGroupNode(newProj); + + newAppendVerticesGroupNode->dependsOn(newProjGroup); + newProjGroupNode->dependsOn(newScanEdgesGroup); + for (auto dep : scanVerticesGroupNode->dependencies()) { + newScanEdgesGroupNode->dependsOn(dep); + } + + TransformResult result; + result.eraseCurr = true; + result.newGroupNodes.emplace_back(newAppendVerticesGroupNode); + return result; +} + +std::string GetEdgesTransformRule::toString() const { return "GetEdgesTransformRule"; } + +/*static*/ graph::ScanEdges *GetEdgesTransformRule::traverseToScanEdges( + const graph::Traverse *traverse) { + const auto *edgeProps = traverse->edgeProps(); + auto scanEdges = ScanEdges::make( + traverse->qctx(), + nullptr, + traverse->space(), + edgeProps == nullptr ? nullptr + : std::make_unique>(*edgeProps), + nullptr, + traverse->dedup(), + traverse->limit(), + {}, + traverse->filter() == nullptr ? nullptr : traverse->filter()->clone()); + return scanEdges; +} + +/*static*/ graph::Project *GetEdgesTransformRule::projectEdges(graph::QueryContext *qctx, + PlanNode *input, + const std::string &colName) { + auto *yieldColumns = qctx->objPool()->makeAndAdd(); + auto *edgeExpr = EdgeExpression::make(qctx->objPool()); + auto *listEdgeExpr = ListExpression::make(qctx->objPool()); + listEdgeExpr->setItems({edgeExpr}); + yieldColumns->addColumn(new YieldColumn(listEdgeExpr, colName)); + auto project = Project::make(qctx, input, yieldColumns); + project->setColNames({colName}); + return project; +} + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/GetEdgesTransformRule.h b/src/graph/optimizer/rule/GetEdgesTransformRule.h new file mode 100644 index 00000000000..86492a44fa7 --- /dev/null +++ b/src/graph/optimizer/rule/GetEdgesTransformRule.h @@ -0,0 +1,45 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include "graph/optimizer/OptRule.h" + +namespace nebula { + +namespace graph { +class ScanEdges; +class Project; +class Traverse; +class PlanNode; +} // namespace graph + +namespace opt { + +// e.g. match ()-[e]->(?) return e +// Optimize to get edges directly +class GetEdgesTransformRule final : public OptRule { + public: + const Pattern &pattern() const override; + + bool match(OptContext *ctx, const MatchedResult &matched) const override; + StatusOr transform(OptContext *ctx, const MatchedResult &matched) const override; + + std::string toString() const override; + + private: + GetEdgesTransformRule(); + + static graph::ScanEdges *traverseToScanEdges(const graph::Traverse *traverse); + + static graph::Project *projectEdges(graph::QueryContext *qctx, + graph::PlanNode *input, + const std::string &colName); + + static std::unique_ptr kInstance; +}; + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushFilterDownScanVerticesRule.cpp b/src/graph/optimizer/rule/PushFilterDownScanVerticesRule.cpp new file mode 100644 index 00000000000..00ed8a00711 --- /dev/null +++ b/src/graph/optimizer/rule/PushFilterDownScanVerticesRule.cpp @@ -0,0 +1,99 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/optimizer/rule/PushFilterDownScanVerticesRule.h" + +#include "common/expression/Expression.h" +#include "common/expression/LogicalExpression.h" +#include "graph/optimizer/OptContext.h" +#include "graph/optimizer/OptGroup.h" +#include "graph/planner/plan/PlanNode.h" +#include "graph/planner/plan/Query.h" +#include "graph/visitor/ExtractFilterExprVisitor.h" + +using nebula::Expression; +using nebula::graph::Filter; +using nebula::graph::PlanNode; +using nebula::graph::QueryContext; +using nebula::graph::ScanVertices; + +namespace nebula { +namespace opt { + +std::unique_ptr PushFilterDownScanVerticesRule::kInstance = + std::unique_ptr(new PushFilterDownScanVerticesRule()); + +PushFilterDownScanVerticesRule::PushFilterDownScanVerticesRule() { + RuleSet::QueryRules().addRule(this); +} + +const Pattern &PushFilterDownScanVerticesRule::pattern() const { + static Pattern pattern = + Pattern::create(PlanNode::Kind::kFilter, {Pattern::create(PlanNode::Kind::kScanVertices)}); + return pattern; +} + +StatusOr PushFilterDownScanVerticesRule::transform( + OptContext *ctx, const MatchedResult &matched) const { + auto filterGroupNode = matched.node; + auto svGroupNode = matched.dependencies.front().node; + auto filter = static_cast(filterGroupNode->node()); + auto sv = static_cast(svGroupNode->node()); + auto qctx = ctx->qctx(); + auto pool = qctx->objPool(); + auto condition = filter->condition()->clone(); + + auto visitor = graph::ExtractFilterExprVisitor::makePushGetVertices(pool); + condition->accept(&visitor); + if (!visitor.ok()) { + return TransformResult::noTransform(); + } + + auto remainedExpr = std::move(visitor).remainedExpr(); + OptGroupNode *newFilterGroupNode = nullptr; + if (remainedExpr != nullptr) { + auto newFilter = Filter::make(qctx, nullptr, remainedExpr); + newFilter->setOutputVar(filter->outputVar()); + newFilter->setInputVar(filter->inputVar()); + newFilterGroupNode = OptGroupNode::create(ctx, newFilter, filterGroupNode->group()); + } + + auto newSVFilter = condition; + if (sv->filter() != nullptr) { + auto logicExpr = LogicalExpression::makeAnd(pool, condition, sv->filter()->clone()); + newSVFilter = logicExpr; + } + + auto newSV = static_cast(sv->clone()); + newSV->setFilter(newSVFilter); + + OptGroupNode *newSvGroupNode = nullptr; + if (newFilterGroupNode != nullptr) { + // Filter(A&&B)<-ScanVertices(C) => Filter(A)<-ScanVertices(B&&C) + auto newGroup = OptGroup::create(ctx); + newSvGroupNode = newGroup->makeGroupNode(newSV); + newFilterGroupNode->dependsOn(newGroup); + } else { + // Filter(A)<-ScanVertices(C) => ScanVertices(A&&C) + newSvGroupNode = OptGroupNode::create(ctx, newSV, filterGroupNode->group()); + newSV->setOutputVar(filter->outputVar()); + } + + for (auto dep : svGroupNode->dependencies()) { + newSvGroupNode->dependsOn(dep); + } + + TransformResult result; + result.eraseCurr = true; + result.newGroupNodes.emplace_back(newFilterGroupNode ? newFilterGroupNode : newSvGroupNode); + return result; +} + +std::string PushFilterDownScanVerticesRule::toString() const { + return "PushFilterDownScanVerticesRule"; +} + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushFilterDownScanVerticesRule.h b/src/graph/optimizer/rule/PushFilterDownScanVerticesRule.h new file mode 100644 index 00000000000..1f5cf14fc61 --- /dev/null +++ b/src/graph/optimizer/rule/PushFilterDownScanVerticesRule.h @@ -0,0 +1,30 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include + +#include "graph/optimizer/OptRule.h" + +namespace nebula { +namespace opt { + +class PushFilterDownScanVerticesRule final : public OptRule { + public: + const Pattern &pattern() const override; + + StatusOr transform(OptContext *ctx, const MatchedResult &matched) const override; + + std::string toString() const override; + + private: + PushFilterDownScanVerticesRule(); + + static std::unique_ptr kInstance; +}; + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.cpp b/src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.cpp new file mode 100644 index 00000000000..26c4d0d1440 --- /dev/null +++ b/src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.cpp @@ -0,0 +1,104 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.h" + +#include "graph/optimizer/OptContext.h" +#include "graph/optimizer/OptGroup.h" +#include "graph/planner/plan/PlanNode.h" +#include "graph/planner/plan/Query.h" + +using nebula::graph::AppendVertices; +using nebula::graph::Limit; +using nebula::graph::PlanNode; +using nebula::graph::QueryContext; +using nebula::graph::ScanVertices; + +namespace nebula { +namespace opt { + +// Limit->AppendVertices->ScanVertices ==> Limit->AppendVertices->ScanVertices(Limit) + +std::unique_ptr PushLimitDownScanAppendVerticesRule::kInstance = + std::unique_ptr(new PushLimitDownScanAppendVerticesRule()); + +PushLimitDownScanAppendVerticesRule::PushLimitDownScanAppendVerticesRule() { + RuleSet::QueryRules().addRule(this); +} + +const Pattern &PushLimitDownScanAppendVerticesRule::pattern() const { + static Pattern pattern = + Pattern::create(graph::PlanNode::Kind::kLimit, + {Pattern::create(graph::PlanNode::Kind::kAppendVertices, + {Pattern::create(graph::PlanNode::Kind::kScanVertices)})}); + return pattern; +} + +bool PushLimitDownScanAppendVerticesRule::match(OptContext *ctx, + const MatchedResult &matched) const { + if (!OptRule::match(ctx, matched)) { + return false; + } + auto av = static_cast(matched.planNode({0, 0})); + auto *src = av->src(); + if (src->kind() != Expression::Kind::kInputProperty && + src->kind() != Expression::Kind::kVarProperty) { + return false; + } + auto *propExpr = static_cast(src); + if (propExpr->prop() != kVid) { + return false; + } + auto *filter = av->filter(); + auto *vFilter = av->vFilter(); + // Limit can't push over filter operation + return filter == nullptr && vFilter == nullptr; +} + +StatusOr PushLimitDownScanAppendVerticesRule::transform( + OptContext *octx, const MatchedResult &matched) const { + auto limitGroupNode = matched.node; + auto appendVerticesGroupNode = matched.dependencies.front().node; + auto scanVerticesGroupNode = matched.dependencies.front().dependencies.front().node; + + const auto limit = static_cast(limitGroupNode->node()); + const auto appendVertices = static_cast(appendVerticesGroupNode->node()); + const auto scanVertices = static_cast(scanVerticesGroupNode->node()); + + int64_t limitRows = limit->offset() + limit->count(); + if (scanVertices->limit() >= 0 && limitRows >= scanVertices->limit()) { + return TransformResult::noTransform(); + } + + auto newLimit = static_cast(limit->clone()); + auto newLimitGroupNode = OptGroupNode::create(octx, newLimit, limitGroupNode->group()); + + auto newAppendVertices = static_cast(appendVertices->clone()); + auto newAppendVerticesGroup = OptGroup::create(octx); + auto newAppendVerticesGroupNode = newAppendVerticesGroup->makeGroupNode(newAppendVertices); + + auto newScanVertices = static_cast(scanVertices->clone()); + newScanVertices->setLimit(limitRows); + auto newScanVerticesGroup = OptGroup::create(octx); + auto newScanVerticesGroupNode = newScanVerticesGroup->makeGroupNode(newScanVertices); + + newLimitGroupNode->dependsOn(newAppendVerticesGroup); + newAppendVerticesGroupNode->dependsOn(newScanVerticesGroup); + for (auto dep : scanVerticesGroupNode->dependencies()) { + newScanVerticesGroupNode->dependsOn(dep); + } + + TransformResult result; + result.eraseAll = true; + result.newGroupNodes.emplace_back(newLimitGroupNode); + return result; +} + +std::string PushLimitDownScanAppendVerticesRule::toString() const { + return "PushLimitDownScanAppendVerticesRule"; +} + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.h b/src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.h new file mode 100644 index 00000000000..6652da49d5e --- /dev/null +++ b/src/graph/optimizer/rule/PushLimitDownScanAppendVerticesRule.h @@ -0,0 +1,30 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include "graph/optimizer/OptRule.h" + +namespace nebula { +namespace opt { + +class PushLimitDownScanAppendVerticesRule final : public OptRule { + public: + const Pattern &pattern() const override; + + bool match(OptContext *ctx, const MatchedResult &matched) const override; + StatusOr transform(OptContext *ctx, + const MatchedResult &matched) const override; + + std::string toString() const override; + + private: + PushLimitDownScanAppendVerticesRule(); + + static std::unique_ptr kInstance; +}; + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.cpp b/src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.cpp new file mode 100644 index 00000000000..4f249ab001d --- /dev/null +++ b/src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.cpp @@ -0,0 +1,113 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.h" + +#include "graph/optimizer/OptContext.h" +#include "graph/optimizer/OptGroup.h" +#include "graph/planner/plan/PlanNode.h" +#include "graph/planner/plan/Query.h" +#include "graph/util/ExpressionUtils.h" + +using nebula::graph::AppendVertices; +using nebula::graph::Limit; +using nebula::graph::PlanNode; +using nebula::graph::Project; +using nebula::graph::QueryContext; +using nebula::graph::ScanEdges; + +namespace nebula { +namespace opt { + +// Limit->AppendVertices->Project->ScanEdges ==> Limit->AppendVertices->Project->ScanEdges(Limit) + +std::unique_ptr PushLimitDownScanEdgesAppendVerticesRule::kInstance = + std::unique_ptr( + new PushLimitDownScanEdgesAppendVerticesRule()); + +PushLimitDownScanEdgesAppendVerticesRule::PushLimitDownScanEdgesAppendVerticesRule() { + RuleSet::QueryRules().addRule(this); +} + +const Pattern &PushLimitDownScanEdgesAppendVerticesRule::pattern() const { + static Pattern pattern = Pattern::create( + graph::PlanNode::Kind::kLimit, + {Pattern::create(graph::PlanNode::Kind::kAppendVertices, + {Pattern::create(graph::PlanNode::Kind::kProject, + {Pattern::create(graph::PlanNode::Kind::kScanEdges)})})}); + return pattern; +} + +bool PushLimitDownScanEdgesAppendVerticesRule::match(OptContext *ctx, + const MatchedResult &matched) const { + if (!OptRule::match(ctx, matched)) { + return false; + } + auto av = static_cast(matched.planNode({0, 0})); + auto *src = av->src(); + auto *inputExpr = graph::ExpressionUtils::findAny( + src, {Expression::Kind::kInputProperty, Expression::Kind::kVarProperty}); + if (inputExpr == nullptr) { + return false; + } + auto *filter = av->filter(); + auto *vFilter = av->vFilter(); + // Limit can't push over filter operation + return filter == nullptr && vFilter == nullptr; +} + +StatusOr PushLimitDownScanEdgesAppendVerticesRule::transform( + OptContext *octx, const MatchedResult &matched) const { + auto limitGroupNode = matched.node; + auto appendVerticesGroupNode = matched.dependencies.front().node; + auto projGroupNode = matched.dependencies.front().dependencies.front().node; + auto scanEdgesGroupNode = + matched.dependencies.front().dependencies.front().dependencies.front().node; + + const auto limit = static_cast(limitGroupNode->node()); + const auto appendVertices = static_cast(appendVerticesGroupNode->node()); + const auto proj = static_cast(projGroupNode->node()); + const auto scanEdges = static_cast(scanEdgesGroupNode->node()); + + int64_t limitRows = limit->offset() + limit->count(); + if (scanEdges->limit() >= 0 && limitRows >= scanEdges->limit()) { + return TransformResult::noTransform(); + } + + auto newLimit = static_cast(limit->clone()); + auto newLimitGroupNode = OptGroupNode::create(octx, newLimit, limitGroupNode->group()); + + auto newAppendVertices = static_cast(appendVertices->clone()); + auto newAppendVerticesGroup = OptGroup::create(octx); + auto newAppendVerticesGroupNode = newAppendVerticesGroup->makeGroupNode(newAppendVertices); + + auto newProj = static_cast(proj->clone()); + auto newProjGroup = OptGroup::create(octx); + auto newProjGroupNode = newProjGroup->makeGroupNode(newProj); + + auto newScanEdges = static_cast(scanEdges->clone()); + newScanEdges->setLimit(limitRows); + auto newScanEdgesGroup = OptGroup::create(octx); + auto newScanEdgesGroupNode = newScanEdgesGroup->makeGroupNode(newScanEdges); + + newLimitGroupNode->dependsOn(newAppendVerticesGroup); + newAppendVerticesGroupNode->dependsOn(newProjGroup); + newProjGroupNode->dependsOn(newScanEdgesGroup); + for (auto dep : scanEdgesGroupNode->dependencies()) { + newScanEdgesGroupNode->dependsOn(dep); + } + + TransformResult result; + result.eraseAll = true; + result.newGroupNodes.emplace_back(newLimitGroupNode); + return result; +} + +std::string PushLimitDownScanEdgesAppendVerticesRule::toString() const { + return "PushLimitDownScanEdgesAppendVerticesRule"; +} + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.h b/src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.h new file mode 100644 index 00000000000..38c079bc660 --- /dev/null +++ b/src/graph/optimizer/rule/PushLimitDownScanEdgesAppendVerticesRule.h @@ -0,0 +1,30 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include "graph/optimizer/OptRule.h" + +namespace nebula { +namespace opt { + +class PushLimitDownScanEdgesAppendVerticesRule final : public OptRule { + public: + const Pattern &pattern() const override; + + bool match(OptContext *ctx, const MatchedResult &matched) const override; + StatusOr transform(OptContext *ctx, + const MatchedResult &matched) const override; + + std::string toString() const override; + + private: + PushLimitDownScanEdgesAppendVerticesRule(); + + static std::unique_ptr kInstance; +}; + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.cpp b/src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.cpp new file mode 100644 index 00000000000..c335bc38238 --- /dev/null +++ b/src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.cpp @@ -0,0 +1,126 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/optimizer/rule/PushVFilterDownScanVerticesRule.h" + +#include "common/expression/Expression.h" +#include "common/expression/LogicalExpression.h" +#include "common/expression/PropertyExpression.h" +#include "common/expression/UnaryExpression.h" +#include "graph/optimizer/OptContext.h" +#include "graph/optimizer/OptGroup.h" +#include "graph/planner/plan/PlanNode.h" +#include "graph/planner/plan/Query.h" +#include "graph/util/ExpressionUtils.h" +#include "graph/visitor/ExtractFilterExprVisitor.h" + +using nebula::Expression; +using nebula::graph::AppendVertices; +using nebula::graph::PlanNode; +using nebula::graph::QueryContext; +using nebula::graph::ScanVertices; + +namespace nebula { +namespace opt { + +std::unique_ptr PushVFilterDownScanVerticesRule::kInstance = + std::unique_ptr(new PushVFilterDownScanVerticesRule()); + +PushVFilterDownScanVerticesRule::PushVFilterDownScanVerticesRule() { + RuleSet::QueryRules().addRule(this); +} + +const Pattern &PushVFilterDownScanVerticesRule::pattern() const { + static Pattern pattern = Pattern::create(PlanNode::Kind::kAppendVertices, + {Pattern::create(PlanNode::Kind::kScanVertices)}); + return pattern; +} + +// AppendVertices is the leaf node to fetch data from storage, so Filter can't push over it +// normally. +// But in this case, if AppendVertices get vId from ScanVertices, it can be pushed down. +bool PushVFilterDownScanVerticesRule::match(OptContext *ctx, const MatchedResult &matched) const { + if (!OptRule::match(ctx, matched)) { + return false; + } + auto appendVerticesGroupNode = matched.node; + auto appendVertices = static_cast(appendVerticesGroupNode->node()); + auto *src = appendVertices->src(); + if (src->kind() != Expression::Kind::kInputProperty && + src->kind() != Expression::Kind::kVarProperty) { + return false; + } + auto *propExpr = static_cast(src); + if (propExpr->prop() != kVid) { + return false; + } + if (appendVertices->vFilter() == nullptr) { + return false; + } + auto tagPropExprs = graph::ExpressionUtils::collectAll(appendVertices->vFilter(), + {Expression::Kind::kTagProperty}); + for (const auto &tagPropExpr : tagPropExprs) { + auto tagProp = static_cast(tagPropExpr); + if (tagProp->sym() == "*") { + return false; + } + } + return true; +} + +StatusOr PushVFilterDownScanVerticesRule::transform( + OptContext *ctx, const MatchedResult &matched) const { + auto appendVerticesGroupNode = matched.node; + auto svGroupNode = matched.dependencies.front().node; + auto appendVertices = static_cast(appendVerticesGroupNode->node()); + auto sv = static_cast(svGroupNode->node()); + auto qctx = ctx->qctx(); + auto pool = qctx->objPool(); + auto condition = appendVertices->vFilter()->clone(); + + auto visitor = graph::ExtractFilterExprVisitor::makePushGetVertices(pool); + condition->accept(&visitor); + if (!visitor.ok()) { + return TransformResult::noTransform(); + } + + auto remainedExpr = std::move(visitor).remainedExpr(); + OptGroupNode *newAppendVerticesGroupNode = nullptr; + auto newAppendVertices = appendVertices->clone(); + newAppendVertices->setVertexFilter(remainedExpr); + newAppendVertices->setOutputVar(appendVertices->outputVar()); + newAppendVertices->setInputVar(appendVertices->inputVar()); + newAppendVerticesGroupNode = + OptGroupNode::create(ctx, newAppendVertices, appendVerticesGroupNode->group()); + + auto newSVFilter = condition; + if (sv->filter() != nullptr) { + auto logicExpr = LogicalExpression::makeAnd(pool, condition, sv->filter()->clone()); + newSVFilter = logicExpr; + } + + auto newSV = static_cast(sv->clone()); + newSV->setFilter(newSVFilter); + + auto newGroup = OptGroup::create(ctx); + auto newSvGroupNode = newGroup->makeGroupNode(newSV); + newAppendVerticesGroupNode->dependsOn(newGroup); + + for (auto dep : svGroupNode->dependencies()) { + newSvGroupNode->dependsOn(dep); + } + + TransformResult result; + result.eraseCurr = true; + result.newGroupNodes.emplace_back(newAppendVerticesGroupNode); + return result; +} + +std::string PushVFilterDownScanVerticesRule::toString() const { + return "PushVFilterDownScanVerticesRule"; +} + +} // namespace opt +} // namespace nebula diff --git a/src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.h b/src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.h new file mode 100644 index 00000000000..098bf752636 --- /dev/null +++ b/src/graph/optimizer/rule/PushVFilterDownScanVerticesRule.h @@ -0,0 +1,31 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include + +#include "graph/optimizer/OptRule.h" + +namespace nebula { +namespace opt { + +class PushVFilterDownScanVerticesRule final : public OptRule { + public: + const Pattern &pattern() const override; + + bool match(OptContext *ctx, const MatchedResult &matched) const override; + StatusOr transform(OptContext *ctx, const MatchedResult &matched) const override; + + std::string toString() const override; + + private: + PushVFilterDownScanVerticesRule(); + + static std::unique_ptr kInstance; +}; + +} // namespace opt +} // namespace nebula diff --git a/src/graph/planner/CMakeLists.txt b/src/graph/planner/CMakeLists.txt index c3d487105ed..bbd2aeda4e0 100644 --- a/src/graph/planner/CMakeLists.txt +++ b/src/graph/planner/CMakeLists.txt @@ -26,6 +26,7 @@ nebula_add_library( match/PropIndexSeek.cpp match/VertexIdSeek.cpp match/LabelIndexSeek.cpp + match/ScanSeek.cpp ngql/PathPlanner.cpp ngql/GoPlanner.cpp ngql/SubgraphPlanner.cpp diff --git a/src/graph/planner/PlannersRegister.cpp b/src/graph/planner/PlannersRegister.cpp index e682ad243b8..f7067b5c7ac 100644 --- a/src/graph/planner/PlannersRegister.cpp +++ b/src/graph/planner/PlannersRegister.cpp @@ -10,6 +10,7 @@ #include "graph/planner/match/LabelIndexSeek.h" #include "graph/planner/match/MatchPlanner.h" #include "graph/planner/match/PropIndexSeek.h" +#include "graph/planner/match/ScanSeek.h" #include "graph/planner/match/StartVidFinder.h" #include "graph/planner/match/VertexIdSeek.h" #include "graph/planner/ngql/FetchEdgesPlanner.h" @@ -97,6 +98,11 @@ void PlannersRegister::registerMatch() { // MATCH(n: tag) RETURN n // MATCH(s)-[:edge]->(e) RETURN e startVidFinders.emplace_back(&LabelIndexSeek::make); + + // Scan the start vertex directly + // Now we hard code the order of match rules before CBO, + // put scan rule at the last for we assume it's most inefficient + startVidFinders.emplace_back(&ScanSeek::make); } } // namespace graph diff --git a/src/graph/planner/match/ScanSeek.cpp b/src/graph/planner/match/ScanSeek.cpp new file mode 100644 index 00000000000..b4874039c27 --- /dev/null +++ b/src/graph/planner/match/ScanSeek.cpp @@ -0,0 +1,103 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#include "graph/planner/match/ScanSeek.h" + +#include + +#include "graph/planner/match/MatchSolver.h" +#include "graph/planner/plan/Query.h" +#include "graph/util/ExpressionUtils.h" +#include "graph/util/SchemaUtil.h" + +namespace nebula { +namespace graph { + +bool ScanSeek::matchEdge(EdgeContext *edgeCtx) { + UNUSED(edgeCtx); + return false; +} + +StatusOr ScanSeek::transformEdge(EdgeContext *edgeCtx) { + UNUSED(edgeCtx); + return Status::Error("Unimplemented for edge pattern."); +} + +bool ScanSeek::matchNode(NodeContext *nodeCtx) { + auto &node = *nodeCtx->info; + // only require the tag + if (node.tids.size() == 0) { + // empty labels means all labels + const auto *qctx = nodeCtx->matchClauseCtx->qctx; + auto allLabels = qctx->schemaMng()->getAllTags(nodeCtx->matchClauseCtx->space.id); + if (!allLabels.ok()) { + return false; + } + for (const auto &label : allLabels.value()) { + nodeCtx->scanInfo.schemaIds.emplace_back(label.first); + nodeCtx->scanInfo.schemaNames.emplace_back(label.second); + } + nodeCtx->scanInfo.anyLabel = true; + } else { + for (std::size_t i = 0; i < node.tids.size(); i++) { + auto tagId = node.tids[i]; + auto tagName = node.labels[i]; + nodeCtx->scanInfo.schemaIds.emplace_back(tagId); + nodeCtx->scanInfo.schemaNames.emplace_back(tagName); + } + } + return true; +} + +StatusOr ScanSeek::transformNode(NodeContext *nodeCtx) { + SubPlan plan; + auto *matchClauseCtx = nodeCtx->matchClauseCtx; + auto *qctx = matchClauseCtx->qctx; + auto *pool = qctx->objPool(); + auto anyLabel = nodeCtx->scanInfo.anyLabel; + + auto vProps = std::make_unique>(); + std::vector colNames{kVid}; + for (std::size_t i = 0; i < nodeCtx->scanInfo.schemaIds.size(); ++i) { + storage::cpp2::VertexProp vProp; + std::vector props{kTag}; + vProp.set_tag(nodeCtx->scanInfo.schemaIds[i]); + vProp.set_props(std::move(props)); + vProps->emplace_back(std::move(vProp)); + colNames.emplace_back(nodeCtx->scanInfo.schemaNames[i] + "." + kTag); + } + + auto *scanVertices = + ScanVertices::make(qctx, nullptr, matchClauseCtx->space.id, std::move(vProps)); + scanVertices->setColNames(std::move(colNames)); + plan.root = scanVertices; + plan.tail = scanVertices; + + // Filter vertices lack labels + Expression *prev = nullptr; + for (const auto &tag : nodeCtx->scanInfo.schemaNames) { + auto *tagPropExpr = TagPropertyExpression::make(pool, tag, kTag); + auto *notEmpty = UnaryExpression::makeIsNotEmpty(pool, tagPropExpr); + if (prev != nullptr) { + if (anyLabel) { + auto *orExpr = LogicalExpression::makeOr(pool, prev, notEmpty); + prev = orExpr; + } else { + auto *andExpr = LogicalExpression::makeAnd(pool, prev, notEmpty); + prev = andExpr; + } + } else { + prev = notEmpty; + } + } + auto *filter = Filter::make(qctx, scanVertices, prev); + plan.root = filter; + + nodeCtx->initialExpr = InputPropertyExpression::make(pool, kVid); + return plan; +} + +} // namespace graph +} // namespace nebula diff --git a/src/graph/planner/match/ScanSeek.h b/src/graph/planner/match/ScanSeek.h new file mode 100644 index 00000000000..a323723e751 --- /dev/null +++ b/src/graph/planner/match/ScanSeek.h @@ -0,0 +1,33 @@ +/* Copyright (c) 2021 vesoft inc. All rights reserved. + * + * This source code is licensed under Apache 2.0 License. + */ + +#pragma once + +#include "graph/context/ast/CypherAstContext.h" +#include "graph/planner/match/StartVidFinder.h" + +namespace nebula { +namespace graph { +/* + * The ScanSeek was designed to find if could get the starting vids in + * filter. + */ +class ScanSeek final : public StartVidFinder { + public: + static std::unique_ptr make() { return std::unique_ptr(new ScanSeek()); } + + bool matchNode(NodeContext* nodeCtx) override; + + bool matchEdge(EdgeContext* edgeCtx) override; + + StatusOr transformNode(NodeContext* nodeCtx) override; + + StatusOr transformEdge(EdgeContext* edgeCtx) override; + + private: + ScanSeek() = default; +}; +} // namespace graph +} // namespace nebula diff --git a/src/graph/planner/plan/PlanNode.cpp b/src/graph/planner/plan/PlanNode.cpp index b1a43a2836c..a1629320279 100644 --- a/src/graph/planner/plan/PlanNode.cpp +++ b/src/graph/planner/plan/PlanNode.cpp @@ -55,6 +55,10 @@ const char* PlanNode::toString(PlanNode::Kind kind) { return "EdgeIndexRangeScan"; case Kind::kEdgeIndexPrefixScan: return "EdgeIndexPrefixScan"; + case Kind::kScanVertices: + return "ScanVertices"; + case Kind::kScanEdges: + return "ScanEdges"; case Kind::kFilter: return "Filter"; case Kind::kUnion: diff --git a/src/graph/planner/plan/PlanNode.h b/src/graph/planner/plan/PlanNode.h index 053272ce01b..bac87810a32 100644 --- a/src/graph/planner/plan/PlanNode.h +++ b/src/graph/planner/plan/PlanNode.h @@ -39,6 +39,8 @@ class PlanNode { kEdgeIndexFullScan, kEdgeIndexPrefixScan, kEdgeIndexRangeScan, + kScanVertices, + kScanEdges, // ------------------ kFilter, kUnion, diff --git a/src/graph/planner/plan/Query.cpp b/src/graph/planner/plan/Query.cpp index b45c4bb88a6..48b5c05a356 100644 --- a/src/graph/planner/plan/Query.cpp +++ b/src/graph/planner/plan/Query.cpp @@ -194,6 +194,64 @@ void IndexScan::cloneMembers(const IndexScan& g) { isEmptyResultSet_ = g.isEmptyResultSet(); } +std::unique_ptr ScanVertices::explain() const { + auto desc = Explore::explain(); + addDescription("props", props_ ? folly::toJson(util::toJson(*props_)) : "", desc.get()); + addDescription("exprs", exprs_ ? folly::toJson(util::toJson(*exprs_)) : "", desc.get()); + return desc; +} + +PlanNode* ScanVertices::clone() const { + auto* newGV = ScanVertices::make(qctx_, nullptr, space_); + newGV->cloneMembers(*this); + return newGV; +} + +void ScanVertices::cloneMembers(const ScanVertices& gv) { + Explore::cloneMembers(gv); + + if (gv.props_) { + auto vertexProps = *gv.props_; + auto vertexPropsPtr = std::make_unique(std::move(vertexProps)); + setVertexProps(std::move(vertexPropsPtr)); + } + + if (gv.exprs_) { + auto exprs = *gv.exprs_; + auto exprsPtr = std::make_unique(std::move(exprs)); + setExprs(std::move(exprsPtr)); + } +} + +std::unique_ptr ScanEdges::explain() const { + auto desc = Explore::explain(); + addDescription("props", props_ ? folly::toJson(util::toJson(*props_)) : "", desc.get()); + addDescription("exprs", exprs_ ? folly::toJson(util::toJson(*exprs_)) : "", desc.get()); + return desc; +} + +PlanNode* ScanEdges::clone() const { + auto* newGE = ScanEdges::make(qctx_, nullptr, space_); + newGE->cloneMembers(*this); + return newGE; +} + +void ScanEdges::cloneMembers(const ScanEdges& ge) { + Explore::cloneMembers(ge); + + if (ge.props_) { + auto edgeProps = *ge.props_; + auto edgePropsPtr = std::make_unique(std::move(edgeProps)); + setEdgeProps(std::move(edgePropsPtr)); + } + + if (ge.exprs_) { + auto exprs = *ge.exprs_; + auto exprsPtr = std::make_unique(std::move(exprs)); + setExprs(std::move(exprsPtr)); + } +} + Filter::Filter(QueryContext* qctx, PlanNode* input, Expression* condition, bool needStableFilter) : SingleInputNode(qctx, Kind::kFilter, input) { condition_ = condition; @@ -664,7 +722,11 @@ AppendVertices* AppendVertices::clone() const { void AppendVertices::cloneMembers(const AppendVertices& a) { GetVertices::cloneMembers(a); - setVertexFilter(a.vFilter_->clone()); + if (a.vFilter_ != nullptr) { + setVertexFilter(a.vFilter_->clone()); + } else { + setVertexFilter(nullptr); + } } std::unique_ptr AppendVertices::explain() const { diff --git a/src/graph/planner/plan/Query.h b/src/graph/planner/plan/Query.h index 076b7471b53..d4e20562216 100644 --- a/src/graph/planner/plan/Query.h +++ b/src/graph/planner/plan/Query.h @@ -464,6 +464,124 @@ class IndexScan : public Explore { bool isEmptyResultSet_{false}; }; +/** + * Scan vertices + */ +class ScanVertices final : public Explore { + public: + static ScanVertices* make(QueryContext* qctx, + PlanNode* input, + GraphSpaceID space, + std::unique_ptr>&& props = nullptr, + std::unique_ptr>&& exprs = nullptr, + bool dedup = false, + std::vector orderBy = {}, + int64_t limit = -1, + Expression* filter = nullptr) { + return qctx->objPool()->add(new ScanVertices(qctx, + input, + space, + std::move(props), + std::move(exprs), + dedup, + std::move(orderBy), + limit, + filter)); + } + + const std::vector* props() const { return props_.get(); } + + const std::vector* exprs() const { return exprs_.get(); } + + void setVertexProps(std::unique_ptr> props) { props_ = std::move(props); } + + void setExprs(std::unique_ptr> exprs) { exprs_ = std::move(exprs); } + + PlanNode* clone() const override; + std::unique_ptr explain() const override; + + private: + ScanVertices(QueryContext* qctx, + PlanNode* input, + GraphSpaceID space, + std::unique_ptr>&& props, + std::unique_ptr>&& exprs, + bool dedup, + std::vector orderBy, + int64_t limit, + Expression* filter) + : Explore(qctx, Kind::kScanVertices, input, space, dedup, limit, filter, std::move(orderBy)), + props_(std::move(props)), + exprs_(std::move(exprs)) {} + + void cloneMembers(const ScanVertices&); + + private: + // props of the vertex + std::unique_ptr> props_; + // expression to get + std::unique_ptr> exprs_; +}; + +/** + * Scan edges + */ +class ScanEdges final : public Explore { + public: + static ScanEdges* make(QueryContext* qctx, + PlanNode* input, + GraphSpaceID space, + std::unique_ptr>&& props = nullptr, + std::unique_ptr>&& exprs = nullptr, + bool dedup = false, + int64_t limit = -1, + std::vector orderBy = {}, + Expression* filter = nullptr) { + return qctx->objPool()->add(new ScanEdges(qctx, + input, + space, + std::move(props), + std::move(exprs), + dedup, + limit, + std::move(orderBy), + filter)); + } + + const std::vector* props() const { return props_.get(); } + + const std::vector* exprs() const { return exprs_.get(); } + + void setEdgeProps(std::unique_ptr> props) { props_ = std::move(props); } + + void setExprs(std::unique_ptr> exprs) { exprs_ = std::move(exprs); } + + PlanNode* clone() const override; + std::unique_ptr explain() const override; + + private: + ScanEdges(QueryContext* qctx, + PlanNode* input, + GraphSpaceID space, + std::unique_ptr>&& props, + std::unique_ptr>&& exprs, + bool dedup, + int64_t limit, + std::vector orderBy, + Expression* filter) + : Explore(qctx, Kind::kScanEdges, input, space, dedup, limit, filter, std::move(orderBy)), + props_(std::move(props)), + exprs_(std::move(exprs)) {} + + void cloneMembers(const ScanEdges&); + + private: + // props of edge to get + std::unique_ptr> props_; + // expression to show + std::unique_ptr> exprs_; +}; + /** * A Filter node helps filt some records with condition. */ diff --git a/src/graph/validator/test/MatchValidatorTest.cpp b/src/graph/validator/test/MatchValidatorTest.cpp index 481b09fc7fc..715f206f6d6 100644 --- a/src/graph/validator/test/MatchValidatorTest.cpp +++ b/src/graph/validator/test/MatchValidatorTest.cpp @@ -46,7 +46,13 @@ TEST_F(MatchValidatorTest, SeekByTagIndex) { // non index { std::string query = "MATCH (v:room) RETURN id(v) AS id;"; - EXPECT_FALSE(validate(query)); + std::vector expected = {PlanNode::Kind::kProject, + PlanNode::Kind::kProject, + PlanNode::Kind::kAppendVertices, + PlanNode::Kind::kFilter, + PlanNode::Kind::kScanVertices, + PlanNode::Kind::kStart}; + EXPECT_TRUE(checkResult(query, expected)); } } diff --git a/src/graph/visitor/ExtractFilterExprVisitor.cpp b/src/graph/visitor/ExtractFilterExprVisitor.cpp index f412b1a50bb..ce97ddd8cba 100644 --- a/src/graph/visitor/ExtractFilterExprVisitor.cpp +++ b/src/graph/visitor/ExtractFilterExprVisitor.cpp @@ -20,9 +20,31 @@ void ExtractFilterExprVisitor::visit(VariableExpression *expr) { void ExtractFilterExprVisitor::visit(VersionedVariableExpression *) { canBePushed_ = false; } -void ExtractFilterExprVisitor::visit(TagPropertyExpression *) { canBePushed_ = false; } +void ExtractFilterExprVisitor::visit(TagPropertyExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + canBePushed_ = false; + break; + case PushType::kGetVertices: + canBePushed_ = true; + break; + case PushType::kGetEdges: + canBePushed_ = false; + break; + } +} -void ExtractFilterExprVisitor::visit(EdgePropertyExpression *) { canBePushed_ = true; } +void ExtractFilterExprVisitor::visit(EdgePropertyExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + case PushType::kGetEdges: + canBePushed_ = true; + break; + case PushType::kGetVertices: + canBePushed_ = false; + break; + } +} void ExtractFilterExprVisitor::visit(InputPropertyExpression *) { canBePushed_ = false; } @@ -30,15 +52,65 @@ void ExtractFilterExprVisitor::visit(VariablePropertyExpression *) { canBePushed void ExtractFilterExprVisitor::visit(DestPropertyExpression *) { canBePushed_ = false; } -void ExtractFilterExprVisitor::visit(SourcePropertyExpression *) { canBePushed_ = true; } +void ExtractFilterExprVisitor::visit(SourcePropertyExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + canBePushed_ = true; + break; + case PushType::kGetVertices: + case PushType::kGetEdges: + canBePushed_ = false; + break; + } +} -void ExtractFilterExprVisitor::visit(EdgeSrcIdExpression *) { canBePushed_ = true; } +void ExtractFilterExprVisitor::visit(EdgeSrcIdExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + case PushType::kGetEdges: + canBePushed_ = true; + break; + case PushType::kGetVertices: + canBePushed_ = false; + break; + } +} -void ExtractFilterExprVisitor::visit(EdgeTypeExpression *) { canBePushed_ = true; } +void ExtractFilterExprVisitor::visit(EdgeTypeExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + case PushType::kGetEdges: + canBePushed_ = true; + break; + case PushType::kGetVertices: + canBePushed_ = false; + break; + } +} -void ExtractFilterExprVisitor::visit(EdgeRankExpression *) { canBePushed_ = true; } +void ExtractFilterExprVisitor::visit(EdgeRankExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + case PushType::kGetEdges: + canBePushed_ = true; + break; + case PushType::kGetVertices: + canBePushed_ = false; + break; + } +} -void ExtractFilterExprVisitor::visit(EdgeDstIdExpression *) { canBePushed_ = true; } +void ExtractFilterExprVisitor::visit(EdgeDstIdExpression *) { + switch (pushType_) { + case PushType::kGetNeighbors: + case PushType::kGetEdges: + canBePushed_ = true; + break; + case PushType::kGetVertices: + canBePushed_ = false; + break; + } +} void ExtractFilterExprVisitor::visit(VertexExpression *) { canBePushed_ = false; } diff --git a/src/graph/visitor/ExtractFilterExprVisitor.h b/src/graph/visitor/ExtractFilterExprVisitor.h index 33dfe8a7221..33db050234b 100644 --- a/src/graph/visitor/ExtractFilterExprVisitor.h +++ b/src/graph/visitor/ExtractFilterExprVisitor.h @@ -20,6 +20,24 @@ class ExtractFilterExprVisitor final : public ExprVisitorImpl { Expression *remainedExpr() { return remainedExpr_; } + static ExtractFilterExprVisitor makePushGetNeighbors(ObjectPool *pool) { + ExtractFilterExprVisitor visitor(pool); + visitor.pushType_ = PushType::kGetNeighbors; + return visitor; + } + + static ExtractFilterExprVisitor makePushGetVertices(ObjectPool *pool) { + ExtractFilterExprVisitor visitor(pool); + visitor.pushType_ = PushType::kGetVertices; + return visitor; + } + + static ExtractFilterExprVisitor makePushGetEdges(ObjectPool *pool) { + ExtractFilterExprVisitor visitor(pool); + visitor.pushType_ = PushType::kGetEdges; + return visitor; + } + private: using ExprVisitorImpl::visit; @@ -45,9 +63,16 @@ class ExtractFilterExprVisitor final : public ExprVisitorImpl { void visit(SubscriptRangeExpression *) override; private: + enum class PushType { + kGetNeighbors, + kGetVertices, // Get/Append/Scan Vertices + kGetEdges, // Get/Append/Scan Edges + }; + ObjectPool *pool_; bool canBePushed_{true}; Expression *remainedExpr_{nullptr}; + PushType pushType_{PushType::kGetNeighbors}; }; } // namespace graph diff --git a/src/interface/storage.thrift b/src/interface/storage.thrift index c2feb3ec8a0..07c56e2b2fa 100644 --- a/src/interface/storage.thrift +++ b/src/interface/storage.thrift @@ -585,21 +585,11 @@ struct ScanVertexRequest { 10: optional RequestCommon common, } -struct ScanVertexResponse { - 1: required ResponseCommon result, - // The data will return as a dataset. The format is as follows: - // Each column represents one property. the column name is in the form of "tag_name.prop_alias" - // in the same order which specified in VertexProp in request. - 2: common.DataSet vertex_data, - 3: map (cpp.template = "std::unordered_map") - cursors; -} - struct ScanEdgeRequest { 1: common.GraphSpaceID space_id, 2: map (cpp.template = "std::unordered_map") parts, - 3: EdgeProp return_columns, + 3: list return_columns, // max row count of edge in this response 4: i64 limit, // only return data in time range [start_time, end_time) @@ -614,12 +604,13 @@ struct ScanEdgeRequest { 10: optional RequestCommon common, } -struct ScanEdgeResponse { +struct ScanResponse { 1: required ResponseCommon result, // The data will return as a dataset. The format is as follows: - // Each column represents one property. the column name is in the form of "edge_name.prop_alias" - // in the same order which specified in EdgeProp in requests. - 2: common.DataSet edge_data, + // Each column represents one property. the column name is in the form of "edge/tag_name.prop_alias" + // in the same order which specified in VertexProp/EdgeProp in request + // Should keep same with result of GetProps + 2: optional common.DataSet props, 3: map (cpp.template = "std::unordered_map") cursors; } @@ -679,8 +670,8 @@ service GraphStorageService { UpdateResponse updateVertex(1: UpdateVertexRequest req); UpdateResponse updateEdge(1: UpdateEdgeRequest req); - ScanVertexResponse scanVertex(1: ScanVertexRequest req) - ScanEdgeResponse scanEdge(1: ScanEdgeRequest req) + ScanResponse scanVertex(1: ScanVertexRequest req) + ScanResponse scanEdge(1: ScanEdgeRequest req) GetUUIDResp getUUID(1: GetUUIDReq req); diff --git a/src/storage/GraphStorageServiceHandler.cpp b/src/storage/GraphStorageServiceHandler.cpp index 23f9abe18ec..7f7f027af5e 100644 --- a/src/storage/GraphStorageServiceHandler.cpp +++ b/src/storage/GraphStorageServiceHandler.cpp @@ -135,13 +135,13 @@ folly::Future GraphStorageServiceHandler::future_lookupIn RETURN_FUTURE(processor); } -folly::Future GraphStorageServiceHandler::future_scanVertex( +folly::Future GraphStorageServiceHandler::future_scanVertex( const cpp2::ScanVertexRequest& req) { auto* processor = ScanVertexProcessor::instance(env_, &kScanVertexCounters, readerPool_.get()); RETURN_FUTURE(processor); } -folly::Future GraphStorageServiceHandler::future_scanEdge( +folly::Future GraphStorageServiceHandler::future_scanEdge( const cpp2::ScanEdgeRequest& req) { auto* processor = ScanEdgeProcessor::instance(env_, &kScanEdgeCounters, readerPool_.get()); RETURN_FUTURE(processor); diff --git a/src/storage/GraphStorageServiceHandler.h b/src/storage/GraphStorageServiceHandler.h index a28b1509cb1..d4e806d9bc5 100644 --- a/src/storage/GraphStorageServiceHandler.h +++ b/src/storage/GraphStorageServiceHandler.h @@ -55,10 +55,9 @@ class GraphStorageServiceHandler final : public cpp2::GraphStorageServiceSvIf { folly::Future future_chainAddEdges(const cpp2::AddEdgesRequest& req) override; - folly::Future future_scanVertex( - const cpp2::ScanVertexRequest& req) override; + folly::Future future_scanVertex(const cpp2::ScanVertexRequest& req) override; - folly::Future future_scanEdge(const cpp2::ScanEdgeRequest& req) override; + folly::Future future_scanEdge(const cpp2::ScanEdgeRequest& req) override; folly::Future future_getUUID(const cpp2::GetUUIDReq& req) override; diff --git a/src/storage/query/ScanEdgeProcessor.cpp b/src/storage/query/ScanEdgeProcessor.cpp index 94a6a03a1b2..29b9d3cce33 100644 --- a/src/storage/query/ScanEdgeProcessor.cpp +++ b/src/storage/query/ScanEdgeProcessor.cpp @@ -25,7 +25,8 @@ void ScanEdgeProcessor::process(const cpp2::ScanEdgeRequest& req) { void ScanEdgeProcessor::doProcess(const cpp2::ScanEdgeRequest& req) { spaceId_ = req.get_space_id(); enableReadFollower_ = req.get_enable_read_from_follower(); - limit_ = req.get_limit(); + // Negative means no limit + limit_ = req.get_limit() < 0 ? std::numeric_limits::max() : req.get_limit(); auto retCode = getSpaceVidLen(spaceId_); if (retCode != nebula::cpp2::ErrorCode::SUCCEEDED) { @@ -61,7 +62,7 @@ nebula::cpp2::ErrorCode ScanEdgeProcessor::checkAndBuildContexts(const cpp2::Sca return ret; } - std::vector returnProps = {*req.return_columns_ref()}; + std::vector returnProps = *req.return_columns_ref(); ret = handleEdgeProps(returnProps); buildEdgeColName(returnProps); ret = buildFilter(req, [](const cpp2::ScanEdgeRequest& r) -> const std::string* { @@ -85,7 +86,7 @@ void ScanEdgeProcessor::buildEdgeColName(const std::vector& edge } void ScanEdgeProcessor::onProcessFinished() { - resp_.set_edge_data(std::move(resultDataSet_)); + resp_.set_props(std::move(resultDataSet_)); resp_.set_cursors(std::move(cursors_)); } diff --git a/src/storage/query/ScanEdgeProcessor.h b/src/storage/query/ScanEdgeProcessor.h index 40c5186975d..f3798cabc83 100644 --- a/src/storage/query/ScanEdgeProcessor.h +++ b/src/storage/query/ScanEdgeProcessor.h @@ -16,7 +16,7 @@ namespace storage { extern ProcessorCounters kScanEdgeCounters; -class ScanEdgeProcessor : public QueryBaseProcessor { +class ScanEdgeProcessor : public QueryBaseProcessor { public: static ScanEdgeProcessor* instance(StorageEnv* env, const ProcessorCounters* counters = &kScanEdgeCounters, @@ -30,8 +30,7 @@ class ScanEdgeProcessor : public QueryBaseProcessor(env, counters, executor) { - } + : QueryBaseProcessor(env, counters, executor) {} nebula::cpp2::ErrorCode checkAndBuildContexts(const cpp2::ScanEdgeRequest& req) override; diff --git a/src/storage/query/ScanVertexProcessor.cpp b/src/storage/query/ScanVertexProcessor.cpp index bb9b3a705ad..c8624a0d490 100644 --- a/src/storage/query/ScanVertexProcessor.cpp +++ b/src/storage/query/ScanVertexProcessor.cpp @@ -5,6 +5,8 @@ #include "storage/query/ScanVertexProcessor.h" +#include + #include "common/utils/NebulaKeyUtils.h" #include "storage/StorageFlags.h" #include "storage/exec/QueryUtils.h" @@ -24,7 +26,8 @@ void ScanVertexProcessor::process(const cpp2::ScanVertexRequest& req) { void ScanVertexProcessor::doProcess(const cpp2::ScanVertexRequest& req) { spaceId_ = req.get_space_id(); - limit_ = req.get_limit(); + // negative limit number means no limit + limit_ = req.get_limit() < 0 ? std::numeric_limits::max() : req.get_limit(); enableReadFollower_ = req.get_enable_read_from_follower(); auto retCode = getSpaceVidLen(spaceId_); @@ -87,7 +90,7 @@ void ScanVertexProcessor::buildTagColName(const std::vector& t } void ScanVertexProcessor::onProcessFinished() { - resp_.set_vertex_data(std::move(resultDataSet_)); + resp_.set_props(std::move(resultDataSet_)); resp_.set_cursors(std::move(cursors_)); } diff --git a/src/storage/query/ScanVertexProcessor.h b/src/storage/query/ScanVertexProcessor.h index 39b34aedae9..6512c1788a6 100644 --- a/src/storage/query/ScanVertexProcessor.h +++ b/src/storage/query/ScanVertexProcessor.h @@ -16,8 +16,7 @@ namespace storage { extern ProcessorCounters kScanVertexCounters; -class ScanVertexProcessor - : public QueryBaseProcessor { +class ScanVertexProcessor : public QueryBaseProcessor { public: static ScanVertexProcessor* instance(StorageEnv* env, const ProcessorCounters* counters = &kScanVertexCounters, @@ -31,8 +30,7 @@ class ScanVertexProcessor private: ScanVertexProcessor(StorageEnv* env, const ProcessorCounters* counters, folly::Executor* executor) - : QueryBaseProcessor( - env, counters, executor) {} + : QueryBaseProcessor(env, counters, executor) {} nebula::cpp2::ErrorCode checkAndBuildContexts(const cpp2::ScanVertexRequest& req) override; diff --git a/src/storage/test/ScanEdgeTest.cpp b/src/storage/test/ScanEdgeTest.cpp index 381b0df6c33..320361726e9 100644 --- a/src/storage/test/ScanEdgeTest.cpp +++ b/src/storage/test/ScanEdgeTest.cpp @@ -14,13 +14,14 @@ namespace nebula { namespace storage { -cpp2::ScanEdgeRequest buildRequest(std::vector partIds, - std::vector cursors, - const std::pair>& edge, - int64_t rowLimit = 100, - int64_t startTime = 0, - int64_t endTime = std::numeric_limits::max(), - bool onlyLatestVer = false) { +cpp2::ScanEdgeRequest buildRequest( + std::vector partIds, + std::vector cursors, + const std::vector>>& edges, + int64_t rowLimit = 100, + int64_t startTime = 0, + int64_t endTime = std::numeric_limits::max(), + bool onlyLatestVer = false) { cpp2::ScanEdgeRequest req; req.set_space_id(1); cpp2::ScanCursor c; @@ -32,13 +33,17 @@ cpp2::ScanEdgeRequest buildRequest(std::vector partIds, parts.emplace(partIds[i], c); } req.set_parts(std::move(parts)); - EdgeType edgeType = edge.first; - cpp2::EdgeProp edgeProp; - edgeProp.set_type(edgeType); - for (const auto& prop : edge.second) { - (*edgeProp.props_ref()).emplace_back(std::move(prop)); + std::vector edgeProps; + for (const auto& edge : edges) { + EdgeType edgeType = edge.first; + cpp2::EdgeProp edgeProp; + edgeProp.set_type(edgeType); + for (const auto& prop : edge.second) { + (*edgeProp.props_ref()).emplace_back(std::move(prop)); + } + edgeProps.emplace_back(std::move(edgeProp)); } - req.set_return_columns(std::move(edgeProp)); + req.set_return_columns(std::move(edgeProps)); req.set_limit(rowLimit); req.set_start_time(startTime); req.set_end_time(endTime); @@ -104,14 +109,14 @@ TEST(ScanEdgeTest, PropertyTest) { serve, std::vector{kSrc, kType, kRank, kDst, "teamName", "startYear", "endYear"}); for (PartitionID partId = 1; partId <= totalParts; partId++) { - auto req = buildRequest({partId}, {""}, edge); + auto req = buildRequest({partId}, {""}, {edge}); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.edge_data_ref(), edge, edge.second.size(), totalRowCount); + checkResponse(*resp.props_ref(), edge, edge.second.size(), totalRowCount); } CHECK_EQ(mock::MockData::serves_.size(), totalRowCount); } @@ -120,7 +125,7 @@ TEST(ScanEdgeTest, PropertyTest) { size_t totalRowCount = 0; auto edge = std::make_pair(serve, std::vector{}); for (PartitionID partId = 1; partId <= totalParts; partId++) { - auto req = buildRequest({partId}, {""}, edge); + auto req = buildRequest({partId}, {""}, {edge}); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); @@ -128,7 +133,7 @@ TEST(ScanEdgeTest, PropertyTest) { ASSERT_EQ(0, resp.result.failed_parts.size()); // all 9 columns in value - checkResponse(*resp.edge_data_ref(), edge, 9, totalRowCount); + checkResponse(*resp.props_ref(), edge, 9, totalRowCount); } CHECK_EQ(mock::MockData::serves_.size(), totalRowCount); } @@ -155,14 +160,14 @@ TEST(ScanEdgeTest, CursorTest) { bool hasNext = true; std::string cursor = ""; while (hasNext) { - auto req = buildRequest({partId}, {cursor}, edge, 5); + auto req = buildRequest({partId}, {cursor}, {edge}, 5); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.edge_data_ref(), edge, edge.second.size(), totalRowCount); + checkResponse(*resp.props_ref(), edge, edge.second.size(), totalRowCount); hasNext = resp.get_cursors().at(partId).get_has_next(); if (hasNext) { CHECK(resp.get_cursors().at(partId).next_cursor_ref().has_value()); @@ -182,14 +187,14 @@ TEST(ScanEdgeTest, CursorTest) { bool hasNext = true; std::string cursor = ""; while (hasNext) { - auto req = buildRequest({partId}, {cursor}, edge, 1); + auto req = buildRequest({partId}, {cursor}, {edge}, 1); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.edge_data_ref(), edge, edge.second.size(), totalRowCount); + checkResponse(*resp.props_ref(), edge, edge.second.size(), totalRowCount); hasNext = resp.get_cursors().at(partId).get_has_next(); if (hasNext) { CHECK(resp.get_cursors().at(partId).next_cursor_ref().has_value()); @@ -218,20 +223,20 @@ TEST(ScanEdgeTest, MultiplePartsTest) { auto edge = std::make_pair( serve, std::vector{kSrc, kType, kRank, kDst, "teamName", "startYear", "endYear"}); - auto req = buildRequest({1, 3}, {"", ""}, edge); + auto req = buildRequest({1, 3}, {"", ""}, {edge}); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.edge_data_ref(), edge, edge.second.size(), totalRowCount); + checkResponse(*resp.props_ref(), edge, edge.second.size(), totalRowCount); } { LOG(INFO) << "Scan one edge with all properties in one batch"; size_t totalRowCount = 0; auto edge = std::make_pair(serve, std::vector{}); - auto req = buildRequest({1, 3}, {"", ""}, edge); + auto req = buildRequest({1, 3}, {"", ""}, {edge}); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); @@ -239,7 +244,7 @@ TEST(ScanEdgeTest, MultiplePartsTest) { ASSERT_EQ(0, resp.result.failed_parts.size()); // all 9 columns in value - checkResponse(*resp.edge_data_ref(), edge, 9, totalRowCount); + checkResponse(*resp.props_ref(), edge, 9, totalRowCount); } } @@ -261,14 +266,14 @@ TEST(ScanEdgeTest, LimitTest) { auto edge = std::make_pair( serve, std::vector{kSrc, kType, kRank, kDst, "teamName", "startYear", "endYear"}); - auto req = buildRequest({1}, {""}, edge, limit); + auto req = buildRequest({1}, {""}, {edge}, limit); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.edge_data_ref(), edge, edge.second.size(), totalRowCount); + checkResponse(*resp.props_ref(), edge, edge.second.size(), totalRowCount); EXPECT_EQ(totalRowCount, limit); } { @@ -276,7 +281,7 @@ TEST(ScanEdgeTest, LimitTest) { constexpr std::size_t limit = 3; size_t totalRowCount = 0; auto edge = std::make_pair(serve, std::vector{}); - auto req = buildRequest({1}, {""}, edge, limit); + auto req = buildRequest({1}, {""}, {edge}, limit); auto* processor = ScanEdgeProcessor::instance(env, nullptr); auto f = processor->getFuture(); processor->process(req); @@ -284,7 +289,7 @@ TEST(ScanEdgeTest, LimitTest) { ASSERT_EQ(0, resp.result.failed_parts.size()); // all 9 columns in value - checkResponse(*resp.edge_data_ref(), edge, 9, totalRowCount); + checkResponse(*resp.props_ref(), edge, 9, totalRowCount); EXPECT_EQ(totalRowCount, limit); } } @@ -307,7 +312,7 @@ TEST(ScanEdgeTest, FilterTest) { auto edge = std::make_pair( serve, std::vector{kSrc, kType, kRank, kDst, "teamName", "startYear", "endYear"}); - auto req = buildRequest({1}, {""}, edge, limit); + auto req = buildRequest({1}, {""}, {edge}, limit); Expression* filter = EdgePropertyExpression::make(&pool, "101", kSrc); filter = RelationalExpression::makeEQ( &pool, filter, ConstantExpression::make(&pool, "Damian Lillard")); @@ -328,7 +333,7 @@ TEST(ScanEdgeTest, FilterTest) { "101.endYear"}); expected.emplace_back( List({"Damian Lillard", 101, 2012, "Trail Blazers", "Trail Blazers", 2012, 2020})); - EXPECT_EQ(*resp.edge_data_ref(), expected); + EXPECT_EQ(*resp.props_ref(), expected); } } diff --git a/src/storage/test/ScanVertexTest.cpp b/src/storage/test/ScanVertexTest.cpp index ea972dd39e6..09653b7d1bf 100644 --- a/src/storage/test/ScanVertexTest.cpp +++ b/src/storage/test/ScanVertexTest.cpp @@ -120,7 +120,7 @@ TEST(ScanVertexTest, PropertyTest) { auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.vertex_data_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); } CHECK_EQ(mock::MockData::players_.size(), totalRowCount); } @@ -149,7 +149,7 @@ TEST(ScanVertexTest, PropertyTest) { ASSERT_EQ(0, resp.result.failed_parts.size()); // all 11 columns in value - checkResponse(*resp.vertex_data_ref(), respTag, 11 + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), respTag, 11 + 1 /* kVid */, totalRowCount); } CHECK_EQ(mock::MockData::players_.size(), totalRowCount); } @@ -182,8 +182,7 @@ TEST(ScanVertexTest, CursorTest) { auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse( - *resp.vertex_data_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); hasNext = resp.get_cursors().at(partId).get_has_next(); if (hasNext) { CHECK(resp.get_cursors().at(partId).next_cursor_ref()); @@ -209,8 +208,7 @@ TEST(ScanVertexTest, CursorTest) { auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse( - *resp.vertex_data_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); hasNext = resp.get_cursors().at(partId).get_has_next(); if (hasNext) { CHECK(resp.get_cursors().at(partId).next_cursor_ref()); @@ -245,7 +243,7 @@ TEST(ScanVertexTest, MultiplePartsTest) { auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.vertex_data_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); } { LOG(INFO) << "Scan one tag with all properties in one batch"; @@ -271,7 +269,7 @@ TEST(ScanVertexTest, MultiplePartsTest) { ASSERT_EQ(0, resp.result.failed_parts.size()); // all 11 columns in value - checkResponse(*resp.vertex_data_ref(), respTag, 11 + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), respTag, 11 + 1 /* kVid */, totalRowCount); } } @@ -299,7 +297,7 @@ TEST(ScanVertexTest, LimitTest) { auto resp = std::move(f).get(); ASSERT_EQ(0, resp.result.failed_parts.size()); - checkResponse(*resp.vertex_data_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), tag, tag.second.size() + 1 /* kVid */, totalRowCount); EXPECT_EQ(totalRowCount, limit); } { @@ -327,7 +325,7 @@ TEST(ScanVertexTest, LimitTest) { ASSERT_EQ(0, resp.result.failed_parts.size()); // all 11 columns in value - checkResponse(*resp.vertex_data_ref(), respTag, 11 + 1 /* kVid */, totalRowCount); + checkResponse(*resp.props_ref(), respTag, 11 + 1 /* kVid */, totalRowCount); EXPECT_EQ(totalRowCount, limit); } } @@ -433,7 +431,7 @@ TEST(ScanVertexTest, MultipleTagsTest) { 16.7, Value::kEmpty, Value::kEmpty})); - EXPECT_EQ(expect, *resp.vertex_data_ref()); + EXPECT_EQ(expect, *resp.props_ref()); } } @@ -471,7 +469,7 @@ TEST(ScanVertexTest, FilterTest) { {"_vid", "1._vid", "1._tag", "1.name", "1.age", "1.avgScore", "2._tag", "2.name"}); expect.emplace_back(List( {"Kobe Bryant", "Kobe Bryant", 1, "Kobe Bryant", 41, 25, Value::kEmpty, Value::kEmpty})); - EXPECT_EQ(expect, *resp.vertex_data_ref()); + EXPECT_EQ(expect, *resp.props_ref()); } { LOG(INFO) << "Scan one tag with some properties in one batch"; @@ -498,7 +496,7 @@ TEST(ScanVertexTest, FilterTest) { {"_vid", "1._vid", "1._tag", "1.name", "1.age", "1.avgScore", "2._tag", "2.name"}); expect.emplace_back(List( {"Kobe Bryant", "Kobe Bryant", 1, "Kobe Bryant", 41, 25, Value::kEmpty, Value::kEmpty})); - EXPECT_EQ(expect, *resp.vertex_data_ref()); + EXPECT_EQ(expect, *resp.props_ref()); } } diff --git a/tests/tck/features/match/Base.IntVid.feature b/tests/tck/features/match/Base.IntVid.feature index d06379f3775..36d9c69d83e 100644 --- a/tests/tck/features/match/Base.IntVid.feature +++ b/tests/tck/features/match/Base.IntVid.feature @@ -487,36 +487,36 @@ Feature: Basic match """ MATCH (v) return v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v{name: "Tim Duncan"}) return v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v{name:"Tim Duncan"}) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v:player:bachelor) RETURN v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v:player:bachelor) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v:player{age:23}:bachelor) RETURN v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v:player{age:23}:bachelor) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH () -[]-> (v) return * """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH ()-->(v) RETURN * + Then a ExecutionError should be raised at runtime: Scan edges must specify limit number. When executing query: """ MATCH () --> (v) --> () return * """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH ()-->(v)-->() RETURN * + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. # The 0 step means node scan in fact, but p and t has no label or properties for index seek # So it's not workable now When executing query: """ MATCH (p)-[:serve*0..3]->(t) RETURN p """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (p)-[:serve*0..3]->(t) RETURN p + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. diff --git a/tests/tck/features/match/Base.feature b/tests/tck/features/match/Base.feature index ddd9f76d970..2177de5273e 100644 --- a/tests/tck/features/match/Base.feature +++ b/tests/tck/features/match/Base.feature @@ -596,36 +596,36 @@ Feature: Basic match """ MATCH (v) return v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v{name: "Tim Duncan"}) return v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v{name:"Tim Duncan"}) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v:player:bachelor) RETURN v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v:player:bachelor) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v:player{age:23}:bachelor) RETURN v """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (v:player{age:23}:bachelor) RETURN v + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH () -[]-> (v) return * """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH ()-->(v) RETURN * + Then a ExecutionError should be raised at runtime: Scan edges must specify limit number. When executing query: """ MATCH () --> (v) --> () return * """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH ()-->(v)-->() RETURN * + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. # The 0 step means node scan in fact, but p and t has no label or properties for index seek # So it's not workable now When executing query: """ MATCH (p)-[:serve*0..3]->(t) RETURN p """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (p)-[:serve*0..3]->(t) RETURN p + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. diff --git a/tests/tck/features/match/Scan.feature b/tests/tck/features/match/Scan.feature new file mode 100644 index 00000000000..faf8e5cded3 --- /dev/null +++ b/tests/tck/features/match/Scan.feature @@ -0,0 +1,157 @@ +# Copyright (c) 2021 vesoft inc. All rights reserved. +# +# This source code is licensed under Apache 2.0 License. +Feature: Match seek by scan + + Background: Prepare space + Given a graph with space named "student" + + Scenario: query vertices by scan + When executing query: + """ + MATCH (v) + RETURN v.name AS Name + LIMIT 3 + """ + Then the result should be, in any order: + | Name | + | /\w+/ | + | /\w+/ | + | /\w+/ | + When executing query: + """ + MATCH (v:teacher) + RETURN v.name AS Name + LIMIT 3 + """ + Then the result should be, in any order: + | Name | + | /\w+/ | + | /\w+/ | + | /\w+/ | + # TODO check index validation in match planner entry + # When executing query: + # """ + # MATCH (v:teacher) + # WHERE v.name = "Mary" + # RETURN v.name AS Name + # LIMIT 3 + # """ + # Then the result should be, in any order: + # | Name | + # | "Mary" | + # When executing query: + # """ + # MATCH (v:teacher {name: "Mary"}) + # RETURN v.name AS Name + # LIMIT 3 + # """ + # Then the result should be, in any order: + # | Name | + # | "Mary" | + When executing query: + """ + MATCH (v:teacher:student) + RETURN v.name AS Name + LIMIT 3 + """ + Then the result should be, in any order: + | Name | + When executing query: + """ + MATCH (v:person:teacher) + RETURN v.name AS Name + LIMIT 3 + """ + Then the result should be, in any order: + | Name | + | /\w+/ | + | /\w+/ | + | /\w+/ | + When executing query: + """ + MATCH (v:person{name: "Mary"}:teacher) + RETURN v.name AS Name + LIMIT 3 + """ + Then the result should be, in any order: + | Name | + | "Mary" | + + Scenario: query vertices by scan failed + When executing query: + """ + MATCH (v) + RETURN v.name AS Name + """ + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. + When executing query: + """ + MATCH (v{name: "Mary"}) + RETURN v.name AS Name + LIMIT 3 + """ + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. + + Scenario: query edge by scan + When executing query: + """ + MATCH ()-[e]->() + RETURN type(e) AS Type + LIMIT 3 + """ + Then the result should be, in any order: + | Type | + | /[\w_]+/ | + | /[\w_]+/ | + | /[\w_]+/ | + When executing query: + """ + MATCH ()-[e:is_teacher]->() + RETURN type(e) AS Type, e.start_year AS StartYear, e.end_year AS EndYear + LIMIT 3 + """ + Then the result should be, in any order: + | Type | StartYear | EndYear | + | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + + # TODO check index validation in match planner entry + # When executing query: + # """ + # MATCH ()-[e:is_teacher]->() + # WHERE e.start_year == 2018 + # RETURN type(e) AS Type, e.start_year AS StartYear, e.end_year AS EndYear + # LIMIT 3 + # """ + # Then the result should be, in any order: + # | Type | StartYear | EndYear | + # | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + # | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + # | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + # When executing query: + # """ + # MATCH ()-[e:is_teacher {start_year: 2018}]->() + # RETURN type(e) AS Type, e.start_year AS StartYear, e.end_year AS EndYear + # LIMIT 3 + # """ + # Then the result should be, in any order: + # | Type | StartYear | EndYear | + # | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + # | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + # | /[\w_]+/ | /\d{4}/ | /\d{4}/ | + Scenario: query edge by scan failed + When executing query: + """ + MATCH ()-[e]->() + RETURN type(e) AS Type + """ + Then a ExecutionError should be raised at runtime: Scan edges must specify limit number. + When executing query: + """ + MATCH (v)-[e]->() + RETURN v.name, type(e) AS Type + LIMIT 3 + """ + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. diff --git a/tests/tck/features/match/SeekByEdge.feature b/tests/tck/features/match/SeekByEdge.feature index ef1629c7652..51c1983eb0b 100644 --- a/tests/tck/features/match/SeekByEdge.feature +++ b/tests/tck/features/match/SeekByEdge.feature @@ -1469,7 +1469,7 @@ Feature: Match seek by edge MATCH (p1)-[:teammate]->(p2) RETURN p1.name, id(p2) """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (p1)-[:teammate]->(p2) RETURN p1.name,id(p2) + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. Scenario Outline: seek by edge in a single edge type space Given an empty graph @@ -1490,16 +1490,16 @@ Feature: Match seek by edge MATCH (p1)-[]->(p2) RETURN p1.name, id(p2) """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (p1)-->(p2) RETURN p1.name,id(p2) + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (p1)-[b]->(p2) RETURN p1.name, id(p2) """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (p1)-[b]->(p2) RETURN p1.name,id(p2) + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (p1)-[:edge_1]->(p2) RETURN p1.name, id(p2) """ - Then a SemanticError should be raised at runtime: Can't solve the start vids from the sentence: MATCH (p1)-[:edge_1]->(p2) RETURN p1.name,id(p2) + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. diff --git a/tests/tck/features/match/SeekById.feature b/tests/tck/features/match/SeekById.feature index e4793ecea7b..c3dd7f5ba72 100644 --- a/tests/tck/features/match/SeekById.feature +++ b/tests/tck/features/match/SeekById.feature @@ -222,37 +222,37 @@ Feature: Match seek by id WHERE NOT id(v) == 'Paul Gasol' RETURN v.name AS Name, v.age AS Age """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE NOT id(v) IN ['James Harden', 'Jonathon Simmons', 'Klay Thompson', 'Dejounte Murray'] RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE id(v) IN ['James Harden', 'Jonathon Simmons', 'Klay Thompson', 'Dejounte Murray'] - OR v.age == 23 + OR v.age == 23 RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE id(v) == 'James Harden' - OR v.age == 23 + OR v.age == 23 RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE id(x) == 'James Harden' RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a SemanticError should be raised at runtime: Alias used but not defined: `x' When executing query: """ MATCH (v) @@ -266,7 +266,7 @@ Feature: Match seek by id WHERE id(v) IN ['James Harden', v.name] RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. Scenario: Start from end When executing query: diff --git a/tests/tck/features/match/SeekById.intVid.feature b/tests/tck/features/match/SeekById.intVid.feature index 02a9f94c806..fb5fa4db1c2 100644 --- a/tests/tck/features/match/SeekById.intVid.feature +++ b/tests/tck/features/match/SeekById.intVid.feature @@ -222,44 +222,44 @@ Feature: Match seek by id WHERE NOT id(v) == hash('Paul Gasol') RETURN v.name AS Name, v.age AS Age """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE NOT id(v) IN [hash('James Harden'), hash('Jonathon Simmons'), hash('Klay Thompson'), hash('Dejounte Murray')] RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE id(v) IN [hash('James Harden'), hash('Jonathon Simmons'), hash('Klay Thompson'), hash('Dejounte Murray')] - OR v.age == 23 + OR v.age == 23 RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE id(v) == hash('James Harden') - OR v.age == 23 + OR v.age == 23 RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. When executing query: """ MATCH (v) WHERE id(x) == hash('James Harden') RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a SemanticError should be raised at runtime: Alias used but not defined: `x' When executing query: """ MATCH (v) WHERE id(v) IN [hash('James Harden'), v.name] RETURN v.name AS Name """ - Then a SemanticError should be raised at runtime: + Then a ExecutionError should be raised at runtime: Scan vertices must specify limit number. Scenario: with arithmetic When executing query: diff --git a/tests/tck/features/optimizer/PushLimitDownScanEdgesRule.feature b/tests/tck/features/optimizer/PushLimitDownScanEdgesRule.feature new file mode 100644 index 00000000000..a0aabec877f --- /dev/null +++ b/tests/tck/features/optimizer/PushLimitDownScanEdgesRule.feature @@ -0,0 +1,47 @@ +# Copyright (c) 2021 vesoft inc. All rights reserved. +# +# This source code is licensed under Apache 2.0 License. +Feature: Push Limit down scan edges rule + + Background: + Given a graph with space named "student" + + Scenario: push limit down to ScanEdges + When profiling query: + """ + MATCH ()-[e:is_teacher]->() + RETURN e.start_year LIMIT 3 + """ + Then the result should be, in any order: + | e.start_year | + | /\d+/ | + | /\d+/ | + | /\d+/ | + And the execution plan should be: + | id | name | dependencies | operator info | + | 9 | DataCollect | 19 | | + | 19 | Project | 16 | | + | 16 | Limit | 11 | | + | 11 | AppendVertices | 3 | | + | 3 | Project | 2 | | + | 2 | ScanEdges | 0 | {"limit": "3"} | + | 0 | Start | | | + When profiling query: + """ + MATCH ()-[e]->() + RETURN type(e) LIMIT 3 + """ + Then the result should be, in any order: + | type(e) | + | /\w+/ | + | /\w+/ | + | /\w+/ | + And the execution plan should be: + | id | name | dependencies | operator info | + | 9 | DataCollect | 19 | | + | 19 | Project | 16 | | + | 16 | Limit | 11 | | + | 11 | AppendVertices | 3 | | + | 3 | Project | 2 | | + | 2 | ScanEdges | 0 | {"limit": "3"} | + | 0 | Start | | | diff --git a/tests/tck/features/optimizer/PushLimitDownScanVerticesRule.feature b/tests/tck/features/optimizer/PushLimitDownScanVerticesRule.feature new file mode 100644 index 00000000000..dd503af4909 --- /dev/null +++ b/tests/tck/features/optimizer/PushLimitDownScanVerticesRule.feature @@ -0,0 +1,45 @@ +# Copyright (c) 2021 vesoft inc. All rights reserved. +# +# This source code is licensed under Apache 2.0 License. +Feature: Push Limit down scan vertices rule + + Background: + Given a graph with space named "student" + + Scenario: push limit down to ScanVertices + When profiling query: + """ + MATCH (v) + RETURN v.name LIMIT 3 + """ + Then the result should be, in any order: + | v.name | + | /\w+/ | + | /\w+/ | + | /\w+/ | + And the execution plan should be: + | id | name | dependencies | operator info | + | 9 | DataCollect | 19 | | + | 19 | Project | 16 | | + | 16 | Limit | 11 | | + | 11 | AppendVertices | 2 | | + | 2 | ScanVertices | 0 | {"limit": "3"} | + | 0 | Start | | | + When profiling query: + """ + MATCH (v:person) + RETURN v.name LIMIT 3 + """ + Then the result should be, in any order: + | v.name | + | /\w+/ | + | /\w+/ | + | /\w+/ | + And the execution plan should be: + | id | name | dependencies | operator info | + | 9 | DataCollect | 19 | | + | 19 | Project | 16 | | + | 16 | Limit | 11 | | + | 11 | AppendVertices | 2 | | + | 2 | ScanVertices | 0 | {"limit": "3"} | + | 0 | Start | | |