forked from oceanbase/oceanbase
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathob_topk_op.cpp
More file actions
140 lines (128 loc) · 4.45 KB
/
ob_topk_op.cpp
File metadata and controls
140 lines (128 loc) · 4.45 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
/**
* Copyright (c) 2021 OceanBase
* OceanBase CE is licensed under Mulan PubL v2.
* You can use this software according to the terms and conditions of the Mulan PubL v2.
* You may obtain a copy of Mulan PubL v2 at:
* http://license.coscl.org.cn/MulanPubL-2.0
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PubL v2 for more details.
*/
#define USING_LOG_PREFIX SQL_ENG
#include "sql/engine/basic/ob_topk_op.h"
#include "sql/engine/basic/ob_limit_op.h"
#include "sql/engine/sort/ob_sort_op.h"
#include "sql/engine/aggregate/ob_hash_groupby_op.h"
namespace oceanbase {
namespace sql {
using namespace oceanbase::common;
/**
 * Builds a TopK operator spec on top of the generic ObOpSpec.
 *
 * @param alloc  allocator forwarded to the ObOpSpec base
 * @param type   physical operator type forwarded to the ObOpSpec base
 *
 * All TopK-specific fields start in an "unset" state: both numeric settings
 * are -1 and both limit/offset expression pointers are NULL.
 */
ObTopKSpec::ObTopKSpec(ObIAllocator& alloc, const ObPhyOperatorType type)
    : ObOpSpec(alloc, type),
      minimum_row_count_(-1),  // not configured yet
      topk_precision_(-1),     // not configured yet
      org_limit_(NULL),        // original LIMIT expression, none yet
      org_offset_(NULL)        // original OFFSET expression, none yet
{
}
/**
 * Sanity check used before the operator is opened.
 *
 * @return true only when this spec has a positive output count, a limit
 *         expression is attached, a child spec is attached, and that child
 *         also has a positive output count.
 */
bool ObTopKSpec::is_valid() const
{
  bool valid = false;
  if (!(get_output_count() > 0)) {
    // this spec produces no output
  } else if (NULL == org_limit_) {
    // a limit expression is mandatory (the offset may stay NULL)
  } else if (NULL == child_) {
    // nothing to read rows from
  } else {
    valid = (child_->get_output_count() > 0);
  }
  return valid;
}
// Serialization member list for ObTopKSpec: names ObOpSpec as the base part and
// lists the four TopK-specific fields.
// NOTE(review): presumably the order of the listed members defines the serialized
// layout -- confirm against the macro definition before reordering or inserting fields.
OB_SERIALIZE_MEMBER((ObTopKSpec, ObOpSpec), minimum_row_count_, topk_precision_, org_limit_, org_offset_);
/**
 * Creates the runtime TopK operator.
 *
 * @param exec_ctx  execution context forwarded to ObOperator
 * @param spec      operator spec forwarded to ObOperator
 * @param input     operator input forwarded to ObOperator
 *
 * topk_final_count_ starts at -1 (not computed yet) and output_count_ at 0
 * (no row returned yet).
 */
ObTopKOp::ObTopKOp(ObExecContext& exec_ctx, const ObOpSpec& spec, ObOpInput* input)
    : ObOperator(exec_ctx, spec, input),
      topk_final_count_(-1),
      output_count_(0)
{
}
/**
 * Open hook: only verifies that the operator's spec is usable.
 *
 * @return OB_SUCCESS when MY_SPEC.is_valid() holds, OB_ERR_UNEXPECTED otherwise
 *         (a warning is logged in that case).
 */
int ObTopKOp::inner_open()
{
  int ret = MY_SPEC.is_valid() ? OB_SUCCESS : OB_ERR_UNEXPECTED;
  if (OB_SUCCESS != ret) {
    LOG_WARN("topk operator is invalid", K(ret));
  }
  return ret;
}
/**
 * Restarts the operator.
 *
 * Clears the emitted-row counter and then delegates to ObOperator::rescan().
 * With output_count_ back at 0, the next inner_get_next_row() call takes its
 * first-row path and recomputes topk_final_count_.
 *
 * @return whatever ObOperator::rescan() returns
 */
int ObTopKOp::rescan()
{
  output_count_ = 0;
  const int ret = ObOperator::rescan();
  return ret;
}
/**
 * Produces the next row of the TopK result.
 *
 * Rows are pulled from the child until topk_final_count_ rows have been
 * emitted. The final count is computed lazily by get_topk_final_count() right
 * after the first child row has been fetched (i.e. while output_count_ is 0).
 *
 * @return OB_SUCCESS   a row was produced
 *         OB_ITER_END  the child is exhausted, the TopK quota is reached, or
 *                      the computed quota is 0
 *         other        error propagated from the child or from
 *                      get_topk_final_count()
 */
int ObTopKOp::inner_get_next_row()
{
  int ret = OB_SUCCESS;
  if (0 == output_count_ || output_count_ < topk_final_count_) {
    if (OB_FAIL(child_->get_next_row())) {
      // OB_ITER_END is the normal end-of-data signal; only real failures
      // deserve a warning.
      if (OB_ITER_END != ret) {
        LOG_WARN("child get next row", K(ret), K(output_count_), K(topk_final_count_));
      }
    } else {
      if (0 == output_count_) {
        // First row: work out how many rows this operator may emit in total.
        if (OB_FAIL(get_topk_final_count())) {
          LOG_WARN("get topk count failed", K(ret));
        } else if (OB_UNLIKELY(0 == topk_final_count_)) {
          // Quota of zero: the row just fetched must not be returned.
          ret = OB_ITER_END;
        }
      }
      if (OB_SUCC(ret)) {
        clear_evaluated_flag();
        ++output_count_;
      }
    }
  } else {
    // Quota already reached.
    ret = OB_ITER_END;
  }
  return ret;
}
/**
 * Computes topk_final_count_, the number of rows this operator will emit.
 *
 * Steps:
 *  1. Evaluate the original LIMIT and (unless LIMIT evaluated to NULL) OFFSET
 *     expressions through ObLimitOp::get_int_val().
 *  2. Clamp NULL / negative values to 0 and take
 *     max(minimum_row_count_, limit + offset) as the base quota.
 *  3. Ask the child (SORT or HASH GROUP BY) how many rows it holds and raise
 *     the quota to row_count * topk_precision_ / 100 if that is larger.
 *  4. Tell the plan context whether the result is accurate, i.e. whether the
 *     quota covers every child row.
 *
 * @return OB_SUCCESS on success;
 *         OB_ERR_UNEXPECTED when child_ or the physical plan context is NULL,
 *         or when the child operator type is not supported (MATERIAL is
 *         explicitly rejected);
 *         otherwise the error returned by ObLimitOp::get_int_val().
 */
int ObTopKOp::get_topk_final_count()
{
  int ret = OB_SUCCESS;
  int64_t limit = -1;
  int64_t offset = 0;
  bool is_null_value = false;
  ObPhysicalPlanCtx* plan_ctx = ctx_.get_physical_plan_ctx();
  if (OB_ISNULL(child_) || OB_ISNULL(plan_ctx)) {
    ret = OB_ERR_UNEXPECTED;
    LOG_WARN("child_ or plan_ctx is NULL", K(ret), KP(child_), KP(plan_ctx));
  } else if (OB_FAIL(ObLimitOp::get_int_val(MY_SPEC.org_limit_, eval_ctx_, limit, is_null_value))) {
    LOG_WARN("get limit values failed", K(ret));
  } else if (!is_null_value && OB_FAIL(ObLimitOp::get_int_val(MY_SPEC.org_offset_, eval_ctx_, offset, is_null_value))) {
    LOG_WARN("get offset values failed", K(ret));
  } else {
    // revise limit, offset because rownum < -1 is rewritten as limit -1
    limit = (is_null_value || limit < 0) ? 0 : limit;
    offset = (is_null_value || offset < 0) ? 0 : offset;
    topk_final_count_ = std::max(MY_SPEC.minimum_row_count_, limit + offset);
    int64_t row_count = 0;
    ObPhyOperatorType op_type = child_->get_spec().get_type();
    switch (op_type) {
      case PHY_SORT: {
        ObSortOp* sort_op = static_cast<ObSortOp*>(child_);
        // The getter yields a row count, not an error code: it must not be
        // routed through OB_FAIL, which would store the count in `ret` and
        // treat every non-empty sort as a failure.
        row_count = sort_op->get_sort_row_count();
        break;
      }
      case PHY_MATERIAL: {
        ret = OB_ERR_UNEXPECTED;
        LOG_WARN("material not implimented yet", K(ret));
        break;
      }
      case PHY_HASH_GROUP_BY: {
        ObHashGroupByOp* gby_op = static_cast<ObHashGroupByOp*>(child_);
        row_count = gby_op->get_hash_groupby_row_count();
        break;
      }
      default: {
        ret = OB_ERR_UNEXPECTED;
        LOG_WARN("invalid child_ for topk operator", K(ret), K(op_type));
        break;
      }
    }
    if (OB_SUCC(ret)) {
      // Precision is a percentage of the child's rows; never go below the base quota.
      topk_final_count_ = std::max(topk_final_count_, static_cast<int64_t>(row_count * MY_SPEC.topk_precision_ / 100));
      // The result is accurate only when the quota covers all child rows.
      plan_ctx->set_is_result_accurate(topk_final_count_ >= row_count);
    }
  }
  return ret;
}
} // namespace sql
} // namespace oceanbase