1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
|
#pragma once
#include "mkql_match_recognize_list.h"
#include <yql/essentials/minikql/computation/mkql_computation_node_impl.h>
#include <yql/essentials/minikql/computation/mkql_computation_node_holders.h>
namespace NKikimr::NMiniKQL::NMatchRecognize {
template<class R>
using TMatchedVar = std::vector<R, TMKQLAllocator<R>>;
template<class R>
void Extend(TMatchedVar<R>& var, const R& r) {
if (var.empty()) {
var.emplace_back(r);
} else {
MKQL_ENSURE(r.From() > var.back().To(), "Internal logic error");
if (var.back().To() + 1 == r.From() && var.back().NfaIndex() == r.NfaIndex()) {
var.back().Extend();
} else {
var.emplace_back(r);
}
}
}
template<class R>
using TMatchedVars = std::vector<TMatchedVar<R>, TMKQLAllocator<TMatchedVar<R>>>;
template<class R>
NUdf::TUnboxedValue ToValue(const THolderFactory& holderFactory, const R& range) {
std::array<NUdf::TUnboxedValue, 2> array = {NUdf::TUnboxedValuePod{range.From()}, NUdf::TUnboxedValuePod{range.To()}};
return holderFactory.RangeAsArray(cbegin(array), cend(array));
}
template<class R>
NUdf::TUnboxedValue ToValue(const THolderFactory& holderFactory, const TMatchedVar<R>& var) {
TUnboxedValueVector data;
data.reserve(var.size());
for (const auto& r: var) {
data.push_back(ToValue(holderFactory, r));
}
return holderFactory.VectorAsVectorHolder(std::move(data));
}
template<class R>
inline NUdf::TUnboxedValue ToValue(const THolderFactory& holderFactory, const TMatchedVars<R>& vars) {
NUdf::TUnboxedValue* ptr;
auto result = holderFactory.CreateDirectArrayHolder(vars.size(), ptr);
for (const auto& v: vars) {
*ptr++ = ToValue(holderFactory, v);
}
return result;
}
///Optimized reference based implementation to be used as an argument
///for lambdas which produce strict result(do not require lazy access to its arguments)
template<class R>
class TMatchedVarsValue : public TComputationValue<TMatchedVarsValue<R>> {
class TRangeList: public TComputationValue<TRangeList> {
class TIterator : public TComputationValue<TIterator> {
public:
TIterator(TMemoryUsageInfo* memInfo, const THolderFactory& holderFactory, const std::vector<R, TMKQLAllocator<R>>& ranges)
: TComputationValue<TIterator>(memInfo)
, HolderFactory(holderFactory)
, Ranges(ranges)
, Index(0)
{}
private:
bool Next(NUdf::TUnboxedValue& value) override {
if (Ranges.size() == Index){
return false;
}
value = ToValue(HolderFactory, Ranges[Index++]);
return true;
}
const THolderFactory& HolderFactory;
const std::vector<R, TMKQLAllocator<R>>& Ranges;
size_t Index;
};
public:
TRangeList(TMemoryUsageInfo* memInfo, const THolderFactory& holderFactory, const TMatchedVar<R>& v)
: TComputationValue<TRangeList>(memInfo)
, HolderFactory(holderFactory)
, Var(v)
{
}
bool HasFastListLength() const override {
return true;
}
ui64 GetListLength() const override {
return Var.size();
}
bool HasListItems() const override {
return !Var.empty();
}
NUdf::TUnboxedValue GetListIterator() const override {
return HolderFactory.Create<TIterator>(HolderFactory, Var);
}
private:
const THolderFactory& HolderFactory;
const TMatchedVar<R>& Var;
};
public:
TMatchedVarsValue(TMemoryUsageInfo* memInfo, const THolderFactory& holderFactory, const std::vector<TMatchedVar<R>, TMKQLAllocator<TMatchedVar<R>>>& vars)
: TComputationValue<TMatchedVarsValue>(memInfo)
, HolderFactory(holderFactory)
, Vars(vars)
{}
NUdf::TUnboxedValue GetElement(ui32 index) const override {
return HolderFactory.Create<TRangeList>(HolderFactory, Vars[index]);
}
private:
const THolderFactory& HolderFactory;
const std::vector<TMatchedVar<R>, TMKQLAllocator<TMatchedVar<R>>>& Vars;
};
}//namespace NKikimr::NMiniKQL::NMatchRecognize
|