blob: b4f64630f7754b988d1d919a12599b6806632eae (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
|
#include "grammar.h"
#include <yql/essentials/sql/v1/reflect/sql_reflect.h>
namespace NSQLComplete {
// ISqlGrammar implementation backed by the vocabulary of the generated
// SQLv1 ANTLR4 parser. All token sets are computed once in the constructor
// and are immutable afterwards; the accessors only hand out references.
class TSqlGrammar final: public ISqlGrammar {
public:
    // Builds the token sets.
    //
    // grammar - reflected lexer grammar; its KeywordNames and
    //           PunctuationNames decide which vocabulary tokens are
    //           classified as keywords and as punctuation.
    //
    // The initializers below depend on each other: AllTokens reads
    // Vocabulary, and the keyword/punctuation sets read both. Members are
    // initialized in declaration order, so the order of the data members at
    // the bottom of the class must be kept in sync with this list.
    explicit TSqlGrammar(const NSQLReflect::TLexerGrammar& grammar)
        : Vocabulary(GetVocabularyP())
        , AllTokens(ComputeAllTokens())
        , KeywordTokens(ComputeKeywordTokens(grammar))
        , PunctuationTokens(ComputePunctuationTokens(grammar))
    {
    }

    // Vocabulary used to map token ids to their symbolic names.
    const antlr4::dfa::Vocabulary& GetVocabulary() const override {
        return *Vocabulary;
    }

    // Every token id in the range [1, vocabulary.getMaxTokenType()].
    const std::unordered_set<TTokenId>& GetAllTokens() const override {
        return AllTokens;
    }

    // Tokens whose symbolic name is listed in the grammar's KeywordNames.
    const std::unordered_set<TTokenId>& GetKeywordTokens() const override {
        return KeywordTokens;
    }

    // Tokens whose symbolic name is listed in the grammar's PunctuationNames.
    const std::unordered_set<TTokenId>& GetPunctuationTokens() const override {
        return PunctuationTokens;
    }

private:
    // Returns a pointer to the vocabulary of the generated SQLv1 parser.
    //
    // NOTE(review): the parser object is a temporary that is destroyed at
    // the end of the return statement. Keeping the pointer is only valid if
    // getVocabulary() refers to storage that outlives the parser instance -
    // confirm against the generated parser.
    static const antlr4::dfa::Vocabulary* GetVocabularyP() {
        return &NALADefaultAntlr4::SQLv1Antlr4Parser(nullptr).getVocabulary();
    }

    // Enumerates token types 1..getMaxTokenType() inclusive.
    // Requires Vocabulary to be initialized.
    std::unordered_set<TTokenId> ComputeAllTokens() const {
        const auto& vocabulary = *Vocabulary;

        std::unordered_set<TTokenId> allTokens;
        for (size_t type = 1; type <= vocabulary.getMaxTokenType(); ++type) {
            allTokens.emplace(type);
        }
        return allTokens;
    }

    // Returns the subset of AllTokens whose symbolic name is contained in
    // `names`. Requires Vocabulary and AllTokens to be initialized; reads
    // the members directly so that no virtual accessor is invoked while the
    // object is still being constructed.
    template <class TNames>
    std::unordered_set<TTokenId> SelectTokensNamedIn(const TNames& names) const {
        auto selected = AllTokens;
        std::erase_if(selected, [&](TTokenId token) {
            return !names.contains(Vocabulary->getSymbolicName(token));
        });
        return selected;
    }

    // Keyword tokens according to grammar.KeywordNames.
    std::unordered_set<TTokenId> ComputeKeywordTokens(
        const NSQLReflect::TLexerGrammar& grammar) const {
        auto keywordTokens = SelectTokensNamedIn(grammar.KeywordNames);
        // Drop TOKEN_EOF explicitly so it is never reported as a keyword.
        keywordTokens.erase(TOKEN_EOF);
        return keywordTokens;
    }

    // Punctuation tokens according to grammar.PunctuationNames.
    std::unordered_set<TTokenId> ComputePunctuationTokens(
        const NSQLReflect::TLexerGrammar& grammar) const {
        return SelectTokensNamedIn(grammar.PunctuationNames);
    }

    // Declaration order matters: see the constructor comment.
    const antlr4::dfa::Vocabulary* Vocabulary;
    const std::unordered_set<TTokenId> AllTokens;
    const std::unordered_set<TTokenId> KeywordTokens;
    const std::unordered_set<TTokenId> PunctuationTokens;
};
// Returns the shared default SQL grammar. The instance is a function-local
// static built from NSQLReflect::LoadLexerGrammar() the first time this
// function is called; every call returns a reference to that same object.
const ISqlGrammar& GetSqlGrammar() {
    static const TSqlGrammar instance(NSQLReflect::LoadLexerGrammar());
    return instance;
}
} // namespace NSQLComplete
|