-- path: root/.github/scripts/analytics/data_mart_queries/perfomance_olap_mart.sql
-- blob: a56b3574cac38efcee8393f58498c07a247abb30
-- Lower bound of the reporting window: the current UTC date minus 30 days.
-- Note that despite the name this is a Date value (produced by CurrentUtcDate()).
$start_timestamp = CurrentUtcDate() - Interval("P30D");

-- Catalogue of tests: one row per distinct (Db, Suite, Test) combination that has
-- at least one result row inside the reporting window.
$all_suites = (
    SELECT
        Db,
        Suite,
        Test
    FROM (
        -- Collect the distinct test names of every (Db, Suite) pair into a sorted list ...
        SELECT
            Suite,
            Db,
            ListSort(AGG_LIST_DISTINCT(Test)) AS TestNames
        FROM `perfomance/olap/tests_results`
        WHERE Timestamp >= $start_timestamp
        GROUP BY Db, Suite
    )
    -- ... and unfold that list back into one row per test name.
    FLATTEN LIST BY TestNames AS Test
);

-- One row per launch: result rows inside the reporting window grouped by
-- Db, cluster version and launch id.
$launch_times_raw = (
    SELECT
        Db,
        Version,
        LunchId,
        -- Smallest RunId of the launch, divided by 1000 and cast to Timestamp.
        CAST(MIN(RunId / 1000UL) AS Timestamp) AS Run_start_timestamp,
        -- Ordinal of the launch among launches of the same Db and Version, oldest first.
        ROW_NUMBER() OVER (
            PARTITION BY Db, Version
            ORDER BY MIN(RunId) ASC
        ) AS Run_number_in_version,
        -- CI and test-tools versions are read from the Info of the row with the largest RunId.
        JSON_VALUE(MAX_BY(Info, RunId), "$.ci_version") AS CiVersion,
        JSON_VALUE(MAX_BY(Info, RunId), "$.test_tools_version") AS TestToolsVersion
    FROM `perfomance/olap/tests_results`
    WHERE Timestamp >= $start_timestamp
    GROUP BY
        Db,
        JSON_VALUE(Info, "$.cluster.version") AS Version,
        -- Rows without `ci_launch_id` fall back to their RunId as the launch key.
        COALESCE(JSON_VALUE(Info, "$.ci_launch_id"), CAST(RunId AS String)) AS LunchId
);

-- Launch x test template: every launch of a Db paired with every (Suite, Test) known
-- for that Db, plus "branch" names derived from the three version strings.
-- A branch is the part of the version string before its last '.';
-- it is 'unknown' when that expression evaluates to NULL.
$launch_times = (
    SELECT
        launch_times_raw.*,
        all_suites.Suite AS Suite,
        all_suites.Test AS Test,
        COALESCE(
            SubString(
                CAST(launch_times_raw.Version AS String),
                0U,
                RFIND(CAST(launch_times_raw.Version AS String), '.')
            ),
            'unknown'
        ) AS Branch,
        COALESCE(
            SubString(
                CAST(launch_times_raw.CiVersion AS String),
                0U,
                RFIND(CAST(launch_times_raw.CiVersion AS String), '.')
            ),
            'unknown'
        ) AS CiBranch,
        COALESCE(
            SubString(
                CAST(launch_times_raw.TestToolsVersion AS String),
                0U,
                RFIND(CAST(launch_times_raw.TestToolsVersion AS String), '.')
            ),
            'unknown'
        ) AS TestToolsBranch
    FROM $all_suites AS all_suites
    LEFT JOIN $launch_times_raw AS launch_times_raw
        ON all_suites.Db = launch_times_raw.Db
);

-- Per-test result rows inside the reporting window, extended with values extracted
-- from the Info and Stats JSON columns.
-- NOTE(review): the `_n` suffix presumably keeps these names from clashing with the
-- launch-level columns of $launch_times when both are joined -- confirm.
$all_tests_raw = (
    SELECT
        tests_results.*,

        -- Fields taken from Info.
        JSON_VALUE(tests_results.Info, "$.report_url") AS Report,
        JSON_VALUE(tests_results.Info, "$.cluster.version") AS Version_n,
        JSON_VALUE(tests_results.Info, "$.ci_version") AS CiVersion_n,
        JSON_VALUE(tests_results.Info, "$.test_tools_version") AS TestToolsVersion_n,
        -- Same launch key as used when grouping launches: CI launch id, else the RunId.
        COALESCE(
            JSON_VALUE(tests_results.Info, "$.ci_launch_id"),
            CAST(tests_results.RunId AS String)
        ) AS LunchId_n,

        -- Fields taken from Stats.
        CAST(JSON_VALUE(tests_results.Stats, '$.DiffsCount') AS INT) AS diff_response,

        -- The metrics below are NULL unless Success > 0 (two-argument IF has no else branch).
        IF(
            tests_results.Success > 0,
            CAST(CAST(JSON_VALUE(tests_results.Stats, '$.CompilationAvg') AS Double) AS Uint64)
        ) AS CompilationAvg,
        IF(
            tests_results.Success > 0,
            CAST(CAST(JSON_VALUE(tests_results.Stats, '$.CompilationCPUTime') AS Double) AS Uint64)
        ) AS CompilationCPUTime,
        IF(
            tests_results.Success > 0,
            CAST(CAST(JSON_VALUE(tests_results.Stats, '$.ProcessCPUTime') AS Double) AS Uint64)
        ) AS ProcessCPUTime,
        IF(tests_results.Success > 0, tests_results.MeanDuration / 1000) AS YdbSumMeans,
        IF(tests_results.Success > 0, tests_results.MaxDuration / 1000) AS YdbSumMax,
        IF(tests_results.Success > 0, tests_results.MinDuration / 1000) AS YdbSumMin,

        CAST(tests_results.RunId / 1000UL AS Timestamp) AS RunTs,

        -- Status colour; the first matching error flag wins, in this priority order.
        CASE
            WHEN JSON_VALUE(tests_results.Stats, "$.errors.other") = "true" THEN "red"
            WHEN JSON_VALUE(tests_results.Stats, "$.errors.timeout") = "true" THEN "blue"
            WHEN JSON_VALUE(tests_results.Stats, "$.errors.warning") = "true" THEN "yellow"
            ELSE "green"
        END AS Color
    FROM `perfomance/olap/tests_results` AS tests_results
    WHERE tests_results.Timestamp >= $start_timestamp
);

-- Final data-mart projection.
-- The inner query combines a launch x test template ("null_template") with the actual
-- per-test results ("real_data"); this outer query adds suite-level window values and
-- display attributes derived from the Db name.
SELECT 
    Db,
    Suite, 
    Test,
    Run_start_timestamp,
    Run_number_in_version,
    MaxDuration,
    MeanDuration,
    MedianDuration,
    MinDuration,
    YdbSumMax,
    YdbSumMeans,
    YdbSumMin,
    CompilationAvg,
    CompilationCPUTime,
    ProcessCPUTime,
    Version,
    CiVersion,
    TestToolsVersion,
    Branch,
    CiBranch,
    TestToolsBranch,
    diff_response,
    Timestamp,
    -- A missing Success value is reported as 0.
    COALESCE(Success,0) AS Success,
    -- Suite-level values: the maximum over all rows sharing Db, launch start and Suite
    -- is copied onto every test row of that suite run.
    max(Kind) OVER (PARTITION  by Db, Run_start_timestamp, Suite) AS Kind,
    max(Report) OVER (PARTITION  by Db, Run_start_timestamp, Suite) AS Report,
    max(RunId) OVER (PARTITION  by Db, Run_start_timestamp, Suite) AS RunId,
    max(RunTs) OVER (PARTITION  by Db, Run_start_timestamp, Suite) AS RunTs,
    -- TRUE when the row carries no YdbSumMeans value.
    YdbSumMeans IS NULL AS errors,
    -- TRUE when no row of this suite run has a Report value.
    max(Report) OVER (PARTITION  by Db, Run_start_timestamp, Suite) IS NULL AS Suite_not_runned,
    Color,
    -- Location label, chosen by the first substring of Db that matches.
    CASE
        WHEN Db LIKE '%sas%' THEN 'sas'
        WHEN Db LIKE '%vla%' THEN 'vla'
        WHEN Db LIKE '%klg%' THEN 'klg'
        WHEN Db LIKE '%etn0vb1kg3p016q1tp3t%' THEN 'cloud'
        ELSE 'other'
    END AS DbDc,

    -- Storage type label, chosen by the first substring of Db that matches.
    CASE
        WHEN Db LIKE '%load%' THEN 'column'
        WHEN Db LIKE '%/s3%' THEN 's3'
        WHEN Db LIKE '%/row%' THEN 'row'
        ELSE 'other'
    END AS DbType,

    -- Human-readable alias: a cluster prefix followed by the same type suffix as DbType.
    -- Branch order matters: the specific patterns must precede the generic
    -- '%sas%' / '%vla%' / '%klg%' fallbacks near the end.
    CASE
        WHEN Db LIKE '%sas-daily%' THEN 'sas_small_'
        WHEN Db LIKE '%sas-perf%' THEN 'sas_big_'
        WHEN Db LIKE '%vla-acceptance%' THEN 'vla_small_'
        WHEN Db LIKE '%vla-perf%' THEN 'vla_big_'
        WHEN Db LIKE '%vla4-8154%' OR Db LIKE '%vla4-8158%' THEN 'vla_2_node_'
        WHEN Db LIKE '%vla4-8157%' THEN 'vla_1_node_'
        WHEN Db LIKE '%vla4-8163%' OR Db LIKE '%vla4-8171%' OR Db LIKE '%vla4-8174%' THEN 'vla_3_node_'
        WHEN Db LIKE '%etn0vb1kg3p016q1tp3t%b1ggceeul2pkher8vhb6/etn0vb1kg3p016q1tp3t%' THEN 'cloud_slonnn_128_'
        WHEN Db LIKE '%etntj9d0t8v7ud2hrqho%b1ggceeul2pkher8vhb6/etntj9d0t8v7ud2hrqho%' THEN 'cloud_slonnn_64_'
        WHEN Db LIKE '%static-node-1.ydb-cluster.com/Root/db%' THEN 'ansible_'
        WHEN Db LIKE '%ydb-vla-dev04-002%' THEN 'oltp-vla-perf1_'
        WHEN Db LIKE '%ydb-vla-dev04-005%' THEN 'oltp-vla-perf2_'
        WHEN Db LIKE '%ydb-qa-01-klg-010%' THEN 'oltp-klg-perf3_'
        WHEN Db LIKE '%ydb-qa-01-klg-014%' THEN 'oltp-klg-perf4_'
        WHEN Db LIKE '%ydb-qa-01-klg-018%' THEN 'oltp-klg-perf5_'
        WHEN Db LIKE '%ydb-qa-01-sas-000%' THEN 'oltp-3dc-perf6_'
        WHEN Db LIKE '%ydb-qa-01-klg-021%' THEN 'oltp-klg-perf7_'
        WHEN Db LIKE '%ydb-qa-01-klg-030%' THEN 'oltp-klg-perf9_'
        WHEN Db LIKE '%sas%' THEN 'sas_'
        WHEN Db LIKE '%vla%' THEN 'vla_'
        WHEN Db LIKE '%klg%' THEN 'klg_'
        ELSE 'new_db_'
    END || CASE
        WHEN Db LIKE '%load%' THEN 'column'
        WHEN Db LIKE '%/s3%' THEN 's3'
        WHEN Db LIKE '%/row%' THEN 'row'
        ELSE 'other'
    END AS DbAlias,
FROM (
    -- Merge of the two sides: the identifying columns (Db, Suite, Test,
    -- Run_start_timestamp, Run_number_in_version) are always taken from null_template;
    -- every other column prefers real_data and falls back to null_template.
    -- NOTE(review): a row present only on the real_data side of the FULL OUTER JOIN
    -- would therefore get NULL identifying columns -- confirm this cannot happen.
    SELECT
        null_template.Db AS Db,  --only from null_template
        COALESCE(real_data.Kind, null_template.Kind) AS Kind,
        COALESCE(real_data.MaxDuration, null_template.MaxDuration) AS MaxDuration,
        COALESCE(real_data.MeanDuration, null_template.MeanDuration) AS MeanDuration,
        COALESCE(real_data.MedianDuration, null_template.MedianDuration) AS MedianDuration,
        COALESCE(real_data.MinDuration, null_template.MinDuration) AS MinDuration,
        COALESCE(real_data.Report, null_template.Report) AS Report,
        COALESCE(real_data.Branch, null_template.Branch) AS Branch,
        COALESCE(real_data.CiBranch, null_template.CiBranch) AS CiBranch,
        COALESCE(real_data.TestToolsBranch, null_template.TestToolsBranch) AS TestToolsBranch,
        COALESCE(real_data.RunId, null_template.RunId) AS RunId,
        COALESCE(real_data.RunTs, null_template.RunTs) AS RunTs,
        null_template.Run_number_in_version AS Run_number_in_version,  --only from null_template
        null_template.Run_start_timestamp AS Run_start_timestamp,  --only from null_template
        COALESCE(real_data.Success, null_template.Success) AS Success,
        null_template.Suite AS Suite,  --only from null_template
        null_template.Test AS Test,  --only from null_template
        COALESCE(real_data.Timestamp, null_template.Timestamp) AS Timestamp,
        COALESCE(real_data.Version, null_template.Version) AS Version,
        COALESCE(real_data.CiVersion, null_template.CiVersion) AS CiVersion,
        COALESCE(real_data.TestToolsVersion, null_template.TestToolsVersion) AS TestToolsVersion,
        COALESCE(real_data.YdbSumMax, null_template.YdbSumMax) AS YdbSumMax,
        COALESCE(real_data.YdbSumMeans, null_template.YdbSumMeans) AS YdbSumMeans,
        COALESCE(real_data.CompilationAvg, null_template.CompilationAvg) AS CompilationAvg,
        COALESCE(real_data.CompilationCPUTime, null_template.CompilationCPUTime) AS CompilationCPUTime,
        COALESCE(real_data.ProcessCPUTime, null_template.ProcessCPUTime) AS ProcessCPUTime,
        COALESCE(real_data.YdbSumMin, null_template.YdbSumMin) AS YdbSumMin,
        COALESCE(real_data.diff_response, null_template.diff_response) AS diff_response,
        COALESCE(real_data.Color, null_template.Color) AS Color,
    FROM (
        -- null_template: every row of $launch_times (launch x Suite x Test), left-joined
        -- only with result rows whose `$.cluster.version` is NULL.
        -- NOTE(review): presumably this is meant to give each launch/test pair a row
        -- with (mostly) NULL result columns of the right shape -- confirm.
        SELECT 
            all_tests.*,
            launch_times.*
        FROM $launch_times AS launch_times
        LEFT JOIN (
            SELECT
                *
            FROM $all_tests_raw AS all_tests_raw
            WHERE JSON_VALUE(all_tests_raw.Info, "$.cluster.version") is NULL
        ) AS all_tests
        ON all_tests.Db = launch_times.Db
        AND all_tests.Suite = launch_times.Suite
        AND all_tests.Test = launch_times.Test
    -- WHERE (  all_tests.Version_n is NULL)
    ) AS null_template
    FULL OUTER JOIN (
        -- real_data: explicit projection of the launch/result join below, so that both
        -- sides of the FULL OUTER JOIN expose the same column names.
        SELECT
            real_data.Db AS Db,
            real_data.Kind AS Kind,
            real_data.MaxDuration AS MaxDuration,
            real_data.MeanDuration AS MeanDuration,
            real_data.MedianDuration AS MedianDuration,
            real_data.MinDuration AS MinDuration,
            real_data.Report AS Report,
            real_data.Branch AS Branch,
            real_data.CiBranch AS CiBranch,
            real_data.TestToolsBranch AS TestToolsBranch,
            real_data.RunId AS RunId,
            real_data.RunTs AS RunTs,
            real_data.Run_number_in_version AS Run_number_in_version,
            real_data.Run_start_timestamp AS Run_start_timestamp,
            --real_data.Stats AS Stats,
            real_data.Success AS Success,
            real_data.Suite AS Suite,
            real_data.Test AS Test,
            real_data.Timestamp AS Timestamp,
            real_data.Version AS Version,
            real_data.CiVersion AS CiVersion,
            real_data.TestToolsVersion AS TestToolsVersion,
            real_data.YdbSumMax AS YdbSumMax,
            real_data.YdbSumMeans AS YdbSumMeans,
            real_data.CompilationAvg AS CompilationAvg,
            real_data.CompilationCPUTime AS CompilationCPUTime,
            real_data.ProcessCPUTime AS ProcessCPUTime,
            real_data.YdbSumMin AS YdbSumMin,
            real_data.diff_response AS diff_response,
            real_data.Color AS Color,
        FROM (
            -- Launch rows matched to result rows of the same Db, Suite, Test and
            -- cluster version.
            SELECT 
                all_tests.*,
                launch_times.*,
            FROM $launch_times AS launch_times
            LEFT JOIN $all_tests_raw AS all_tests
            ON all_tests.Db = launch_times.Db
            AND all_tests.Suite = launch_times.Suite
            AND all_tests.Test = launch_times.Test
            AND all_tests.Version_n = launch_times.Version
            -- Keep a joined row only if the result belongs to this very launch, or if
            -- the launch row found no result at all. Because this filter runs after
            -- the LEFT JOIN, a launch row whose only matches belong to other launches
            -- of the same version is dropped here; null_template still carries it.
            WHERE (
                all_tests.LunchId_n == launch_times.LunchId
                OR all_tests.RunId IS NULL 
            )
        ) AS real_data
    ) AS real_data
    -- Both sides are matched on the launch/test identity.
    ON null_template.Db = real_data.Db
    AND null_template.Run_start_timestamp = real_data.Run_start_timestamp
    AND null_template.Suite = real_data.Suite
    AND null_template.Test = real_data.Test
)