aboutsummaryrefslogtreecommitdiffstats
path: root/contrib/clickhouse/src/Functions/URL/path.h
blob: a0dd5eea2d3d636ef5de1589ed5842e87ad5d813 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#pragma once

#include <base/find_symbols.h>
#include <Functions/StringHelpers.h>


namespace DB
{

template <bool with_query_string>
struct ExtractPath
{
    static size_t getReserveLengthForElement() { return 25; }

    static void execute(Pos data, size_t size, Pos & res_data, size_t & res_size)
    {
        res_data = data;
        res_size = 0;

        Pos pos = data;
        Pos end = pos + size;

        /// We support URLs with and without schema:
        /// 1. http://host/path
        /// 2. host/path
        /// We search for first slash and if there is subsequent slash, then skip and repeat search for the next slash.

        pos = find_first_symbols<'/'>(pos, end);
        if (end == pos)
            return;

        /// Note that strings are zero-terminated.
        bool has_subsequent_slash = pos[1] == '/';
        if (has_subsequent_slash)
        {
            /// Search for next slash.
            pos = find_first_symbols<'/'>(pos + 2, end);
            if (end == pos)
                return;
        }

        res_data = pos;

        if constexpr (with_query_string)
        {
            res_size = end - res_data;
        }
        else
        {
            Pos query_string_or_fragment = find_first_symbols<'?', '#'>(pos, end);
            res_size = query_string_or_fragment - res_data;
        }
    }
};

}