aboutsummaryrefslogtreecommitdiffstats
path: root/library/cpp/clickhouse/client/base/compressed.cpp
blob: b883d534ee0bac6868ad8527b6594d65a944f4f9 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
#include "compressed.h"
#include "wire_format.h"

#include <util/generic/yexception.h>

#include <contrib/libs/lz4/lz4.h>
#include <contrib/restricted/cityhash-1.0.2/city.h>

// Largest compressed-block size (as declared in the block header) that
// TCompressedInput::Decompress accepts; larger values are rejected with an exception.
#define DBMS_MAX_COMPRESSED_SIZE 0x40000000ULL // 1GB

namespace NClickHouse {
    // Wraps `input`: compressed blocks are later pulled from it by Decompress().
    // Only the pointer is stored here; nothing is read at construction time.
    TCompressedInput::TCompressedInput(TCodedInputStream* input)
        : Input_(input)
    {}

    // Destroying the stream while decompressed bytes are still pending in Mem_
    // is treated as a fatal error: the process is aborted.
    TCompressedInput::~TCompressedInput() {
        if (Mem_.Exhausted()) {
            return;
        }

        Y_ABORT("some data was not read");
    }

    // Hands out the next chunk of decompressed data via `ptr`, at most `len` bytes.
    // When the current decompressed block has been fully consumed, the next block
    // is decompressed first; if that fails to read a block, 0 is returned.
    size_t TCompressedInput::DoNext(const void** ptr, size_t len) {
        const bool needNextBlock = Mem_.Exhausted();

        if (needNextBlock && !Decompress()) {
            return 0;
        }

        return Mem_.Next(ptr, len);
    }

    bool TCompressedInput::Decompress() {
        CityHash_v1_0_2::uint128 hash;
        ui32 compressed = 0;
        ui32 original = 0;
        ui8 method = 0;

        if (!TWireFormat::ReadFixed(Input_, &hash)) {
            return false;
        }
        if (!TWireFormat::ReadFixed(Input_, &method)) {
            return false;
        }

        if (method != 0x82) {
            ythrow yexception() << "unsupported compression method "
                                << int(method);
        } else {
            if (!TWireFormat::ReadFixed(Input_, &compressed)) {
                return false;
            }
            if (!TWireFormat::ReadFixed(Input_, &original)) {
                return false;
            }

            if (compressed > DBMS_MAX_COMPRESSED_SIZE) {
                ythrow yexception() << "compressed data too big";
            }

            TTempBuf tmp(compressed);

            // Заполнить заголовок сжатых данных.
            tmp.Append(&method, sizeof(method));
            tmp.Append(&compressed, sizeof(compressed));
            tmp.Append(&original, sizeof(original));

            if (!TWireFormat::ReadBytes(Input_, tmp.Data() + 9, compressed - 9)) {
                return false;
            } else {
                if (hash != CityHash_v1_0_2::CityHash128(tmp.Data(), compressed)) {
                    ythrow yexception() << "data was corrupted";
                }
            }

            Data_ = TTempBuf(original);

            if (LZ4_decompress_fast(tmp.Data() + 9, Data_.Data(), original) < 0) {
                ythrow yexception() << "can't decompress data";
            } else {
                Mem_.Reset(Data_.Data(), original);
            }
        }

        return true;
    }

}