aboutsummaryrefslogtreecommitdiffstats
path: root/library/cpp/string_utils/tskv_format/escape.cpp
blob: 3dc78bec8c0d2dbfcbf6f76cf397635909ca1004 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
#include <util/generic/yexception.h>
#include "escape.h"

namespace NTskvFormat {
    namespace {
        // Set of bytes that EscapeImpl searches for and replaces with a backslash sequence:
        // tab, LF, CR, backslash, NUL, '=' and '"'. The explicit length (7) is required
        // because the literal contains an embedded '\0'; without it the buffer would be
        // cut at the NUL and '=' / '"' would be dropped from the set.
        const TStringBuf ESCAPE_CHARS("\t\n\r\\\0=\"", 7);

        // Appends the escaped form of the `len` bytes starting at `src` to `dst`.
        //
        // Every byte listed in ESCAPE_CHARS is replaced by a two-character backslash
        // sequence (\t, \n, \r, \0, \\, \=, \"); all other bytes are copied unchanged.
        // Existing contents of `dst` are kept. Returns `dst`.
        TString& EscapeImpl(const char* src, size_t len, TString& dst) {
            const TStringBuf input(src, len);

            for (size_t pos = 0; pos < len;) {
                const size_t special = input.find_first_of(ESCAPE_CHARS, pos);

                if (special == TStringBuf::npos) {
                    // Nothing left to escape: copy the tail verbatim and finish.
                    dst.append(src + pos, len - pos);
                    return dst;
                }

                // Copy the clean run that precedes the special byte.
                dst.append(src + pos, special - pos);

                const char ch = src[special];
                if (ch == '\t') {
                    dst.append(TStringBuf("\\t"));
                } else if (ch == '\n') {
                    dst.append(TStringBuf("\\n"));
                } else if (ch == '\r') {
                    dst.append(TStringBuf("\\r"));
                } else if (ch == '\0') {
                    dst.append(TStringBuf("\\0"));
                } else if (ch == '\\') {
                    dst.append(TStringBuf("\\\\"));
                } else if (ch == '=') {
                    dst.append(TStringBuf("\\="));
                } else if (ch == '"') {
                    dst.append(TStringBuf("\\\""));
                }

                // Resume scanning right after the byte that was just escaped.
                pos = special + 1;
            }

            return dst;
        }

        // Decodes backslash sequences in the `len` bytes starting at `src` and appends
        // the result to `dst`. Existing contents of `dst` are kept. Returns `dst`.
        //
        // A backslash must be followed by one of: t, n, r, 0, \, = or ". Throws
        // yexception when a backslash is the last byte of the input or is followed by
        // any other byte. The bytes preceding the offending backslash have already been
        // appended to `dst` by the time the exception is thrown.
        TString& UnescapeImpl(const char* src, const size_t len, TString& dst) {
            const TStringBuf input(src, len);

            for (size_t pos = 0; pos < len;) {
                const size_t slash = input.find('\\', pos);

                if (slash == TStringBuf::npos) {
                    // No more escape sequences: copy the tail verbatim and finish.
                    dst.append(src + pos, len - pos);
                    return dst;
                }

                // Copy the literal run that precedes the backslash.
                dst.append(src + pos, slash - pos);

                const size_t codeAt = slash + 1;
                if (codeAt >= len) {
                    throw yexception() << "expected (t|n|r|0|\\|=|\"|) after \\. Got end of line.";
                }

                const char code = src[codeAt];
                char decoded = '\0';
                switch (code) {
                    case 't':
                        decoded = '\t';
                        break;
                    case 'n':
                        decoded = '\n';
                        break;
                    case 'r':
                        decoded = '\r';
                        break;
                    case '0':
                        decoded = '\0';
                        break;
                    case '\\':
                    case '=':
                    case '"':
                        // These three stand for themselves.
                        decoded = code;
                        break;
                    default:
                        throw yexception() << "unexpected symbol '" << code << "' after \\";
                }
                dst.append(decoded);

                // Skip both the backslash and its code character.
                pos = slash + 2;
            }

            return dst;
        }

    }

    // Appends the escaped representation of `src` to `dst` and returns `dst`.
    // Delegates to EscapeImpl with the raw pointer and size of `src`.
    TString& Escape(const TStringBuf& src, TString& dst) {
        const char* const bytes = src.data();
        const size_t length = src.size();
        return EscapeImpl(bytes, length, dst);
    }

    // Appends the unescaped representation of `src` to `dst` and returns `dst`.
    // Delegates to UnescapeImpl, which throws yexception on a malformed escape sequence.
    TString& Unescape(const TStringBuf& src, TString& dst) {
        const char* const bytes = src.data();
        const size_t length = src.size();
        return UnescapeImpl(bytes, length, dst);
    }

}