1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
|
#include "StackTrace.h"
#include <base/FnTraits.h>
#include <base/constexpr_helpers.h>
#include <base/demangle.h>
#include <Common/Dwarf.h>
#include <Common/Elf.h>
#include <Common/MemorySanitizer.h>
#include <Common/SymbolIndex.h>
#include <IO/WriteBufferFromString.h>
#include <IO/WriteHelpers.h>
#include <IO/Operators.h>
#include <atomic>
#include <filesystem>
#include <map>
#include <mutex>
#include <sstream>
#include <unordered_map>
#include <fmt/format.h>
#include <libunwind.h>
#include "clickhouse_config.h"
/// Convenient helper (added for jemalloc)
int unw_backtrace(void **buffer, int size) {
unw_context_t context;
unw_cursor_t cursor;
if (unw_getcontext(&context) || unw_init_local(&cursor, &context)) {
return 0;
}
unw_word_t ip;
int current = 0;
while (unw_step(&cursor) > 0) {
if (current >= size || unw_get_reg(&cursor, UNW_REG_IP, &ip)) {
break;
}
buffer[current++] = reinterpret_cast<void *>(static_cast<uintptr_t>(ip));
}
return current;
}
namespace
{
/// Currently this variable is set up once on server startup.
/// But we use atomic just in case, so it is possible to be modified at runtime.
std::atomic<bool> show_addresses = true;
bool shouldShowAddress(const void * addr)
{
/// If the address is less than 4096, most likely it is a nullptr dereference with offset,
/// and showing this offset is secure nevertheless.
/// NOTE: 4096 is the page size on x86 and it can be different on other systems,
/// but for the purpose of this branch, it does not matter.
if (reinterpret_cast<uintptr_t>(addr) < 4096)
return true;
return show_addresses.load(std::memory_order_relaxed);
}
}
void StackTrace::setShowAddresses(bool show)
{
show_addresses.store(show, std::memory_order_relaxed);
}
std::string SigsegvErrorString(const siginfo_t & info, [[maybe_unused]] const ucontext_t & context)
{
using namespace std::string_literals;
std::string address
= info.si_addr == nullptr ? "NULL pointer"s : (shouldShowAddress(info.si_addr) ? fmt::format("{}", info.si_addr) : ""s);
const std::string_view access =
#if defined(__x86_64__) && !defined(OS_FREEBSD) && !defined(OS_DARWIN) && !defined(__arm__) && !defined(__powerpc__)
(context.uc_mcontext.gregs[REG_ERR] & 0x02) ? "write" : "read";
#else
"";
#endif
std::string_view message;
switch (info.si_code)
{
case SEGV_ACCERR:
message = "Attempted access has violated the permissions assigned to the memory area";
break;
case SEGV_MAPERR:
message = "Address not mapped to object";
break;
default:
message = "Unknown si_code";
break;
}
return fmt::format("Address: {}. Access: {}. {}.", std::move(address), access, message);
}
constexpr std::string_view SigbusErrorString(int si_code)
{
switch (si_code)
{
case BUS_ADRALN:
return "Invalid address alignment.";
case BUS_ADRERR:
return "Non-existent physical address.";
case BUS_OBJERR:
return "Object specific hardware error.";
// Linux specific
#if defined(BUS_MCEERR_AR)
case BUS_MCEERR_AR:
return "Hardware memory error: action required.";
#endif
#if defined(BUS_MCEERR_AO)
case BUS_MCEERR_AO:
return "Hardware memory error: action optional.";
#endif
default:
return "Unknown si_code.";
}
}
constexpr std::string_view SigfpeErrorString(int si_code)
{
switch (si_code)
{
case FPE_INTDIV:
return "Integer divide by zero.";
case FPE_INTOVF:
return "Integer overflow.";
case FPE_FLTDIV:
return "Floating point divide by zero.";
case FPE_FLTOVF:
return "Floating point overflow.";
case FPE_FLTUND:
return "Floating point underflow.";
case FPE_FLTRES:
return "Floating point inexact result.";
case FPE_FLTINV:
return "Floating point invalid operation.";
case FPE_FLTSUB:
return "Subscript out of range.";
default:
return "Unknown si_code.";
}
}
constexpr std::string_view SigillErrorString(int si_code)
{
switch (si_code)
{
case ILL_ILLOPC:
return "Illegal opcode.";
case ILL_ILLOPN:
return "Illegal operand.";
case ILL_ILLADR:
return "Illegal addressing mode.";
case ILL_ILLTRP:
return "Illegal trap.";
case ILL_PRVOPC:
return "Privileged opcode.";
case ILL_PRVREG:
return "Privileged register.";
case ILL_COPROC:
return "Coprocessor error.";
case ILL_BADSTK:
return "Internal stack error.";
default:
return "Unknown si_code.";
}
}
std::string signalToErrorMessage(int sig, const siginfo_t & info, [[maybe_unused]] const ucontext_t & context)
{
switch (sig)
{
case SIGSEGV:
return SigsegvErrorString(info, context);
case SIGBUS:
return std::string{SigbusErrorString(info.si_code)};
case SIGILL:
return std::string{SigillErrorString(info.si_code)};
case SIGFPE:
return std::string{SigfpeErrorString(info.si_code)};
case SIGTSTP:
return "This is a signal used for debugging purposes by the user.";
default:
return "";
}
}
static void * getCallerAddress(const ucontext_t & context)
{
#if defined(__x86_64__)
/// Get the address at the time the signal was raised from the RIP (x86-64)
# if defined(OS_FREEBSD)
return reinterpret_cast<void *>(context.uc_mcontext.mc_rip);
# elif defined(OS_DARWIN)
return reinterpret_cast<void *>(context.uc_mcontext->__ss.__rip);
# else
return reinterpret_cast<void *>(context.uc_mcontext.gregs[REG_RIP]);
# endif
#elif defined(OS_DARWIN) && defined(__aarch64__)
return reinterpret_cast<void *>(context.uc_mcontext->__ss.__pc);
#elif defined(OS_FREEBSD) && defined(__aarch64__)
return reinterpret_cast<void *>(context.uc_mcontext.mc_gpregs.gp_elr);
#elif defined(__aarch64__)
return reinterpret_cast<void *>(context.uc_mcontext.pc);
#elif defined(__powerpc64__) && defined(__linux__)
return reinterpret_cast<void *>(context.uc_mcontext.gp_regs[PT_NIP]);
#elif defined(__powerpc64__) && defined(__FreeBSD__)
return reinterpret_cast<void *>(context.uc_mcontext.mc_srr0);
#elif defined(__riscv)
return reinterpret_cast<void *>(context.uc_mcontext.__gregs[REG_PC]);
#elif defined(__s390x__)
return reinterpret_cast<void *>(context.uc_mcontext.psw.addr);
#else
return nullptr;
#endif
}
// FIXME: looks like this is used only for Sentry but duplicates the whole algo, maybe replace?
void StackTrace::symbolize(
const StackTrace::FramePointers & frame_pointers, [[maybe_unused]] size_t offset, size_t size, StackTrace::Frames & frames)
{
#if defined(__ELF__) && !defined(OS_FREEBSD)
const DB::SymbolIndex & symbol_index = DB::SymbolIndex::instance();
std::unordered_map<std::string, DB::Dwarf> dwarfs;
for (size_t i = 0; i < offset; ++i)
frames[i].virtual_addr = frame_pointers[i];
for (size_t i = offset; i < size; ++i)
{
StackTrace::Frame & current_frame = frames[i];
current_frame.virtual_addr = frame_pointers[i];
const auto * object = symbol_index.findObject(current_frame.virtual_addr);
uintptr_t virtual_offset = object ? uintptr_t(object->address_begin) : 0;
current_frame.physical_addr = reinterpret_cast<void *>(uintptr_t(current_frame.virtual_addr) - virtual_offset);
if (object)
{
current_frame.object = object->name;
if (std::error_code ec; std::filesystem::exists(current_frame.object.value(), ec) && !ec)
{
auto dwarf_it = dwarfs.try_emplace(object->name, object->elf).first;
DB::Dwarf::LocationInfo location;
std::vector<DB::Dwarf::SymbolizedFrame> inline_frames;
if (dwarf_it->second.findAddress(
uintptr_t(current_frame.physical_addr), location, DB::Dwarf::LocationInfoMode::FAST, inline_frames))
{
current_frame.file = location.file.toString();
current_frame.line = location.line;
}
}
}
else
current_frame.object = "?";
if (const auto * symbol = symbol_index.findSymbol(current_frame.virtual_addr))
current_frame.symbol = demangle(symbol->name);
else
current_frame.symbol = "?";
}
#else
for (size_t i = 0; i < size; ++i)
frames[i].virtual_addr = frame_pointers[i];
#endif
}
StackTrace::StackTrace(const ucontext_t & signal_context)
{
tryCapture();
/// This variable from signal handler is not instrumented by Memory Sanitizer.
__msan_unpoison(&signal_context, sizeof(signal_context));
void * caller_address = getCallerAddress(signal_context);
if (size == 0 && caller_address)
{
frame_pointers[0] = caller_address;
size = 1;
}
else
{
/// Skip excessive stack frames that we have created while finding stack trace.
for (size_t i = 0; i < size; ++i)
{
if (frame_pointers[i] == caller_address)
{
offset = i;
break;
}
}
}
}
void StackTrace::tryCapture()
{
size = unw_backtrace(frame_pointers.data(), capacity);
__msan_unpoison(frame_pointers.data(), size * sizeof(frame_pointers[0]));
}
/// ClickHouse uses bundled libc++ so type names will be the same on every system thus it's safe to hardcode them
constexpr std::pair<std::string_view, std::string_view> replacements[]
= {{"::__1", ""}, {"std::basic_string<char, std::char_traits<char>, std::allocator<char>>", "String"}};
String collapseNames(String && haystack)
{
// TODO: surely there is a written version already for better in place search&replace
for (auto [needle, to] : replacements)
{
size_t pos = 0;
while ((pos = haystack.find(needle, pos)) != std::string::npos)
{
haystack.replace(pos, needle.length(), to);
pos += to.length();
}
}
return haystack;
}
struct StackTraceRefTriple
{
const StackTrace::FramePointers & pointers;
size_t offset;
size_t size;
};
struct StackTraceTriple
{
StackTrace::FramePointers pointers;
size_t offset;
size_t size;
};
template <class T>
concept MaybeRef = std::is_same_v<T, StackTraceTriple> || std::is_same_v<T, StackTraceRefTriple>;
constexpr bool operator<(const MaybeRef auto & left, const MaybeRef auto & right)
{
return std::tuple{left.pointers, left.size, left.offset} < std::tuple{right.pointers, right.size, right.offset};
}
static void
toStringEveryLineImpl([[maybe_unused]] bool fatal, const StackTraceRefTriple & stack_trace, Fn<void(std::string_view)> auto && callback)
{
if (stack_trace.size == 0)
return callback("<Empty trace>");
#if defined(__ELF__) && !defined(OS_FREEBSD)
using enum DB::Dwarf::LocationInfoMode;
const auto mode = fatal ? FULL_WITH_INLINE : FAST;
const DB::SymbolIndex & symbol_index = DB::SymbolIndex::instance();
std::unordered_map<String, DB::Dwarf> dwarfs;
for (size_t i = stack_trace.offset; i < stack_trace.size; ++i)
{
std::vector<DB::Dwarf::SymbolizedFrame> inline_frames;
const void * virtual_addr = stack_trace.pointers[i];
const auto * object = symbol_index.findObject(virtual_addr);
uintptr_t virtual_offset = object ? uintptr_t(object->address_begin) : 0;
const void * physical_addr = reinterpret_cast<const void *>(uintptr_t(virtual_addr) - virtual_offset);
DB::WriteBufferFromOwnString out;
out << i << ". ";
if (std::error_code ec; object && std::filesystem::exists(object->name, ec) && !ec)
{
auto dwarf_it = dwarfs.try_emplace(object->name, object->elf).first;
DB::Dwarf::LocationInfo location;
if (dwarf_it->second.findAddress(uintptr_t(physical_addr), location, mode, inline_frames))
out << location.file.toString() << ":" << location.line << ": ";
}
if (const auto * const symbol = symbol_index.findSymbol(virtual_addr))
out << collapseNames(demangle(symbol->name));
else
out << "?";
if (shouldShowAddress(physical_addr))
{
out << " @ ";
DB::writePointerHex(physical_addr, out);
}
out << " in " << (object ? object->name : "?");
for (size_t j = 0; j < inline_frames.size(); ++j)
{
const auto & frame = inline_frames[j];
callback(fmt::format(
"{}.{}. inlined from {}:{}: {}",
i,
j + 1,
frame.location.file.toString(),
frame.location.line,
collapseNames(demangle(frame.name))));
}
callback(out.str());
}
#else
for (size_t i = stack_trace.offset; i < stack_trace.size; ++i)
if (const void * const addr = stack_trace.pointers[i]; shouldShowAddress(addr))
callback(fmt::format("{}. {}", i, addr));
#endif
}
void StackTrace::toStringEveryLine(std::function<void(std::string_view)> callback) const
{
toStringEveryLineImpl(true, {frame_pointers, offset, size}, std::move(callback));
}
void StackTrace::toStringEveryLine(const FramePointers & frame_pointers, std::function<void(std::string_view)> callback)
{
toStringEveryLineImpl(true, {frame_pointers, 0, static_cast<size_t>(std::find(frame_pointers.begin(), frame_pointers.end(), nullptr) - frame_pointers.begin())}, std::move(callback));
}
void StackTrace::toStringEveryLine(void ** frame_pointers_raw, size_t offset, size_t size, std::function<void(std::string_view)> callback)
{
__msan_unpoison(frame_pointers_raw, size * sizeof(*frame_pointers_raw));
StackTrace::FramePointers frame_pointers{};
std::copy_n(frame_pointers_raw, size, frame_pointers.begin());
toStringEveryLineImpl(true, {frame_pointers, offset, size}, std::move(callback));
}
using StackTraceCache = std::map<StackTraceTriple, String, std::less<>>;
static StackTraceCache & cacheInstance()
{
static StackTraceCache cache;
return cache;
}
static std::mutex stacktrace_cache_mutex;
String toStringCached(const StackTrace::FramePointers & pointers, size_t offset, size_t size)
{
/// Calculation of stack trace text is extremely slow.
/// We use simple cache because otherwise the server could be overloaded by trash queries.
/// Note that this cache can grow unconditionally, but practically it should be small.
std::lock_guard lock{stacktrace_cache_mutex};
StackTraceCache & cache = cacheInstance();
const StackTraceRefTriple key{pointers, offset, size};
if (auto it = cache.find(key); it != cache.end())
return it->second;
else
{
DB::WriteBufferFromOwnString out;
toStringEveryLineImpl(false, key, [&](std::string_view str) { out << str << '\n'; });
return cache.emplace(StackTraceTriple{pointers, offset, size}, out.str()).first->second;
}
}
std::string StackTrace::toString() const
{
return toStringCached(frame_pointers, offset, size);
}
std::string StackTrace::toString(void ** frame_pointers_raw, size_t offset, size_t size)
{
__msan_unpoison(frame_pointers_raw, size * sizeof(*frame_pointers_raw));
StackTrace::FramePointers frame_pointers{};
std::copy_n(frame_pointers_raw, size, frame_pointers.begin());
return toStringCached(frame_pointers, offset, size);
}
void StackTrace::dropCache()
{
std::lock_guard lock{stacktrace_cache_mutex};
cacheInstance().clear();
}
|