2012-11-12 16:53:47 +01:00
|
|
|
//===-- sanitizer_symbolizer.h ----------------------------------*- C++ -*-===//
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
2013-12-05 10:18:38 +01:00
|
|
|
// Symbolizer is used by sanitizers to map an instruction address to a location
// in source code at run-time. Symbolizer either uses the
// __sanitizer_symbolize_* functions defined in the program, or (if they are
// missing) tries to find and launch the "llvm-symbolizer" command-line tool in
// a separate process and communicate with it.
|
2012-11-12 16:53:47 +01:00
|
|
|
//
|
2013-12-05 10:18:38 +01:00
|
|
|
// Generally we should try to avoid calling system library functions during
|
|
|
|
// symbolization (and use their replacements from sanitizer_libc.h instead).
|
2012-11-12 16:53:47 +01:00
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef SANITIZER_SYMBOLIZER_H
|
|
|
|
#define SANITIZER_SYMBOLIZER_H
|
|
|
|
|
2015-10-21 09:32:45 +02:00
|
|
|
#include "sanitizer_common.h"
|
|
|
|
#include "sanitizer_mutex.h"
|
2012-11-12 16:53:47 +01:00
|
|
|
|
|
|
|
namespace __sanitizer {
|
|
|
|
|
|
|
|
struct AddressInfo {
|
2015-10-21 09:32:45 +02:00
|
|
|
// Owns all the string members. Storage for them is
|
|
|
|
// (de)allocated using sanitizer internal allocator.
|
2012-11-12 16:53:47 +01:00
|
|
|
uptr address;
|
2014-05-22 09:09:21 +02:00
|
|
|
|
2012-11-12 16:53:47 +01:00
|
|
|
char *module;
|
|
|
|
uptr module_offset;
|
2014-05-22 09:09:21 +02:00
|
|
|
|
|
|
|
static const uptr kUnknown = ~(uptr)0;
|
2012-11-12 16:53:47 +01:00
|
|
|
char *function;
|
2014-05-22 09:09:21 +02:00
|
|
|
uptr function_offset;
|
|
|
|
|
2012-11-12 16:53:47 +01:00
|
|
|
char *file;
|
|
|
|
int line;
|
|
|
|
int column;
|
|
|
|
|
2015-10-21 09:32:45 +02:00
|
|
|
AddressInfo();
|
2014-05-22 09:09:21 +02:00
|
|
|
// Deletes all strings and resets all fields.
|
2015-10-21 09:32:45 +02:00
|
|
|
void Clear();
|
|
|
|
void FillModuleInfo(const char *mod_name, uptr mod_offset);
|
|
|
|
};
|
2012-11-12 16:53:47 +01:00
|
|
|
|
2015-10-21 09:32:45 +02:00
|
|
|
// Linked list of symbolized frames (each frame is described by AddressInfo).
|
|
|
|
struct SymbolizedStack {
|
|
|
|
SymbolizedStack *next;
|
|
|
|
AddressInfo info;
|
|
|
|
static SymbolizedStack *New(uptr addr);
|
|
|
|
// Deletes current, and all subsequent frames in the linked list.
|
|
|
|
// The object cannot be accessed after the call to this function.
|
|
|
|
void ClearAll();
|
|
|
|
|
|
|
|
private:
|
|
|
|
SymbolizedStack();
|
2012-11-12 16:53:47 +01:00
|
|
|
};
|
|
|
|
|
2014-11-13 21:41:38 +01:00
|
|
|
// For now, DataInfo is used to describe a global variable.
|
2013-01-23 12:41:33 +01:00
|
|
|
struct DataInfo {
|
2015-10-21 09:32:45 +02:00
|
|
|
// Owns all the string members. Storage for them is
|
|
|
|
// (de)allocated using sanitizer internal allocator.
|
2013-01-23 12:41:33 +01:00
|
|
|
char *module;
|
|
|
|
uptr module_offset;
|
|
|
|
char *name;
|
|
|
|
uptr start;
|
|
|
|
uptr size;
|
2014-11-13 21:41:38 +01:00
|
|
|
|
2015-10-21 09:32:45 +02:00
|
|
|
DataInfo();
|
|
|
|
void Clear();
|
2013-01-23 12:41:33 +01:00
|
|
|
};
|
|
|
|
|
2015-10-21 09:32:45 +02:00
|
|
|
class SymbolizerTool;
|
|
|
|
|
|
|
|
class Symbolizer final {
|
2012-11-12 16:53:47 +01:00
|
|
|
public:
|
2014-09-23 19:59:53 +02:00
|
|
|
/// Initialize and return platform-specific implementation of symbolizer
|
|
|
|
/// (if it wasn't already initialized).
|
2013-12-05 10:18:38 +01:00
|
|
|
static Symbolizer *GetOrInit();
|
2015-10-21 09:32:45 +02:00
|
|
|
// Returns a list of symbolized frames for a given address (containing
|
|
|
|
// all inlined functions, if necessary).
|
|
|
|
SymbolizedStack *SymbolizePC(uptr address);
|
|
|
|
bool SymbolizeData(uptr address, DataInfo *info);
|
|
|
|
|
|
|
|
// The module names Symbolizer returns are stable and unique for every given
|
|
|
|
// module. It is safe to store and compare them as pointers.
|
|
|
|
bool GetModuleNameAndOffsetForPC(uptr pc, const char **module_name,
|
|
|
|
uptr *module_address);
|
|
|
|
const char *GetModuleNameForPc(uptr pc) {
|
|
|
|
const char *module_name = nullptr;
|
|
|
|
uptr unused;
|
|
|
|
if (GetModuleNameAndOffsetForPC(pc, &module_name, &unused))
|
|
|
|
return module_name;
|
|
|
|
return nullptr;
|
2013-12-05 10:18:38 +01:00
|
|
|
}
|
2015-10-21 09:32:45 +02:00
|
|
|
|
2013-11-04 22:33:31 +01:00
|
|
|
// Release internal caches (if any).
|
2015-10-21 09:32:45 +02:00
|
|
|
void Flush();
|
2013-11-04 22:33:31 +01:00
|
|
|
// Attempts to demangle the provided C++ mangled name.
|
2015-10-21 09:32:45 +02:00
|
|
|
const char *Demangle(const char *name);
|
|
|
|
void PrepareForSandboxing();
|
2012-11-12 16:53:47 +01:00
|
|
|
|
2013-12-05 10:18:38 +01:00
|
|
|
// Allow user to install hooks that would be called before/after Symbolizer
|
|
|
|
// does the actual file/line info fetching. Specific sanitizers may need this
|
|
|
|
// to distinguish system library calls made in user code from calls made
|
|
|
|
// during in-process symbolization.
|
|
|
|
typedef void (*StartSymbolizationHook)();
|
|
|
|
typedef void (*EndSymbolizationHook)();
|
|
|
|
// May be called at most once.
|
|
|
|
void AddHooks(StartSymbolizationHook start_hook,
|
|
|
|
EndSymbolizationHook end_hook);
|
|
|
|
|
|
|
|
private:
|
2015-10-21 09:32:45 +02:00
|
|
|
// GetModuleNameAndOffsetForPC has to return a string to the caller.
|
|
|
|
// Since the corresponding module might get unloaded later, we should create
|
|
|
|
// our owned copies of the strings that we can safely return.
|
|
|
|
// ModuleNameOwner does not provide any synchronization, thus calls to
|
|
|
|
// its method should be protected by |mu_|.
|
|
|
|
class ModuleNameOwner {
|
|
|
|
public:
|
|
|
|
explicit ModuleNameOwner(BlockingMutex *synchronized_by)
|
|
|
|
: storage_(kInitialCapacity), last_match_(nullptr),
|
|
|
|
mu_(synchronized_by) {}
|
|
|
|
const char *GetOwnedCopy(const char *str);
|
|
|
|
|
|
|
|
private:
|
|
|
|
static const uptr kInitialCapacity = 1000;
|
|
|
|
InternalMmapVector<const char*> storage_;
|
|
|
|
const char *last_match_;
|
|
|
|
|
|
|
|
BlockingMutex *mu_;
|
|
|
|
} module_names_;
|
|
|
|
|
2013-12-05 10:18:38 +01:00
|
|
|
/// Platform-specific function for creating a Symbolizer object.
|
2014-09-23 19:59:53 +02:00
|
|
|
static Symbolizer *PlatformInit();
|
2015-10-21 09:32:45 +02:00
|
|
|
|
|
|
|
bool FindModuleNameAndOffsetForAddress(uptr address, const char **module_name,
|
|
|
|
uptr *module_offset);
|
|
|
|
LoadedModule *FindModuleForAddress(uptr address);
|
|
|
|
LoadedModule modules_[kMaxNumberOfModules];
|
|
|
|
uptr n_modules_;
|
|
|
|
// If stale, need to reload the modules before looking up addresses.
|
|
|
|
bool modules_fresh_;
|
|
|
|
|
|
|
|
// Platform-specific default demangler, must not return nullptr.
|
|
|
|
const char *PlatformDemangle(const char *name);
|
|
|
|
void PlatformPrepareForSandboxing();
|
2013-12-05 10:18:38 +01:00
|
|
|
|
|
|
|
static Symbolizer *symbolizer_;
|
|
|
|
static StaticSpinMutex init_mu_;
|
|
|
|
|
2015-10-21 09:32:45 +02:00
|
|
|
// Mutex locked from public methods of |Symbolizer|, so that the internals
|
|
|
|
// (including individual symbolizer tools and platform-specific methods) are
|
|
|
|
// always synchronized.
|
|
|
|
BlockingMutex mu_;
|
|
|
|
|
|
|
|
typedef IntrusiveList<SymbolizerTool>::Iterator Iterator;
|
|
|
|
IntrusiveList<SymbolizerTool> tools_;
|
|
|
|
|
|
|
|
explicit Symbolizer(IntrusiveList<SymbolizerTool> tools);
|
2013-12-05 10:18:38 +01:00
|
|
|
|
|
|
|
static LowLevelAllocator symbolizer_allocator_;
|
|
|
|
|
|
|
|
StartSymbolizationHook start_hook_;
|
|
|
|
EndSymbolizationHook end_hook_;
|
|
|
|
class SymbolizerScope {
|
|
|
|
public:
|
|
|
|
explicit SymbolizerScope(const Symbolizer *sym);
|
|
|
|
~SymbolizerScope();
|
|
|
|
private:
|
|
|
|
const Symbolizer *sym_;
|
|
|
|
};
|
|
|
|
};
|
2012-11-12 16:53:47 +01:00
|
|
|
|
|
|
|
} // namespace __sanitizer
|
|
|
|
|
|
|
|
#endif // SANITIZER_SYMBOLIZER_H
|