1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387
|
/*--------------------------------------------------------------------*/
/*--- Demangling of decorated names. demangle.c ---*/
/*--------------------------------------------------------------------*/
/*
This file is part of Valgrind, a dynamic binary instrumentation
framework.
Copyright (C) 2000-2017 Julian Seward
jseward@acm.org
Rust demangler components are
Copyright (C) 2016-2016 David Tolnay
dtolnay@gmail.com
This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License as
published by the Free Software Foundation; either version 2 of the
License, or (at your option) any later version.
This program is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, see <http://www.gnu.org/licenses/>.
The GNU General Public License is contained in the file COPYING.
*/
#include "pub_core_basics.h"
#include "pub_core_demangle.h"
#include "pub_core_libcassert.h"
#include "pub_core_libcbase.h"
#include "pub_core_libcprint.h"
#include "pub_core_mallocfree.h"
#include "pub_core_options.h"
#include "vg_libciface.h"
#include "demangle.h"
/* Language selector consulted by VG_(demangle).  While this is True,
   every non-NULL symbol is considered for demangling (not only those
   with a "_Z"/"_R"/"_D" prefix) and is handed to the Ada demangler
   unless it is routed to the D demangler.  Initialised to False.
   NOTE(review): presumably set elsewhere once the client is known to be
   an Ada program -- confirm against the code that writes it. */
Bool VG_(lang_is_ada) = False;
/*------------------------------------------------------------*/
/*--- ---*/
/*------------------------------------------------------------*/
/* The demangler's job is to take a raw symbol name and turn it into
something a Human Bean can understand. There are two levels of
mangling.
1. First, C++ names are mangled by the compiler. So we'll have to
undo that.
2. Optionally, in relatively rare cases, the resulting name is then
itself encoded using Z-escaping (see pub_core_redir.h) so as to
become part of a redirect-specification.
Therefore, VG_(demangle) first tries to undo (2). If successful,
the soname part is discarded (humans don't want to see that).
Then, it tries to undo (1) (using demangling code from GNU/FSF).
Finally, it changes the name of all symbols which are known to be
functions below main() to "(below main)". This helps reduce
variability of stack traces, something which has been a problem for
the testsuite for a long time.
--------
If do_cxx_demangle == True, it does all the above stages:
- undo (2) [Z-encoding]
- undo (1) [C++ mangling]
- do the below-main hack
If do_cxx_demangle == False, the C++ and Rust stages are skipped:
- undo (2) [Z-encoding]
- do the below-main hack
*/
/* Note that the C++ demangler is from GNU libiberty and is almost
completely unmodified. We use vg_libciface.h as a way to
impedance-match the libiberty code into our own framework.
The libiberty code included here was taken from the GCC repository
and is released under the LGPL 2.1 license, which AFAICT is compatible
with "GPL 2 or later" and so is OK for inclusion in Valgrind.
To update to a newer libiberty, use the "update-demangler" script
which is included in the valgrind repository. */
/* This is the main, standard demangler entry point.

   Parameters:
     do_cxx_demangling  if True (and VG_(clo_demangle) is set as well),
                        try to undo the language-level mangling, stage (1).
     do_z_demangling    if True, first try to undo Z-encoding, stage (2),
                        keeping only the function name part.
     orig               the raw symbol name.  If it is NULL no demangling
                        is attempted and *RESULT is set to NULL.
     result             receives a pointer to the resulting name. */
/* Upon return, *RESULT will point to the demangled name, or to the name
   produced by the previous stage when a stage does not apply or fails.
   The memory buffer that holds the demangled name is allocated on the
   heap and will be deallocated in the next invocation. Conceptually,
   that buffer is owned by VG_(demangle). That means two things:
   (1) Users of VG_(demangle) must not free that buffer.
   (2) If the demangled name needs to be stashed away for later use,
       the contents of the buffer need to be copied. It is not sufficient
       to just store the pointer as it will point to deallocated memory
       after the next VG_(demangle) invocation. */
void VG_(demangle) ( Bool do_cxx_demangling, Bool do_z_demangling,
                     /* IN */  const HChar  *orig,
                     /* OUT */ const HChar **result )
{
   /* !!! vvv STATIC vvv !!! */
   static HChar* demangled = NULL;
   /* !!! ^^^ STATIC ^^^ !!! */

   Bool is_dlang       = False;
   Bool is_cxx_or_rust = False;

   /* Possibly undo (2) */
   /* Z-Demangling was requested.
      The fastest way to see if it's a Z-mangled name is just to attempt
      to Z-demangle it (with NULL for the soname buffer, since we're not
      interested in that).  A NULL name is skipped here, just as it is
      for stage (1) below, because VG_(maybe_Z_demangle) measures the
      length of its input unconditionally. */
   if (do_z_demangling && orig != NULL) {
      const HChar *z_demangled;

      if (VG_(maybe_Z_demangle)( orig, NULL, /*soname*/
                                 &z_demangled, NULL, NULL, NULL )) {
         orig = z_demangled;
      }
   }

   /* Possibly undo (1) */
   if (!do_cxx_demangling || !VG_(clo_demangle) || orig == NULL) {
      *result = orig;
      return;
   }

   // - C++ mangled symbols start with "_Z" (possibly with exceptions?)
   // - Rust "legacy" mangled symbols start with "_Z".
   // - Rust "v0" mangled symbols start with "_R".
   // - D programming language mangled symbols start with "_D".
   // XXX: the Java/Rust/Ada demangling here probably doesn't work. See
   // https://bugs.kde.org/show_bug.cgi?id=445235 for details.
   //
   // Only look at orig[1] once orig[0] is known to be '_'.  In Ada mode
   // we get here for arbitrary names, including the empty string (for
   // which orig[1] lies beyond the terminator) and names whose second
   // character merely happens to be 'D'.
   if (orig[0] == '_') {
      is_dlang       = orig[1] == 'D';
      is_cxx_or_rust = orig[1] == 'Z' || orig[1] == 'R';
   }

   if (!VG_(lang_is_ada) && !is_dlang && !is_cxx_or_rust) {
      /* Does not look mangled; hand back what we have. */
      *result = orig;
      return;
   }

   /* Free up previously demangled name */
   if (demangled) {
      VG_(arena_free) (VG_AR_DEMANGLE, demangled);
      demangled = NULL;
   }

   if (is_dlang) {
      demangled = dlang_demangle ( orig, DMGL_ANSI | DMGL_PARAMS );
   } else if (VG_(lang_is_ada)) {
      demangled = ada_demangle(orig, 0);
   } else {
      demangled = ML_(cplus_demangle) ( orig, DMGL_ANSI | DMGL_PARAMS );
   }

   /* Fall back to the (possibly Z-demangled) input if the demangler
      could not make sense of the name. */
   *result = (demangled == NULL) ? orig : demangled;

   // 13 Mar 2005: We used to check here that the demangler wasn't leaking
   // by calling the (now-removed) function VG_(is_empty_arena)(). But,
   // very rarely (ie. I've heard of it twice in 3 years), the demangler
   // does leak. But, we can't do much about it, and it's not a disaster,
   // so we just let it slide without aborting or telling the user.
}
/*------------------------------------------------------------*/
/*--- DEMANGLE Z-ENCODED NAMES ---*/
/*------------------------------------------------------------*/
/* Translate the character that follows a 'Z' escape marker into the
   literal character it stands for.  Yields 0 when 'code' is not one of
   the recognised escape letters (which includes the string terminator). */
static HChar z_escape_decode ( HChar code )
{
   switch (code) {
      case 'a': return '*';
      case 'c': return ':';
      case 'd': return '.';
      case 'h': return '-';
      case 'p': return '+';
      case 's': return ' ';
      case 'u': return '_';
      case 'A': return '@';
      case 'D': return '$';
      case 'L': return '(';
      case 'P': return '%';
      case 'R': return ')';
      case 'S': return '/';
      case 'Z': return 'Z';
      default:  return 0;
   }
}

/* Demangle a Z-encoded name as described in pub_tool_redir.h.
   Z-encoded names are used by Valgrind for doing function
   interception/wrapping.

   'sym' is split into its soname and fnname parts.  On return *fn (and
   *so, unless 'so' is NULL) point at buffers owned by this function;
   they are reused, and possibly reallocated, by the next call, so the
   caller must copy anything it wants to keep.  'fn' must not be NULL.
   'isWrap', 'eclassTag' and 'eclassPrio' are optional outputs and may
   each be NULL; they are filled in from the fixed-format prefix.

   Returns True if the name was demangled successfully and False
   otherwise.  Failure means that the prefix was not recognised or that
   the internal Z-escaping is wrong; in the latter case a user message
   is printed as well. */
Bool VG_(maybe_Z_demangle) ( const HChar* sym,
                             /*OUT*/const HChar** so,
                             /*OUT*/const HChar** fn,
                             /*OUT*/Bool* isWrap,
                             /*OUT*/Int* eclassTag,
                             /*OUT*/Int* eclassPrio )
{
   static HChar *sobuf;
   static HChar *fnbuf;
   static SizeT buf_len = 0;
   static const HChar banned_prefix[] = "VG_Z_";

   Bool  error = False;
   Bool  fn_is_encoded;
   Int   soi = 0;
   Int   fni = 0;
   Int   i, k;
   HChar decoded;

   /* Undoing Z-encoding never makes a name longer, so buffers that can
      hold the whole mangled name (plus terminator) can never overflow. */
   SizeT needed = VG_(strlen)(sym) + 1;
   if (buf_len < needed) {
      sobuf = VG_(arena_realloc)(VG_AR_DEMANGLE, "Z-demangle", sobuf, needed);
      fnbuf = VG_(arena_realloc)(VG_AR_DEMANGLE, "Z-demangle", fnbuf, needed);
      buf_len = needed;
   }

   /* Hand out (empty) results straight away, so the outputs are
      well-defined even when we bail out early. */
   sobuf[0] = '\0';
   fnbuf[0] = '\0';
   if (so)
      *so = sobuf;
   *fn = fnbuf;

#  define EMITSO(ch)                           \
      do {                                     \
         if (so) {                             \
            sobuf[soi++] = ch; sobuf[soi] = 0; \
         }                                     \
      } while (0)
#  define EMITFN(ch)                           \
      do {                                     \
         fnbuf[fni++] = ch; fnbuf[fni] = 0;    \
      } while (0)

   /* The fixed-format prefix is
         "_vg" {r|w} <4 digit eclass tag> <1 digit prio> "Z" {Z|U} "_"
      Check it strictly left to right so that we never look beyond the
      terminator of a short name. */
   if (sym[0] != '_' || sym[1] != 'v' || sym[2] != 'g')
      return False;
   if (sym[3] != 'r' && sym[3] != 'w')
      return False;
   for (k = 4; k <= 8; k++) {
      if (!VG_(isdigit)(sym[k]))
         return False;
   }
   if (sym[9] != 'Z')
      return False;
   if (sym[10] != 'Z' && sym[10] != 'U')
      return False;
   if (sym[11] != '_')
      return False;

   /* If the eclass tag is 0000 (meaning "no eclass"), the priority
      must be 0 too. */
   if (sym[4] == '0' && sym[5] == '0' && sym[6] == '0' && sym[7] == '0'
       && sym[8] != '0')
      return False;

   /* 'Z' means the function name is Z-encoded, 'U' that it is not. */
   fn_is_encoded = sym[10] == 'Z';

   if (isWrap)
      *isWrap = sym[3] == 'w';

   if (eclassTag) {
      Int tag = 0;
      for (k = 4; k <= 7; k++)
         tag = 10 * tag + ((Int)sym[k] - '0');
      *eclassTag = tag;
      vg_assert(*eclassTag >= 0 && *eclassTag <= 9999);
   }

   if (eclassPrio) {
      *eclassPrio = ((Int)sym[8]) - '0';
      vg_assert(*eclassPrio >= 0 && *eclassPrio <= 9);
   }

   /* Now check the soname prefix isn't "VG_Z_", as described in
      pub_tool_redir.h.  The comparison stops at the first mismatch, so
      it cannot run past the end of 'sym'. */
   k = 0;
   while (banned_prefix[k] != 0 && sym[12 + k] == banned_prefix[k])
      k++;
   if (banned_prefix[k] == 0) {
      vg_assert2(0, "symbol with a 'VG_Z_' prefix: %s.\n"
                    "see pub_tool_redir.h for an explanation.", sym);
   }

   /* Now scan the Z-encoded soname; it runs up to the next '_'. */
   i = 12;
   while (sym[i] != '_') {
      if (sym[i] == 0) {
         /* Ran out of input before finding the delimiter. */
         error = True;
         goto out;
      }
      if (sym[i] == 'Z') {
         /* We've got a Z-escape. */
         decoded = z_escape_decode(sym[i + 1]);
         if (decoded == 0) {
            error = True;
            goto out;
         }
         EMITSO(decoded);
         i += 2;
      } else {
         EMITSO(sym[i]);
         i++;
      }
   }

   /* Found the delimiter.  Step over it. */
   vg_assert(sym[i] == '_');
   i++;

   /* Now deal with the function name part, which extends to the end of
      the string.  It is copied verbatim unless it is Z-encoded, in which
      case escapes are decoded like for the soname. */
   while (sym[i] != 0) {
      if (fn_is_encoded && sym[i] == 'Z') {
         /* We've got a Z-escape. */
         decoded = z_escape_decode(sym[i + 1]);
         if (decoded == 0) {
            error = True;
            goto out;
         }
         EMITFN(decoded);
         i += 2;
      } else {
         EMITFN(sym[i]);
         i++;
      }
   }

  out:
   EMITSO(0);
   EMITFN(0);

   if (!error)
      return True;

   /* Something's wrong.  Give up. */
   VG_(message)(Vg_UserMsg,
                "m_demangle: error Z-demangling: %s\n", sym);
   return False;
}
/*--------------------------------------------------------------------*/
/*--- end ---*/
/*--------------------------------------------------------------------*/
|