|
|
4f2909 |
commit f4abcc05fdba3f25890a9b30b71d511ccc906d46
|
|
|
4f2909 |
Author: Mark Wielaard <mark@klomp.org>
|
|
|
4f2909 |
Date: Mon Jul 27 22:43:28 2020 +0200
|
|
|
4f2909 |
|
|
|
4f2909 |
Incorrect call-graph tracking due to new _dl_runtime_resolve_xsave*
|
|
|
4f2909 |
|
|
|
4f2909 |
Newer glibc have alternate ld.so _dl_runtime_resolve functions.
|
|
|
4f2909 |
Namely _dl_runtime_resolve_xsave and _dl_runtime_resolve_xsave'2
|
|
|
4f2909 |
|
|
|
4f2909 |
This patch recognizes the xsave, xsavec and fxsave variants and
|
|
|
4f2909 |
changes callgrind so that any variant counts as _dl_runtime_resolve.
|
|
|
4f2909 |
|
|
|
4f2909 |
Original patch by paulo.cesar.pereira.de.andrade@gmail.com
|
|
|
4f2909 |
https://bugs.kde.org/show_bug.cgi?id=415293
|
|
|
4f2909 |
|
|
|
4f2909 |
diff --git a/callgrind/fn.c b/callgrind/fn.c
|
|
|
4f2909 |
index e9d8dd214..7cce1a0c7 100644
|
|
|
4f2909 |
--- a/callgrind/fn.c
|
|
|
4f2909 |
+++ b/callgrind/fn.c
|
|
|
4f2909 |
@@ -30,8 +30,11 @@
|
|
|
4f2909 |
|
|
|
4f2909 |
static fn_array current_fn_active;
|
|
|
4f2909 |
|
|
|
4f2909 |
-static Addr runtime_resolve_addr = 0;
|
|
|
4f2909 |
-static int runtime_resolve_length = 0;
|
|
|
4f2909 |
+/* x86_64 defines 4 variants. */
|
|
|
4f2909 |
+#define MAX_RESOLVE_ADDRS 4
|
|
|
4f2909 |
+static int runtime_resolve_addrs = 0;
|
|
|
4f2909 |
+static Addr runtime_resolve_addr[MAX_RESOLVE_ADDRS];
|
|
|
4f2909 |
+static int runtime_resolve_length[MAX_RESOLVE_ADDRS];
|
|
|
4f2909 |
|
|
|
4f2909 |
// a code pattern is a list of tuples (start offset, length)
|
|
|
4f2909 |
struct chunk_t { int start, len; };
|
|
|
4f2909 |
@@ -56,6 +59,9 @@ static Bool check_code(obj_node* obj,
|
|
|
4f2909 |
/* first chunk of pattern should always start at offset 0 and
|
|
|
4f2909 |
* have at least 3 bytes */
|
|
|
4f2909 |
CLG_ASSERT((pat->chunk[0].start == 0) && (pat->chunk[0].len >2));
|
|
|
4f2909 |
+
|
|
|
4f2909 |
+ /* and we cannot be called more than MAX_RESOLVE_ADDRS times */
|
|
|
4f2909 |
+ CLG_ASSERT(runtime_resolve_addrs < MAX_RESOLVE_ADDRS);
|
|
|
4f2909 |
|
|
|
4f2909 |
CLG_DEBUG(1, "check_code: %s, pattern %s, check %d bytes of [%x %x %x...]\n",
|
|
|
4f2909 |
obj->name, pat->name, pat->chunk[0].len, code[0], code[1], code[2]);
|
|
|
4f2909 |
@@ -93,8 +99,9 @@ static Bool check_code(obj_node* obj,
|
|
|
4f2909 |
pat->name, obj->name + obj->last_slash_pos,
|
|
|
4f2909 |
addr - obj->start, addr, pat->len);
|
|
|
4f2909 |
|
|
|
4f2909 |
- runtime_resolve_addr = addr;
|
|
|
4f2909 |
- runtime_resolve_length = pat->len;
|
|
|
4f2909 |
+ runtime_resolve_addr[runtime_resolve_addrs] = addr;
|
|
|
4f2909 |
+ runtime_resolve_length[runtime_resolve_addrs] = pat->len;
|
|
|
4f2909 |
+ runtime_resolve_addrs++;
|
|
|
4f2909 |
return True;
|
|
|
4f2909 |
}
|
|
|
4f2909 |
}
|
|
|
4f2909 |
@@ -138,8 +145,9 @@ static Bool search_runtime_resolve(obj_node* obj)
|
|
|
4f2909 |
"x86-glibc2.8", 30, {{ 0,12 }, { 16,14 }, { 30,0}} };
|
|
|
4f2909 |
|
|
|
4f2909 |
if (VG_(strncmp)(obj->name, "/lib/ld", 7) != 0) return False;
|
|
|
4f2909 |
- if (check_code(obj, code, &pat)) return True;
|
|
|
4f2909 |
- if (check_code(obj, code_28, &pat_28)) return True;
|
|
|
4f2909 |
+ Bool pat_p = check_code(obj, code, &pat);
|
|
|
4f2909 |
+ Bool pat_28_p = check_code(obj, code_28, &pat_28);
|
|
|
4f2909 |
+ if (pat_p || pat_28_p) return True;
|
|
|
4f2909 |
return False;
|
|
|
4f2909 |
#endif
|
|
|
4f2909 |
|
|
|
4f2909 |
@@ -186,9 +194,98 @@ static Bool search_runtime_resolve(obj_node* obj)
|
|
|
4f2909 |
static struct pattern pat = {
|
|
|
4f2909 |
"amd64-def", 110, {{ 0,62 }, { 66,44 }, { 110,0 }} };
|
|
|
4f2909 |
|
|
|
4f2909 |
+ static UChar code_xsavec[] = {
|
|
|
4f2909 |
+ /* 0*/ 0x53, 0x48, 0x89, 0xe3, 0x48, 0x83, 0xe4, 0xc0,
|
|
|
4f2909 |
+ /* 8*/ 0x48, 0x2b, 0x25, 0x00, 0x00, 0x00, 0x00, /* sub <i32>(%rip),%rsp */
|
|
|
4f2909 |
+ /*15*/ 0x48,
|
|
|
4f2909 |
+ /*16*/ 0x89, 0x04, 0x24, 0x48, 0x89, 0x4c, 0x24, 0x08,
|
|
|
4f2909 |
+ /*24*/ 0x48, 0x89, 0x54, 0x24, 0x10, 0x48, 0x89, 0x74,
|
|
|
4f2909 |
+ /*32*/ 0x24, 0x18, 0x48, 0x89, 0x7c, 0x24, 0x20, 0x4c,
|
|
|
4f2909 |
+ /*40*/ 0x89, 0x44, 0x24, 0x28, 0x4c, 0x89, 0x4c, 0x24,
|
|
|
4f2909 |
+ /*48*/ 0x30, 0xb8, 0xee, 0x00, 0x00, 0x00, 0x31, 0xd2,
|
|
|
4f2909 |
+ /*56*/ 0x48, 0x89, 0x94, 0x24, 0x50, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*64*/ 0x48, 0x89, 0x94, 0x24, 0x58, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*72*/ 0x48, 0x89, 0x94, 0x24, 0x60, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*80*/ 0x48, 0x89, 0x94, 0x24, 0x68, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*88*/ 0x48, 0x89, 0x94, 0x24, 0x70, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*96*/ 0x48, 0x89, 0x94, 0x24, 0x78, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*104*/0x0f, 0xc7, 0x64, 0x24, 0x40, 0x48, 0x8b, 0x73,
|
|
|
4f2909 |
+ /*112*/0x10, 0x48, 0x8b, 0x7b, 0x08,
|
|
|
4f2909 |
+ /*117*/0xe8, 0x00, 0x00, 0x00, 0x00, /* callq <_dl_fixup> */
|
|
|
4f2909 |
+ /*122*/0x49, 0x89, 0xc3, 0xb8, 0xee, 0x00,
|
|
|
4f2909 |
+ /*128*/0x00, 0x00, 0x31, 0xd2, 0x0f, 0xae, 0x6c, 0x24,
|
|
|
4f2909 |
+ /*136*/0x40, 0x4c, 0x8b, 0x4c, 0x24, 0x30, 0x4c, 0x8b,
|
|
|
4f2909 |
+ /*144*/0x44, 0x24, 0x28, 0x48, 0x8b, 0x7c, 0x24, 0x20,
|
|
|
4f2909 |
+ /*152*/0x48, 0x8b, 0x74, 0x24, 0x18, 0x48, 0x8b, 0x54,
|
|
|
4f2909 |
+ /*160*/0x24, 0x10, 0x48, 0x8b, 0x4c, 0x24, 0x08, 0x48,
|
|
|
4f2909 |
+ /*168*/0x8b, 0x04, 0x24, 0x48, 0x89, 0xdc, 0x48, 0x8b,
|
|
|
4f2909 |
+ /*176*/0x1c, 0x24, 0x48, 0x83, 0xc4, 0x18, 0xf2, 0x41,
|
|
|
4f2909 |
+ /*184*/0xff, 0xe3 };
|
|
|
4f2909 |
+ static struct pattern pat_xsavec = {
|
|
|
4f2909 |
+ "amd64-xsavec", 186, {{ 0,11 }, { 15,103 }, {122,64}, { 186,0 }} };
|
|
|
4f2909 |
+
|
|
|
4f2909 |
+ static UChar code_xsave[] = {
|
|
|
4f2909 |
+ /* 0*/ 0x53, 0x48, 0x89, 0xe3, 0x48, 0x83, 0xe4, 0xc0,
|
|
|
4f2909 |
+ /* 8*/ 0x48, 0x2b, 0x25, 0x00, 0x00, 0x00, 0x00, /* sub <i32>(%rip),%rsp */
|
|
|
4f2909 |
+ /*15*/ 0x48,
|
|
|
4f2909 |
+ /*16*/ 0x89, 0x04, 0x24, 0x48, 0x89, 0x4c, 0x24, 0x08,
|
|
|
4f2909 |
+ /*24*/ 0x48, 0x89, 0x54, 0x24, 0x10, 0x48, 0x89, 0x74,
|
|
|
4f2909 |
+ /*32*/ 0x24, 0x18, 0x48, 0x89, 0x7c, 0x24, 0x20, 0x4c,
|
|
|
4f2909 |
+ /*40*/ 0x89, 0x44, 0x24, 0x28, 0x4c, 0x89, 0x4c, 0x24,
|
|
|
4f2909 |
+ /*48*/ 0x30, 0xb8, 0xee, 0x00, 0x00, 0x00, 0x31, 0xd2,
|
|
|
4f2909 |
+ /*56*/ 0x48, 0x89, 0x94, 0x24, 0x40, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*64*/ 0x48, 0x89, 0x94, 0x24, 0x48, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*72*/ 0x48, 0x89, 0x94, 0x24, 0x50, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*80*/ 0x48, 0x89, 0x94, 0x24, 0x58, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*88*/ 0x48, 0x89, 0x94, 0x24, 0x60, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*96*/ 0x48, 0x89, 0x94, 0x24, 0x68, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*104*/0x48, 0x89, 0x94, 0x24, 0x70, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*112*/0x48, 0x89, 0x94, 0x24, 0x78, 0x02, 0x00, 0x00,
|
|
|
4f2909 |
+ /*120*/0x0f, 0xae, 0x64, 0x24, 0x40, 0x48, 0x8b, 0x73,
|
|
|
4f2909 |
+ /*128*/0x10, 0x48, 0x8b, 0x7b, 0x08,
|
|
|
4f2909 |
+ /*133*/0xe8, 0x00, 0x00, 0x00, 0x00, /* callq <_dl_fixup> */
|
|
|
4f2909 |
+ /*138*/0x49, 0x89, 0xc3, 0xb8, 0xee, 0x00,
|
|
|
4f2909 |
+ /*144*/0x00, 0x00, 0x31, 0xd2, 0x0f, 0xae, 0x6c, 0x24,
|
|
|
4f2909 |
+ /*152*/0x40, 0x4c, 0x8b, 0x4c, 0x24, 0x30, 0x4c, 0x8b,
|
|
|
4f2909 |
+ /*160*/0x44, 0x24, 0x28, 0x48, 0x8b, 0x7c, 0x24, 0x20,
|
|
|
4f2909 |
+ /*168*/0x48, 0x8b, 0x74, 0x24, 0x18, 0x48, 0x8b, 0x54,
|
|
|
4f2909 |
+ /*176*/0x24, 0x10, 0x48, 0x8b, 0x4c, 0x24, 0x08, 0x48,
|
|
|
4f2909 |
+ /*184*/0x8b, 0x04, 0x24, 0x48, 0x89, 0xdc, 0x48, 0x8b,
|
|
|
4f2909 |
+ /*192*/0x1c, 0x24, 0x48, 0x83, 0xc4, 0x18, 0xf2, 0x41,
|
|
|
4f2909 |
+ /*200*/0xff, 0xe3 };
|
|
|
4f2909 |
+ static struct pattern pat_xsave = {
|
|
|
4f2909 |
+ "amd64-xsave", 202, {{ 0,11 }, { 15,119 }, {138,64}, { 202,0 }} };
|
|
|
4f2909 |
+
|
|
|
4f2909 |
+ static UChar code_fxsave[] = {
|
|
|
4f2909 |
+ /* 0*/ 0x53, 0x48, 0x89, 0xe3, 0x48, 0x83, 0xe4, 0xf0,
|
|
|
4f2909 |
+ /* 8*/ 0x48, 0x81, 0xec, 0x40, 0x02, 0x00, 0x00, 0x48,
|
|
|
4f2909 |
+ /*16*/ 0x89, 0x04, 0x24, 0x48, 0x89, 0x4c, 0x24, 0x08,
|
|
|
4f2909 |
+ /*24*/ 0x48, 0x89, 0x54, 0x24, 0x10, 0x48, 0x89, 0x74,
|
|
|
4f2909 |
+ /*32*/ 0x24, 0x18, 0x48, 0x89, 0x7c, 0x24, 0x20, 0x4c,
|
|
|
4f2909 |
+ /*40*/ 0x89, 0x44, 0x24, 0x28, 0x4c, 0x89, 0x4c, 0x24,
|
|
|
4f2909 |
+ /*48*/ 0x30, 0x0f, 0xae, 0x44, 0x24, 0x40, 0x48, 0x8b,
|
|
|
4f2909 |
+ /*56*/ 0x73, 0x10, 0x48, 0x8b, 0x7b, 0x08,
|
|
|
4f2909 |
+ /*62*/ 0xe8, 0x00, 0x00, 0x00, 0x00, /* callq <_dl_fixup> */
|
|
|
4f2909 |
+ /*67*/ 0x49, 0x89, 0xc3, 0x0f, 0xae,
|
|
|
4f2909 |
+ /*72*/ 0x4c, 0x24, 0x40, 0x4c, 0x8b, 0x4c, 0x24, 0x30,
|
|
|
4f2909 |
+ /*80*/ 0x4c, 0x8b, 0x44, 0x24, 0x28, 0x48, 0x8b, 0x7c,
|
|
|
4f2909 |
+ /*88*/ 0x24, 0x20, 0x48, 0x8b, 0x74, 0x24, 0x18, 0x48,
|
|
|
4f2909 |
+ /*96*/ 0x8b, 0x54, 0x24, 0x10, 0x48, 0x8b, 0x4c, 0x24,
|
|
|
4f2909 |
+ /*104*/0x08, 0x48, 0x8b, 0x04, 0x24, 0x48, 0x89, 0xdc,
|
|
|
4f2909 |
+ /*112*/0x48, 0x8b, 0x1c, 0x24, 0x48, 0x83, 0xc4, 0x18,
|
|
|
4f2909 |
+ /*120*/0xf2, 0x41, 0xff, 0xe3 };
|
|
|
4f2909 |
+ static struct pattern pat_fxsave = {
|
|
|
4f2909 |
+ "amd64-fxsave", 124, {{ 0,63 }, { 67,57 }, { 124,0 }} };
|
|
|
4f2909 |
+
|
|
|
4f2909 |
if ((VG_(strncmp)(obj->name, "/lib/ld", 7) != 0) &&
|
|
|
4f2909 |
- (VG_(strncmp)(obj->name, "/lib64/ld", 9) != 0)) return False;
|
|
|
4f2909 |
- return check_code(obj, code, &pat);
|
|
|
4f2909 |
+ (VG_(strncmp)(obj->name, "/lib64/ld", 9) != 0) &&
|
|
|
4f2909 |
+ (VG_(strncmp)(obj->name, "/usr/lib/ld", 11) != 0) &&
|
|
|
4f2909 |
+ (VG_(strncmp)(obj->name, "/usr/lib64/ld", 13) != 0)) return False;
|
|
|
4f2909 |
+ Bool pat_p = check_code(obj, code, &pat);
|
|
|
4f2909 |
+ Bool pat_xsavec_p = check_code(obj, code_xsavec, &pat_xsavec);
|
|
|
4f2909 |
+ Bool pat_xsave_p = check_code(obj, code_xsave, &pat_xsave);
|
|
|
4f2909 |
+ Bool pat_fxsave_p = check_code(obj, code_fxsave, &pat_fxsave);
|
|
|
4f2909 |
+ if (pat_p || pat_xsavec_p || pat_xsave_p || pat_fxsave_p) return True;
|
|
|
4f2909 |
#endif
|
|
|
4f2909 |
|
|
|
4f2909 |
/* For other platforms, no patterns known */
|
|
|
4f2909 |
@@ -254,7 +351,7 @@ obj_node* new_obj_node(DebugInfo* di, obj_node* next)
|
|
|
4f2909 |
i++;
|
|
|
4f2909 |
}
|
|
|
4f2909 |
|
|
|
4f2909 |
- if (runtime_resolve_addr == 0) search_runtime_resolve(obj);
|
|
|
4f2909 |
+ if (runtime_resolve_addrs == 0) search_runtime_resolve(obj);
|
|
|
4f2909 |
|
|
|
4f2909 |
return obj;
|
|
|
4f2909 |
}
|
|
|
4f2909 |
@@ -490,6 +587,7 @@ fn_node* CLG_(get_fn_node)(BB* bb)
|
|
|
4f2909 |
DebugInfo* di;
|
|
|
4f2909 |
UInt line_num;
|
|
|
4f2909 |
fn_node* fn;
|
|
|
4f2909 |
+ Int i;
|
|
|
4f2909 |
|
|
|
4f2909 |
/* fn from debug info is idempotent for a BB */
|
|
|
4f2909 |
if (bb->fn) return bb->fn;
|
|
|
4f2909 |
@@ -538,12 +636,14 @@ fn_node* CLG_(get_fn_node)(BB* bb)
|
|
|
4f2909 |
}
|
|
|
4f2909 |
if (0 == VG_(strcmp)(fnname, "_exit") && !exit_bb)
|
|
|
4f2909 |
exit_bb = bb;
|
|
|
4f2909 |
-
|
|
|
4f2909 |
- if (runtime_resolve_addr &&
|
|
|
4f2909 |
- (bb_addr(bb) >= runtime_resolve_addr) &&
|
|
|
4f2909 |
- (bb_addr(bb) < runtime_resolve_addr + runtime_resolve_length)) {
|
|
|
4f2909 |
- /* BB in runtime_resolve found by code check; use this name */
|
|
|
4f2909 |
- fnname = "_dl_runtime_resolve";
|
|
|
4f2909 |
+
|
|
|
4f2909 |
+ for (i = 0; i < runtime_resolve_addrs; i++) {
|
|
|
4f2909 |
+ if ((bb_addr(bb) >= runtime_resolve_addr[i]) &&
|
|
|
4f2909 |
+ (bb_addr(bb) < runtime_resolve_addr[i] + runtime_resolve_length[i])) {
|
|
|
4f2909 |
+ /* BB in runtime_resolve found by code check; use this name */
|
|
|
4f2909 |
+ fnname = "_dl_runtime_resolve";
|
|
|
4f2909 |
+ break;
|
|
|
4f2909 |
+ }
|
|
|
4f2909 |
}
|
|
|
4f2909 |
|
|
|
4f2909 |
/* get fn_node struct for this function */
|