DynamoRIO
average_bb_size.p5

In this variation we use inlined atomic instructions to adjust the counters. On a single-core machine this form should be quite fast, but on a multi-core machine the cache-line locking required by atomic operations will slow things down dramatically. We'll look at forms more suitable for multi-core machines further on.

#include "dr_api.h"
/* DISPLAY_STRING(msg): present a result string to the user.
 * When WINDOWS is defined the message is handed to dr_messagebox();
 * otherwise it is written with dr_printf() followed by a newline. */
#ifdef WINDOWS
# define DISPLAY_STRING(msg) dr_messagebox(msg)
#else
# define DISPLAY_STRING(msg) dr_printf("%s\n", msg)
#endif
/* Running totals for a set of basic blocks. */
typedef struct bb_counts {
uint64 blocks; /* number of basic blocks counted */
uint64 total_size; /* sum of the instruction counts of those blocks */
} bb_counts;
/* Totals for blocks as they are built; updated in event_basic_block() while
 * as_built_lock is held. */
static bb_counts counts_as_built;
/* Mutex protecting counts_as_built; created in dr_client_main() and destroyed
 * in event_exit(). */
void *as_built_lock;
/* Totals for blocks as they execute; adjusted by the LOCK-prefixed
 * instructions that event_basic_block() creates for each block rather than
 * under a mutex. */
static bb_counts counts_dynamic;
static void
event_exit(void);
event_basic_block(void *drcontext, void *tag, instrlist_t *bb,
bool for_trace, bool translating);
/* Client entry point.
 *
 * Registers the exit and basic-block callbacks and creates the mutex that
 * guards counts_as_built.
 *
 * id, argc and argv are supplied by DynamoRIO and are not used here.
 */
DR_EXPORT void
dr_client_main(client_id_t id, int argc, const char *argv[])
{
    /* register events; without the exit event the results would never be
     * displayed and as_built_lock would never be destroyed */
    dr_register_exit_event(event_exit);
    dr_register_bb_event(event_basic_block);

    /* initialize lock */
    as_built_lock = dr_mutex_create();
}
static void
event_exit(void)
{
/* Display results - we must first snpritnf the string as on windows
* dr_printf(), dr_messagebox() and dr_fprintf() can't print floats. */
char msg[512];
int len;
len = snprintf(msg, sizeof(msg)/sizeof(msg[0]),
"Number of blocks built : %"UINT64_FORMAT_CODE"\n"
" Average size : %5.2lf instructions\n"
"Number of blocks executed : %"UINT64_FORMAT_CODE"\n"
" Average weighted size : %5.2lf instructions\n",
counts_as_built.blocks,
counts_as_built.total_size / (double)counts_as_built.blocks,
counts_dynamic.blocks,
counts_dynamic.total_size / (double)counts_dynamic.blocks);
DR_ASSERT(len > 0);
msg[sizeof(msg)/sizeof(msg[0])-1] = '\0';
DISPLAY_STRING(msg);
/* free mutex */
dr_mutex_destroy(as_built_lock);
}
event_basic_block(void *drcontext, void *tag, instrlist_t *bb,
bool for_trace, bool translating)
{
uint num_instructions = 0;
instr_t *instr, *where = NULL;
/* count the number of instructions in this block */
for (instr = instrlist_first(bb); instr != NULL; instr = instr_get_next(instr)) {
num_instructions++;
}
/* update the as-built counts */
dr_mutex_lock(as_built_lock);
counts_as_built.blocks++;
counts_as_built.total_size += num_instructions;
dr_mutex_unlock(as_built_lock);
+ /* increment counters */
+ where = instrlist_first(bb);
+ dr_save_arith_flags(drcontext, bb, where, SPILL_SLOT_1);
+ #ifdef X86_32
+ /* Since the counters are 64-bit we must use an add + an addc to increment.
+ * The operations is still effectively atomic since we're only increasing
+ * the count. */
+ LOCK(INSTR_CREATE_add(drcontext,
+ OPND_CREATE_ABSMEM((byte *)&counts_dynamic.blocks, OPSZ_4),
+ LOCK(INSTR_CREATE_adc(drcontext,
+ OPND_CREATE_ABSMEM((byte *)&counts_dynamic.blocks + 4, OPSZ_4),
+
+ LOCK(INSTR_CREATE_add(drcontext,
+ OPND_CREATE_ABSMEM((byte *)&counts_dynamic.total_size, OPSZ_4),
+ OPND_CREATE_INT_32OR8(num_instructions))));
+ LOCK(INSTR_CREATE_adc(drcontext,
+ OPND_CREATE_ABSMEM((byte *)&counts_dynamic.total_size + 4, OPSZ_4),
+ #else /* X86_64 */
+ LOCK(INSTR_CREATE_inc(drcontext,
+ OPND_CREATE_ABSMEM((byte *)&counts_dynamic.blocks, OPSZ_8))));
+ LOCK(INSTR_CREATE_add(drcontext,
+ OPND_CREATE_ABSMEM((byte *)&counts_dynamic.total_size, OPSZ_8),
+ OPND_CREATE_INT_32OR8(num_instructions))));
+ #endif
+ dr_restore_arith_flags(drcontext, bb, where, SPILL_SLOT_1);
+
}

[ prev | next ]

DR_API void dr_restore_arith_flags(void *drcontext, instrlist_t *ilist, instr_t *where, dr_spill_slot_t slot)
#define DR_ASSERT(x)
Definition: dr_tools.h:114
DR_API void dr_mutex_lock(void *mutex)
DR_API instr_t * instrlist_first(instrlist_t *ilist)
Top-level include file for DynamoRIO API.
#define INSTR_CREATE_inc(dc, d)
Definition: dr_ir_macros_x86.h:1589
DR_EXPORT void dr_client_main(client_id_t id, int argc, const char *argv[])
#define OPND_CREATE_ABSMEM(addr, size)
Definition: dr_ir_macros_aarch64.h:102
#define LOCK(instr_ptr)
Definition: dr_ir_macros_x86.h:60
#define OPND_CREATE_INT8(val)
Definition: dr_ir_macros.h:136
DR_API void * dr_mutex_create(void)
#define INSTR_CREATE_adc(dc, Rd, Rn, Rm_or_imm)
Definition: dr_ir_macros_arm.h:1191
DR_API INSTR_INLINE instr_t * instr_get_next(instr_t *instr)
DR_API void dr_save_arith_flags(void *drcontext, instrlist_t *ilist, instr_t *where, dr_spill_slot_t slot)
dr_emit_flags_t
Definition: dr_events.h:138
DR_API void instrlist_meta_preinsert(instrlist_t *ilist, instr_t *where, instr_t *instr)
#define OPND_CREATE_INT_32OR8(val)
Definition: dr_ir_macros.h:143
struct _instrlist_t instrlist_t
Definition: dr_defines.h:885
DR_API void dr_mutex_unlock(void *mutex)
DR_API void dr_register_bb_event(dr_emit_flags_t(*func)(void *drcontext, void *tag, instrlist_t *bb, bool for_trace, bool translating))
@ OPSZ_8
Definition: dr_ir_opnd.h:87
DR_API void dr_register_exit_event(void(*func)(void))
#define INSTR_CREATE_add(dc, Rd, Rn, Rm_or_imm)
Definition: dr_ir_macros_arm.h:1201
DR_API void dr_mutex_destroy(void *mutex)
@ DR_EMIT_DEFAULT
Definition: dr_events.h:140
Definition: dr_defines.h:378
@ OPSZ_4
Definition: dr_ir_opnd.h:85
uint client_id_t
Definition: dr_defines.h:357