Source code
Revision control
Copy as Markdown
Other Tools
/* -*- Mode: C++; c-basic-offset: 2; indent-tabs-mode: t; tab-width: 4 -*- */
/* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
//
// Here are a few examples of using the value-profiling utility:
//
// _vprof (e);
// at the end of program execution, you'll get a dump of the source location
// of this probe, its min, max, average, the total sum of all instances of e,
// and the total number of times this probe was called.
//
// _vprof (x > 0);
// shows how many times and what percentage of the cases x was > 0,
// that is the probablitiy that x > 0.
//
// _vprof (n % 2 == 0);
// shows how many times n was an even number
// as well as th probablitiy of n being an even number.
//
// _hprof (n, 4, 1000, 5000, 5001, 10000);
// gives you the histogram of n over the given 4 bucket boundaries:
// # cases < 1000
// # cases >= 1000 and < 5000
// # cases >= 5000 and < 5001
// # cases >= 5001 and < 10000
// # cases >= 10000
//
// _nvprof ("event name", value);
// all instances with the same name are merged
// so, you can call _vprof with the same event name at difference places
//
// _vprof (e, myProbe);
// value profile e and call myProbe (void* vprofID) at the profiling point.
// inside the probe, the client has the predefined variables:
// _VAL, _COUNT, _SUM, _MIN, _MAX, and the general purpose registers
// _IVAR1, ..., IVAR4 general integer registrs
// _I64VAR1, ..., I64VAR4 general integer64 registrs
// _DVAR1, ..., _DVAR4 general double registers
// _GENPTR a generic pointer that can be used by the client
// the number of registers can be changed in vprof.h
//
#ifndef devtools_vprof_vprof_h
#define devtools_vprof_vprof_h
//
// If the application for which you want to use vprof is threaded, THREADED must
// be defined as 1, otherwise define it as 0
//
// If your application is not threaded, define THREAD_SAFE 0,
// otherwise, you have the option of setting THREAD_SAFE to 1 which results in
// exact counts or to 0 which results in a much more efficient but non-exact
// counts
//
#define THREADED 0
#define THREAD_SAFE 0
#include "VMPI.h"
// Note, this is not supported in configurations with more than one AvmCore
// running in the same process.
// portable align macro
#if defined(_MSC_VER)
# define vprof_align8(t) __declspec(align(8)) t
#elif defined(__GNUC__)
# define vprof_align8(t) t __attribute__((aligned(8)))
#elif defined(__SUNPRO_C) || defined(__SUNPRO_CC)
# define vprof_align8(t) t __attribute__((aligned(8)))
#elif defined(VMCFG_SYMBIAN)
# define vprof_align8(t) t __attribute__((aligned(8)))
#endif
#ifdef __cplusplus
extern "C" {
#endif
int initValueProfile(void** id, char* file, int line, ...);
int profileValue(void* id, int64_t value);
int initHistProfile(void** id, char* file, int line, int nbins, ...);
int histValue(void* id, int64_t value);
uint64_t readTimestampCounter();
#ifdef __cplusplus
}
#endif
// #define DOPROF
#ifndef DOPROF
# define _nvprof(e, v)
# ifndef VMCFG_SYMBIAN
# define _vprof(v, ...)
# define _hprof(v, n, ...)
# define _nhprof(e, v, n, ...)
# define _ntprof_begin(e)
# define _ntprof_end(e)
# define _jvprof_init(id, ...)
# define _jnvprof_init(id, e, ...)
# define _jhprof_init(id, n, ...)
# define _jnhprof_init(id, e, n, ...)
# define _jvprof(id, v)
# define _jhprof(id, v)
# endif // ! VMCFG_SYMBIAN
#else
// Historical/compatibility note:
// The macros below were originally written using conditional expressions, not
// if/else. The original author said that this was done to allow _vprof and
// _nvprof to be used in an expression context, but the old code had already
// wrapped the macro bodies in { }, so it is not clear how this could have
// worked. At present, the profiling macros must appear in a statement context
// only.
# define _vprof(v, ...) \
do { \
static void* id = 0; \
if (id == 0) \
initValueProfile(&id, __FILE__, __LINE__, ##__VA_ARGS__, NULL); \
profileValue(id, (int64_t)(v)); \
} while (0)
# define _nvprof(e, v) \
do { \
static void* id = 0; \
if (id == 0) initValueProfile(&id, (char*)(e), -1, NULL); \
profileValue(id, (int64_t)(v)); \
} while (0)
# define _hprof(v, n, ...) \
do { \
static void* id = 0; \
if (id == 0) \
initHistProfile(&id, __FILE__, __LINE__, (int)(n), ##__VA_ARGS__); \
histValue(id, (int64_t)(v)); \
} while (0)
# define _nhprof(e, v, n, ...) \
do { \
static void* id = 0; \
if (id == 0) \
initHistProfile(&id, (char*)(e), -1, (int)(n), ##__VA_ARGS__); \
histValue(id, (int64_t)(v)); \
} while (0)
// Profile execution time between _ntprof_begin(e) and _ntprof_end(e).
// The tag 'e' must match at the beginning and end of the region to
// be timed. Regions may be nested or overlap arbitrarily, as it is
// the tag alone that defines the begin/end correspondence.
# define _ntprof_begin(e) \
do { \
static void* id = 0; \
if (id == 0) initValueProfile(&id, (char*)(e), -1, NULL); \
((entry_t)id)->i64var[0] = readTimestampCounter(); \
} while (0)
// Assume 2.6 Ghz CPU
# define TICKS_PER_USEC 2600
# define _ntprof_end(e) \
do { \
static void* id = 0; \
uint64_t stop = readTimestampCounter(); \
if (id == 0) initValueProfile(&id, (char*)(e), -1, NULL); \
uint64_t start = ((entry_t)id)->i64var[0]; \
uint64_t usecs = (stop - start) / TICKS_PER_USEC; \
profileValue(id, usecs); \
} while (0)
// These macros separate the creation of a profile record from its later usage.
// They are intended for profiling JIT-generated code. Once created, the JIT
// can bind a pointer to the profile record into the generated code, which can
// then record profile events during execution.
# define _jvprof_init(id, ...) \
if (*(id) == 0) \
initValueProfile((id), __FILE__, __LINE__, ##__VA_ARGS__, NULL)
# define _jnvprof_init(id, e, ...) \
if (*(id) == 0) initValueProfile((id), (char*)(e), -1, ##__VA_ARGS__, NULL)
# define _jhprof_init(id, n, ...) \
if (*(id) == 0) \
initHistProfile((id), __FILE__, __LINE__, (int)(n), ##__VA_ARGS__)
# define _jnhprof_init(id, e, n, ...) \
if (*(id) == 0) \
initHistProfile((id), (char*)(e), -1, (int)(n), ##__VA_ARGS__)
// Calls to the _jvprof and _jhprof macros must be wrapped in a non-inline
// function in order to be invoked from JIT-compiled code.
# define _jvprof(id, v) profileValue((id), (int64_t)(v))
# define _jhprof(id, v) histValue((id), (int64_t)(v))
#endif
#define NUM_EVARS 4
enum { LOCK_IS_FREE = 0, LOCK_IS_TAKEN = 1 };
extern
#ifdef __cplusplus
"C"
#endif
long
_InterlockedCompareExchange(long volatile* Destination, long Exchange,
long Comperand);
typedef struct hist hist;
typedef struct hist {
int nbins;
int64_t* lb;
int64_t* count;
}* hist_t;
typedef struct entry entry;
typedef struct entry {
long lock;
char* file;
int line;
int64_t value;
int64_t count;
int64_t sum;
int64_t min;
int64_t max;
void (*func)(void*);
hist* h;
entry* next;
// exposed to the clients
void* genptr;
int ivar[NUM_EVARS];
vprof_align8(int64_t) i64var[NUM_EVARS];
vprof_align8(double) dvar[NUM_EVARS];
//
char pad[128]; // avoid false sharing
}* entry_t;
#define _VAL ((entry_t)vprofID)->value
#define _COUNT ((entry_t)vprofID)->count
#define _SUM ((entry_t)vprofID)->sum
#define _MIN ((entry_t)vprofID)->min
#define _MAX ((entry_t)vprofID)->max
#define _GENPTR ((entry_t)vprofID)->genptr
#define _IVAR0 ((entry_t)vprofID)->ivar[0]
#define _IVAR1 ((entry_t)vprofID)->ivar[1]
#define _IVAR2 ((entry_t)vprofID)->ivar[2]
#define _IVAR3 ((entry_t)vprofID)->ivar[3]
#define _I64VAR0 ((entry_t)vprofID)->i64var[0]
#define _I64VAR1 ((entry_t)vprofID)->i64var[1]
#define _I64VAR2 ((entry_t)vprofID)->i64var[2]
#define _I64VAR3 ((entry_t)vprofID)->i64var[3]
#define _DVAR0 ((entry_t)vprofID)->dvar[0]
#define _DVAR1 ((entry_t)vprofID)->dvar[1]
#define _DVAR2 ((entry_t)vprofID)->dvar[2]
#define _DVAR3 ((entry_t)vprofID)->dvar[3]
#endif /* devtools_vprof_vprof_h */