Avoids a lot of cache line bouncing for threads.
Signed-off-by: Jens Axboe <axboe@kernel.dk>
#ifdef ARCH_HAVE_CPU_CLOCK
static unsigned long cycles_per_usec;
#ifdef ARCH_HAVE_CPU_CLOCK
static unsigned long cycles_per_usec;
-static unsigned long last_cycles;
int tsc_reliable = 0;
#endif
struct tv_valid {
struct timeval last_tv;
int last_tv_valid;
int tsc_reliable = 0;
#endif
struct tv_valid {
struct timeval last_tv;
int last_tv_valid;
+ unsigned long last_cycles;
};
static pthread_key_t tv_tls_key;
};
static pthread_key_t tv_tls_key;
void fio_gettime(struct timeval *tp, void fio_unused *caller)
#endif
{
void fio_gettime(struct timeval *tp, void fio_unused *caller)
#endif
{
#ifdef FIO_DEBUG_TIME
if (!caller)
#ifdef FIO_DEBUG_TIME
if (!caller)
+ tv = pthread_getspecific(tv_tls_key);
+
switch (fio_clock_source) {
case CS_GTOD:
gettimeofday(tp, NULL);
switch (fio_clock_source) {
case CS_GTOD:
gettimeofday(tp, NULL);
unsigned long long usecs, t;
t = get_cpu_clock();
unsigned long long usecs, t;
t = get_cpu_clock();
+ if (tv && t < tv->last_cycles) {
dprint(FD_TIME, "CPU clock going back in time\n");
dprint(FD_TIME, "CPU clock going back in time\n");
+ t = tv->last_cycles;
+ } else if (tv)
+ tv->last_cycles = t;
usecs = t / cycles_per_usec;
tp->tv_sec = usecs / 1000000;
tp->tv_usec = usecs % 1000000;
usecs = t / cycles_per_usec;
tp->tv_sec = usecs / 1000000;
tp->tv_usec = usecs % 1000000;
* If Linux is using the tsc clock on non-synced processors,
* sometimes time can appear to drift backwards. Fix that up.
*/
* If Linux is using the tsc clock on non-synced processors,
* sometimes time can appear to drift backwards. Fix that up.
*/
- t = pthread_getspecific(tv_tls_key);
- if (t) {
- if (t->last_tv_valid) {
- if (tp->tv_sec < t->last_tv.tv_sec)
- tp->tv_sec = t->last_tv.tv_sec;
- else if (t->last_tv.tv_sec == tp->tv_sec &&
- tp->tv_usec < t->last_tv.tv_usec)
- tp->tv_usec = t->last_tv.tv_usec;
+ if (tv) {
+ if (tv->last_tv_valid) {
+ if (tp->tv_sec < tv->last_tv.tv_sec)
+ tp->tv_sec = tv->last_tv.tv_sec;
+ else if (tv->last_tv.tv_sec == tp->tv_sec &&
+ tp->tv_usec < tv->last_tv.tv_usec)
+ tp->tv_usec = tv->last_tv.tv_usec;
- t->last_tv_valid = 1;
- memcpy(&t->last_tv, tp, sizeof(*tp));
+ tv->last_tv_valid = 1;
+ memcpy(&tv->last_tv, tp, sizeof(*tp));