X-Git-Url: https://git.kernel.dk/?a=blobdiff_plain;f=iolog.h;h=981081f9a1b087cfbc6b82d25e2ffbdba5ec7b9e;hb=HEAD;hp=0da70670c796ef1e8685394d88bb455a843d917b;hpb=423671679fef3932894b58748d532f06cf0533b2;p=fio.git diff --git a/iolog.h b/iolog.h index 0da70670..e864d169 100644 --- a/iolog.h +++ b/iolog.h @@ -1,10 +1,12 @@ #ifndef FIO_IOLOG_H #define FIO_IOLOG_H +#include + #include "lib/rbtree.h" #include "lib/ieee754.h" #include "flist.h" -#include "ioengine.h" +#include "ioengines.h" /* * Use for maintaining statistics @@ -18,19 +20,49 @@ struct io_stat { fio_fp64_t S; }; +struct io_hist { + uint64_t samples; + unsigned long hist_last; + struct flist_head list; +}; + +enum { + IO_LOG_SAMPLE_AVG = 0, + IO_LOG_SAMPLE_MAX, + IO_LOG_SAMPLE_BOTH, +}; + +struct io_sample_value { + uint64_t val0; + uint64_t val1; +}; + +union io_sample_data { + struct io_sample_value val; + struct io_u_plat_entry *plat_entry; +}; + +#define sample_val(value) ((union io_sample_data) { .val.val0 = value }) +#define sample_plat(plat) ((union io_sample_data) { .plat_entry = plat }) + /* * A single data sample */ struct io_sample { uint64_t time; - uint64_t val; + union io_sample_data data; uint32_t __ddir; - uint32_t bs; + uint16_t priority; + uint64_t bs; + uint64_t aux[]; }; -struct io_sample_offset { - struct io_sample s; - uint64_t offset; +/* + * Enumerate indexes of auxiliary log data in struct io_sample aux[] array + */ +enum { + IOS_AUX_OFFSET_INDEX, + IOS_AUX_ISSUE_TIME_INDEX, }; enum { @@ -39,6 +71,7 @@ enum { IO_LOG_TYPE_SLAT, IO_LOG_TYPE_BW, IO_LOG_TYPE_IOPS, + IO_LOG_TYPE_HIST, }; #define DEF_LOG_ENTRIES 1024 @@ -85,6 +118,16 @@ struct io_log { */ unsigned int log_offset; + /* + * Log I/O priorities + */ + unsigned int log_prio; + + /* + * Log I/O issuing time + */ + unsigned int log_issue_time; + /* * Max size of log entries before a chunk is compressed */ @@ -101,18 +144,48 @@ struct io_log { */ struct io_stat avg_window[DDIR_RWDIR_CNT]; unsigned long avg_msec; - unsigned long avg_last; + unsigned long avg_last[DDIR_RWDIR_CNT]; + + /* + * Windowed latency histograms, for keeping track of when we need to + * save a copy of the histogram every approximately hist_msec + * milliseconds. + */ + struct io_hist hist_window[DDIR_RWDIR_CNT]; + unsigned long hist_msec; + unsigned int hist_coarseness; pthread_mutex_t chunk_lock; unsigned int chunk_seq; struct flist_head chunk_list; + + pthread_mutex_t deferred_free_lock; +#define IOLOG_MAX_DEFER 8 + void *deferred_items[IOLOG_MAX_DEFER]; + unsigned int deferred; }; /* * If the upper bit is set, then we have the offset as well */ #define LOG_OFFSET_SAMPLE_BIT 0x80000000U -#define io_sample_ddir(io) ((io)->__ddir & ~LOG_OFFSET_SAMPLE_BIT) +/* + * If the bit following the upper bit is set, then we have the priority + */ +#define LOG_PRIO_SAMPLE_BIT 0x40000000U +/* + * If the bit following prioity sample vit is set, we report both avg and max + */ +#define LOG_AVG_MAX_SAMPLE_BIT 0x20000000U +/* + * If the bit following AVG_MAX_SAMPLE_BIT is set, we report the issue time also + */ +#define LOG_ISSUE_TIME_SAMPLE_BIT 0x10000000U + +#define LOG_SAMPLE_BITS (LOG_OFFSET_SAMPLE_BIT | LOG_PRIO_SAMPLE_BIT |\ + LOG_AVG_MAX_SAMPLE_BIT |\ + LOG_ISSUE_TIME_SAMPLE_BIT) +#define io_sample_ddir(io) ((io)->__ddir & ~LOG_SAMPLE_BITS) static inline void io_sample_set_ddir(struct io_log *log, struct io_sample *io, @@ -121,35 +194,49 @@ static inline void io_sample_set_ddir(struct io_log *log, io->__ddir = ddir | log->log_ddir_mask; } -static inline size_t __log_entry_sz(int log_offset) +static inline size_t __log_entry_sz(bool log_offset, bool log_issue_time) { + size_t ret = sizeof(struct io_sample); + if (log_offset) - return sizeof(struct io_sample_offset); - else - return sizeof(struct io_sample); + ret += sizeof(uint64_t); + + if (log_issue_time) + ret += sizeof(uint64_t); + + return ret; } static inline size_t log_entry_sz(struct io_log *log) { - return __log_entry_sz(log->log_offset); + return __log_entry_sz(log->log_offset, log->log_issue_time); } -static inline struct io_sample *__get_sample(void *samples, int log_offset, +static inline size_t log_sample_sz(struct io_log *log, struct io_logs *cur_log) +{ + return cur_log->nr_samples * log_entry_sz(log); +} + +static inline struct io_sample *__get_sample(void *samples, bool log_offset, + bool log_issue_time, uint64_t sample) { - uint64_t sample_offset = sample * __log_entry_sz(log_offset); + uint64_t sample_offset = sample * + __log_entry_sz(log_offset, log_issue_time); return (struct io_sample *) ((char *) samples + sample_offset); } struct io_logs *iolog_cur_log(struct io_log *); uint64_t iolog_nr_samples(struct io_log *); void regrow_logs(struct thread_data *); +void regrow_agg_logs(void); static inline struct io_sample *get_sample(struct io_log *iolog, struct io_logs *cur_log, uint64_t sample) { - return __get_sample(cur_log->log, iolog->log_offset, sample); + return __get_sample(cur_log->log, + iolog->log_offset, iolog->log_issue_time, sample); } enum { @@ -164,7 +251,7 @@ enum { */ struct io_piece { union { - struct rb_node rb_node; + struct fio_rb_node rb_node; struct flist_head list; }; struct flist_head trim_list; @@ -177,10 +264,8 @@ struct io_piece { unsigned long len; unsigned int flags; enum fio_ddir ddir; - union { - unsigned long delay; - unsigned int file_action; - }; + unsigned long delay; + unsigned int file_action; }; /* @@ -197,16 +282,20 @@ struct io_u; extern int __must_check read_iolog_get(struct thread_data *, struct io_u *); extern void log_io_u(const struct thread_data *, const struct io_u *); extern void log_file(struct thread_data *, struct fio_file *, enum file_log_act); -extern int __must_check init_iolog(struct thread_data *td); +extern bool __must_check init_iolog(struct thread_data *td); extern void log_io_piece(struct thread_data *, struct io_u *); extern void unlog_io_piece(struct thread_data *, struct io_u *); -extern void trim_io_piece(struct thread_data *, const struct io_u *); +extern void trim_io_piece(const struct io_u *); extern void queue_io_piece(struct thread_data *, struct io_piece *); extern void prune_io_piece_log(struct thread_data *); extern void write_iolog_close(struct thread_data *); +int64_t iolog_items_to_fetch(struct thread_data *td); extern int iolog_compress_init(struct thread_data *, struct sk_out *); extern void iolog_compress_exit(struct thread_data *); extern size_t log_chunk_sizes(struct io_log *); +extern int init_io_u_buffers(struct thread_data *); +extern unsigned long long delay_since_ttime(const struct thread_data *, + unsigned long long); #ifdef CONFIG_ZLIB extern int iolog_file_inflate(const char *); @@ -218,8 +307,12 @@ extern int iolog_file_inflate(const char *); struct log_params { struct thread_data *td; unsigned long avg_msec; + unsigned long hist_msec; + int hist_coarseness; int log_type; int log_offset; + int log_prio; + int log_issue_time; int log_gz; int log_gz_store; int log_compress; @@ -227,13 +320,29 @@ struct log_params { static inline bool per_unit_log(struct io_log *log) { - return log && !log->avg_msec; + return log && (!log->avg_msec || log->log_gz || log->log_gz_store); +} + +static inline bool inline_log(struct io_log *log) +{ + return log->log_type == IO_LOG_TYPE_LAT || + log->log_type == IO_LOG_TYPE_CLAT || + log->log_type == IO_LOG_TYPE_SLAT; +} + +static inline void ipo_bytes_align(unsigned int replay_align, struct io_piece *ipo) +{ + if (!replay_align) + return; + + ipo->offset &= ~(replay_align - (uint64_t)1); } extern void finalize_logs(struct thread_data *td, bool); extern void setup_log(struct io_log **, struct log_params *, const char *); -extern void flush_log(struct io_log *, int); +extern void flush_log(struct io_log *, bool); extern void flush_samples(FILE *, void *, uint64_t); +extern uint64_t hist_sum(int, int, uint64_t *, uint64_t *); extern void free_log(struct io_log *); extern void fio_writeout_logs(bool); extern void td_writeout_logs(struct thread_data *, bool); @@ -241,7 +350,7 @@ extern int iolog_cur_flush(struct io_log *, struct io_logs *); static inline void init_ipo(struct io_piece *ipo) { - memset(ipo, 0, sizeof(*ipo)); + INIT_FLIST_HEAD(&ipo->list); INIT_FLIST_HEAD(&ipo->trim_list); }