Merge branch 'fix-randtrimwrite' of https://github.com/minwooim/fio
[fio.git] / iolog.h
... / ...
CommitLineData
1#ifndef FIO_IOLOG_H
2#define FIO_IOLOG_H
3
4#include <stdio.h>
5
6#include "lib/rbtree.h"
7#include "lib/ieee754.h"
8#include "flist.h"
9#include "ioengines.h"
10
11/*
12 * Use for maintaining statistics
13 */
14struct io_stat {
15 uint64_t max_val;
16 uint64_t min_val;
17 uint64_t samples;
18
19 fio_fp64_t mean;
20 fio_fp64_t S;
21};
22
23struct io_hist {
24 uint64_t samples;
25 unsigned long hist_last;
26 struct flist_head list;
27};
28
/*
 * Selects which value(s) a log sample reports: the average, the maximum,
 * or both.
 */
enum {
	IO_LOG_SAMPLE_AVG = 0,
	IO_LOG_SAMPLE_MAX,
	IO_LOG_SAMPLE_BOTH,
};
34
/*
 * Numeric payload of a sample: two 64-bit values.
 */
struct io_sample_value {
	uint64_t val0;
	uint64_t val1;
};

/*
 * Payload of a sample: either a pair of numeric values or a pointer to a
 * struct io_u_plat_entry. Only one member is valid at a time.
 */
union io_sample_data {
	struct io_sample_value val;
	struct io_u_plat_entry *plat_entry;
};

/*
 * Build a union io_sample_data by value.
 *
 * sample_val() sets val.val0; val.val1 is left zero because the remaining
 * members of a designated-initialised compound literal are zero-initialised.
 * sample_plat() stores the given plat entry pointer.
 */
#define sample_val(value)	((union io_sample_data) { .val.val0 = value })
#define sample_plat(plat)	((union io_sample_data) { .plat_entry = plat })
47
48/*
49 * A single data sample
50 */
51struct io_sample {
52 uint64_t time;
53 union io_sample_data data;
54 uint32_t __ddir;
55 uint16_t priority;
56 uint64_t bs;
57 uint64_t aux[];
58};
59
/*
 * Enumerate indexes of auxiliary log data in struct io_sample aux[] array
 */
enum {
	IOS_AUX_OFFSET_INDEX,
	IOS_AUX_ISSUE_TIME_INDEX,
};
67
/*
 * Log types, stored in io_log.log_type. Numbering starts at 1, so 0 is not
 * a valid log type.
 */
enum {
	IO_LOG_TYPE_LAT = 1,
	IO_LOG_TYPE_CLAT,
	IO_LOG_TYPE_SLAT,
	IO_LOG_TYPE_BW,
	IO_LOG_TYPE_IOPS,
	IO_LOG_TYPE_HIST,
};
76
/*
 * Default and maximum number of log entries; the maximum is 1024 times the
 * default.
 */
#define DEF_LOG_ENTRIES		1024
#define MAX_LOG_ENTRIES		(1024 * DEF_LOG_ENTRIES)
79
80struct io_logs {
81 struct flist_head list;
82 uint64_t nr_samples;
83 uint64_t max_samples;
84 void *log;
85};
86
87/*
88 * Dynamically growing data sample log
89 */
90struct io_log {
91 /*
92 * Entries already logged
93 */
94 struct flist_head io_logs;
95 uint32_t cur_log_max;
96
97 /*
98 * When the current log runs out of space, store events here until
99 * we have a chance to regrow
100 */
101 struct io_logs *pending;
102
103 unsigned int log_ddir_mask;
104
105 char *filename;
106
107 struct thread_data *td;
108
109 unsigned int log_type;
110
111 /*
112 * If we fail extending the log, stop collecting more entries.
113 */
114 bool disabled;
115
116 /*
117 * Log offsets
118 */
119 unsigned int log_offset;
120
121 /*
122 * Log I/O priorities
123 */
124 unsigned int log_prio;
125
126 /*
127 * Log I/O issuing time
128 */
129 unsigned int log_issue_time;
130
131 /*
132 * Max size of log entries before a chunk is compressed
133 */
134 unsigned int log_gz;
135
136 /*
137 * Don't deflate for storing, just store the compressed bits
138 */
139 unsigned int log_gz_store;
140
141 /*
142 * Windowed average, for logging single entries average over some
143 * period of time.
144 */
145 struct io_stat avg_window[DDIR_RWDIR_CNT];
146 unsigned long avg_msec;
147 unsigned long avg_last[DDIR_RWDIR_CNT];
148
149 /*
150 * Windowed latency histograms, for keeping track of when we need to
151 * save a copy of the histogram every approximately hist_msec
152 * milliseconds.
153 */
154 struct io_hist hist_window[DDIR_RWDIR_CNT];
155 unsigned long hist_msec;
156 unsigned int hist_coarseness;
157
158 pthread_mutex_t chunk_lock;
159 unsigned int chunk_seq;
160 struct flist_head chunk_list;
161
162 pthread_mutex_t deferred_free_lock;
163#define IOLOG_MAX_DEFER 8
164 void *deferred_items[IOLOG_MAX_DEFER];
165 unsigned int deferred;
166};
167
/*
 * If the upper bit is set, then we have the offset as well
 */
#define LOG_OFFSET_SAMPLE_BIT	0x80000000U
/*
 * If the bit following the upper bit is set, then we have the priority
 */
#define LOG_PRIO_SAMPLE_BIT	0x40000000U
/*
 * If the bit following the priority sample bit is set, we report both avg
 * and max
 */
#define LOG_AVG_MAX_SAMPLE_BIT	0x20000000U
/*
 * If the bit following AVG_MAX_SAMPLE_BIT is set, we report the issue time also
 */
#define LOG_ISSUE_TIME_SAMPLE_BIT	0x10000000U

/*
 * All flag bits that share the __ddir word with the data direction.
 */
#define LOG_SAMPLE_BITS	(LOG_OFFSET_SAMPLE_BIT | LOG_PRIO_SAMPLE_BIT |\
			 LOG_AVG_MAX_SAMPLE_BIT |\
			 LOG_ISSUE_TIME_SAMPLE_BIT)
/*
 * Data direction of a sample with the flag bits masked off. 'io' is a
 * pointer to an object that has a __ddir member.
 */
#define io_sample_ddir(io)	((io)->__ddir & ~LOG_SAMPLE_BITS)
189
190static inline void io_sample_set_ddir(struct io_log *log,
191 struct io_sample *io,
192 enum fio_ddir ddir)
193{
194 io->__ddir = ddir | log->log_ddir_mask;
195}
196
197static inline size_t __log_entry_sz(bool log_offset, bool log_issue_time)
198{
199 size_t ret = sizeof(struct io_sample);
200
201 if (log_offset)
202 ret += sizeof(uint64_t);
203
204 if (log_issue_time)
205 ret += sizeof(uint64_t);
206
207 return ret;
208}
209
210static inline size_t log_entry_sz(struct io_log *log)
211{
212 return __log_entry_sz(log->log_offset, log->log_issue_time);
213}
214
215static inline size_t log_sample_sz(struct io_log *log, struct io_logs *cur_log)
216{
217 return cur_log->nr_samples * log_entry_sz(log);
218}
219
/*
 * Return a pointer to entry number 'sample' in the raw buffer 'samples'.
 *
 * Entries are variable-sized (see __log_entry_sz()), so the buffer cannot
 * be indexed as a struct io_sample array; the byte offset is computed
 * explicitly instead. No bounds checking is done here.
 */
static inline struct io_sample *__get_sample(void *samples, bool log_offset,
					     bool log_issue_time,
					     uint64_t sample)
{
	uint64_t sample_offset = sample *
		__log_entry_sz(log_offset, log_issue_time);
	return (struct io_sample *) ((char *) samples + sample_offset);
}
228
/*
 * Log buffer management; these functions are only declared in this header.
 */
struct io_logs *iolog_cur_log(struct io_log *);
uint64_t iolog_nr_samples(struct io_log *);
void regrow_logs(struct thread_data *);
void regrow_agg_logs(void);
233
234static inline struct io_sample *get_sample(struct io_log *iolog,
235 struct io_logs *cur_log,
236 uint64_t sample)
237{
238 return __get_sample(cur_log->log,
239 iolog->log_offset, iolog->log_issue_time, sample);
240}
241
/*
 * Bit flags with distinct power-of-two values, so they can be OR'ed
 * together.
 * NOTE(review): presumably stored in io_piece.flags - confirm against the
 * users of struct io_piece.
 */
enum {
	IP_F_ONRB	= 1,
	IP_F_ONLIST	= 2,
	IP_F_TRIMMED	= 4,
	IP_F_IN_FLIGHT	= 8,
};
248
249/*
250 * When logging io actions, this matches a single sent io_u
251 */
252struct io_piece {
253 union {
254 struct fio_rb_node rb_node;
255 struct flist_head list;
256 };
257 struct flist_head trim_list;
258 union {
259 int fileno;
260 struct fio_file *file;
261 };
262 unsigned long long offset;
263 unsigned short numberio;
264 unsigned long len;
265 unsigned int flags;
266 enum fio_ddir ddir;
267 unsigned long delay;
268 unsigned int file_action;
269};
270
/*
 * Log exports
 *
 * File actions passed to log_file().
 */
enum file_log_act {
	FIO_LOG_ADD_FILE,
	FIO_LOG_OPEN_FILE,
	FIO_LOG_CLOSE_FILE,
	FIO_LOG_UNLINK_FILE,
};
280
281struct io_u;
282extern int __must_check read_iolog_get(struct thread_data *, struct io_u *);
283extern void log_io_u(const struct thread_data *, const struct io_u *);
284extern void log_file(struct thread_data *, struct fio_file *, enum file_log_act);
285extern bool __must_check init_iolog(struct thread_data *td);
286extern void log_io_piece(struct thread_data *, struct io_u *);
287extern void unlog_io_piece(struct thread_data *, struct io_u *);
288extern void trim_io_piece(const struct io_u *);
289extern void queue_io_piece(struct thread_data *, struct io_piece *);
290extern void prune_io_piece_log(struct thread_data *);
291extern void write_iolog_close(struct thread_data *);
292int64_t iolog_items_to_fetch(struct thread_data *td);
293extern int iolog_compress_init(struct thread_data *, struct sk_out *);
294extern void iolog_compress_exit(struct thread_data *);
295extern size_t log_chunk_sizes(struct io_log *);
296extern int init_io_u_buffers(struct thread_data *);
297extern unsigned long long delay_since_ttime(const struct thread_data *,
298 unsigned long long);
299
300#ifdef CONFIG_ZLIB
301extern int iolog_file_inflate(const char *);
302#endif
303
/*
 * Logging
 *
 * Parameter bundle handed to setup_log(). Most members share a name with
 * a member of struct io_log.
 */
struct log_params {
	struct thread_data *td;
	unsigned long avg_msec;
	unsigned long hist_msec;
	int hist_coarseness;
	int log_type;
	int log_offset;
	int log_prio;
	int log_issue_time;
	int log_gz;
	int log_gz_store;
	int log_compress;
};
320
321static inline bool per_unit_log(struct io_log *log)
322{
323 return log && (!log->avg_msec || log->log_gz || log->log_gz_store);
324}
325
326static inline bool inline_log(struct io_log *log)
327{
328 return log->log_type == IO_LOG_TYPE_LAT ||
329 log->log_type == IO_LOG_TYPE_CLAT ||
330 log->log_type == IO_LOG_TYPE_SLAT;
331}
332
333static inline void ipo_bytes_align(unsigned int replay_align, struct io_piece *ipo)
334{
335 if (!replay_align)
336 return;
337
338 ipo->offset &= ~(replay_align - (uint64_t)1);
339}
340
/*
 * Log setup, flushing and teardown; these functions are only declared in
 * this header.
 */
extern void finalize_logs(struct thread_data *td, bool);
extern void setup_log(struct io_log **, struct log_params *, const char *);
extern void flush_log(struct io_log *, bool);
extern void flush_samples(FILE *, void *, uint64_t);
extern uint64_t hist_sum(int, int, uint64_t *, uint64_t *);
extern void free_log(struct io_log *);
extern void fio_writeout_logs(bool);
extern void td_writeout_logs(struct thread_data *, bool);
extern int iolog_cur_flush(struct io_log *, struct io_logs *);
350
351static inline void init_ipo(struct io_piece *ipo)
352{
353 INIT_FLIST_HEAD(&ipo->list);
354 INIT_FLIST_HEAD(&ipo->trim_list);
355}
356
357struct iolog_compress {
358 struct flist_head list;
359 void *buf;
360 size_t len;
361 unsigned int seq;
362};
363
364#endif