Commit | Line | Data |
---|---|---|
c31092b8 | 1 | #include <signal.h> |
df9bd7d4 | 2 | #include <unistd.h> |
696378af BVA |
3 | #ifdef CONFIG_HAVE_TIMERFD_CREATE |
4 | #include <sys/timerfd.h> | |
5 | #endif | |
4f37732a BVA |
6 | #ifdef CONFIG_VALGRIND_DEV |
7 | #include <valgrind/drd.h> | |
8 | #else | |
9 | #define DRD_IGNORE_VAR(x) do { } while (0) | |
10 | #endif | |
11 | ||
3d0d549a BP |
12 | #ifdef WIN32 |
13 | #include "os/os-windows.h" | |
14 | #endif | |
15 | ||
a39fb9ea JA |
16 | #include "fio.h" |
17 | #include "smalloc.h" | |
18 | #include "helper_thread.h" | |
16e56d25 | 19 | #include "steadystate.h" |
ae626d4e | 20 | #include "pshared.h" |
a39fb9ea | 21 | |
df9bd7d4 | 22 | static int sleep_accuracy_ms; |
696378af | 23 | static int timerfd = -1; |
df9bd7d4 | 24 | |
52a552e2 BVA |
25 | enum action { |
26 | A_EXIT = 1, | |
27 | A_RESET = 2, | |
28 | A_DO_STAT = 3, | |
29 | }; | |
30 | ||
a39fb9ea JA |
31 | static struct helper_data { |
32 | volatile int exit; | |
52a552e2 | 33 | int pipe[2]; /* 0: read end; 1: write end. */ |
a39fb9ea JA |
34 | struct sk_out *sk_out; |
35 | pthread_t thread; | |
971caeb1 | 36 | struct fio_sem *startup_sem; |
a39fb9ea JA |
37 | } *helper_data; |
38 | ||
df9bd7d4 BVA |
39 | struct interval_timer { |
40 | const char *name; | |
41 | struct timespec expires; | |
42 | uint32_t interval_ms; | |
43 | int (*func)(void); | |
44 | }; | |
45 | ||
a39fb9ea JA |
46 | void helper_thread_destroy(void) |
47 | { | |
998e9ebb BVA |
48 | if (!helper_data) |
49 | return; | |
50 | ||
52a552e2 BVA |
51 | close(helper_data->pipe[0]); |
52 | close(helper_data->pipe[1]); | |
a39fb9ea JA |
53 | sfree(helper_data); |
54 | } | |
55 | ||
52a552e2 BVA |
56 | #ifdef _WIN32 |
57 | static void sock_init(void) | |
a39fb9ea | 58 | { |
52a552e2 BVA |
59 | WSADATA wsaData; |
60 | int res; | |
a39fb9ea | 61 | |
52a552e2 BVA |
62 | /* It is allowed to call WSAStartup() more than once. */ |
63 | res = WSAStartup(MAKEWORD(2, 2), &wsaData); | |
64 | assert(res == 0); | |
65 | } | |
a39fb9ea | 66 | |
52a552e2 BVA |
67 | static int make_nonblocking(int fd) |
68 | { | |
69 | unsigned long arg = 1; | |
dda11987 | 70 | |
52a552e2 | 71 | return ioctlsocket(fd, FIONBIO, &arg); |
a39fb9ea JA |
72 | } |
73 | ||
52a552e2 BVA |
74 | static int write_to_pipe(int fd, const void *buf, size_t len) |
75 | { | |
76 | return send(fd, buf, len, 0); | |
77 | } | |
78 | ||
79 | static int read_from_pipe(int fd, void *buf, size_t len) | |
80 | { | |
81 | return recv(fd, buf, len, 0); | |
82 | } | |
83 | #else | |
84 | static void sock_init(void) | |
85 | { | |
86 | } | |
87 | ||
88 | static int make_nonblocking(int fd) | |
89 | { | |
90 | return fcntl(fd, F_SETFL, O_NONBLOCK); | |
91 | } | |
92 | ||
93 | static int write_to_pipe(int fd, const void *buf, size_t len) | |
94 | { | |
95 | return write(fd, buf, len); | |
96 | } | |
97 | ||
98 | static int read_from_pipe(int fd, void *buf, size_t len) | |
99 | { | |
100 | return read(fd, buf, len); | |
101 | } | |
102 | #endif | |
103 | ||
2575407f BVA |
104 | static void block_signals(void) |
105 | { | |
106 | #ifdef HAVE_PTHREAD_SIGMASK | |
107 | sigset_t sigmask; | |
108 | ||
109 | ret = pthread_sigmask(SIG_UNBLOCK, NULL, &sigmask); | |
110 | assert(ret == 0); | |
111 | ret = pthread_sigmask(SIG_BLOCK, &sigmask, NULL); | |
112 | assert(ret == 0); | |
113 | #endif | |
114 | } | |
115 | ||
52a552e2 | 116 | static void submit_action(enum action a) |
a39fb9ea | 117 | { |
52a552e2 BVA |
118 | const char data = a; |
119 | int ret; | |
120 | ||
dda11987 JA |
121 | if (!helper_data) |
122 | return; | |
123 | ||
52a552e2 BVA |
124 | ret = write_to_pipe(helper_data->pipe[1], &data, sizeof(data)); |
125 | assert(ret == 1); | |
126 | } | |
127 | ||
128 | void helper_reset(void) | |
129 | { | |
130 | submit_action(A_RESET); | |
131 | } | |
132 | ||
133 | /* | |
134 | * May be invoked in signal handler context and hence must only call functions | |
135 | * that are async-signal-safe. See also | |
136 | * https://pubs.opengroup.org/onlinepubs/9699919799/functions/V2_chap02.html#tag_15_04_03. | |
137 | */ | |
138 | void helper_do_stat(void) | |
139 | { | |
140 | submit_action(A_DO_STAT); | |
a39fb9ea JA |
141 | } |
142 | ||
143 | bool helper_should_exit(void) | |
144 | { | |
145 | if (!helper_data) | |
146 | return true; | |
147 | ||
148 | return helper_data->exit; | |
149 | } | |
150 | ||
151 | void helper_thread_exit(void) | |
152 | { | |
998e9ebb BVA |
153 | if (!helper_data) |
154 | return; | |
155 | ||
a39fb9ea | 156 | helper_data->exit = 1; |
52a552e2 BVA |
157 | submit_action(A_EXIT); |
158 | pthread_join(helper_data->thread, NULL); | |
a39fb9ea JA |
159 | } |
160 | ||
df9bd7d4 BVA |
161 | /* Resets timers and returns the time in milliseconds until the next event. */ |
162 | static int reset_timers(struct interval_timer timer[], int num_timers, | |
163 | struct timespec *now) | |
164 | { | |
165 | uint32_t msec_to_next_event = INT_MAX; | |
166 | int i; | |
167 | ||
168 | for (i = 0; i < num_timers; ++i) { | |
169 | timer[i].expires = *now; | |
170 | timespec_add_msec(&timer[i].expires, timer[i].interval_ms); | |
171 | msec_to_next_event = min_not_zero(msec_to_next_event, | |
172 | timer[i].interval_ms); | |
173 | } | |
174 | ||
175 | return msec_to_next_event; | |
176 | } | |
177 | ||
335210df BVA |
178 | /* |
179 | * Waits for an action from fd during at least timeout_ms. `fd` must be in | |
180 | * non-blocking mode. | |
181 | */ | |
182 | static uint8_t wait_for_action(int fd, unsigned int timeout_ms) | |
183 | { | |
184 | struct timeval timeout = { | |
185 | .tv_sec = timeout_ms / 1000, | |
186 | .tv_usec = (timeout_ms % 1000) * 1000, | |
187 | }; | |
188 | fd_set rfds, efds; | |
189 | uint8_t action = 0; | |
696378af | 190 | uint64_t exp; |
335210df BVA |
191 | int res; |
192 | ||
193 | res = read_from_pipe(fd, &action, sizeof(action)); | |
194 | if (res > 0 || timeout_ms == 0) | |
195 | return action; | |
196 | FD_ZERO(&rfds); | |
197 | FD_SET(fd, &rfds); | |
198 | FD_ZERO(&efds); | |
199 | FD_SET(fd, &efds); | |
696378af BVA |
200 | #ifdef CONFIG_HAVE_TIMERFD_CREATE |
201 | { | |
202 | /* | |
203 | * If the timer frequency is 100 Hz, select() will round up | |
204 | * `timeout` to the next multiple of 1 / 100 Hz = 10 ms. Hence | |
205 | * use a high-resolution timer if possible to increase | |
206 | * select() timeout accuracy. | |
207 | */ | |
208 | struct itimerspec delta = {}; | |
209 | ||
210 | delta.it_value.tv_sec = timeout.tv_sec; | |
211 | delta.it_value.tv_nsec = timeout.tv_usec * 1000; | |
212 | res = timerfd_settime(timerfd, 0, &delta, NULL); | |
213 | assert(res == 0); | |
214 | FD_SET(timerfd, &rfds); | |
215 | } | |
216 | #endif | |
217 | res = select(max(fd, timerfd) + 1, &rfds, NULL, &efds, | |
218 | timerfd >= 0 ? NULL : &timeout); | |
335210df BVA |
219 | if (res < 0) { |
220 | log_err("fio: select() call in helper thread failed: %s", | |
221 | strerror(errno)); | |
222 | return A_EXIT; | |
223 | } | |
224 | if (FD_ISSET(fd, &rfds)) | |
225 | read_from_pipe(fd, &action, sizeof(action)); | |
696378af BVA |
226 | if (timerfd >= 0 && FD_ISSET(timerfd, &rfds)) { |
227 | res = read(timerfd, &exp, sizeof(exp)); | |
228 | assert(res == sizeof(exp)); | |
229 | } | |
335210df BVA |
230 | return action; |
231 | } | |
232 | ||
df9bd7d4 BVA |
233 | /* |
234 | * Verify whether or not timer @it has expired. If timer @it has expired, call | |
235 | * @it->func(). @now is the current time. @msec_to_next_event is an | |
236 | * input/output parameter that represents the time until the next event. | |
237 | */ | |
238 | static int eval_timer(struct interval_timer *it, const struct timespec *now, | |
239 | unsigned int *msec_to_next_event) | |
3da71e37 | 240 | { |
df9bd7d4 BVA |
241 | int64_t delta_ms; |
242 | bool expired; | |
243 | ||
244 | /* interval == 0 means that the timer is disabled. */ | |
245 | if (it->interval_ms == 0) | |
246 | return 0; | |
247 | ||
248 | delta_ms = rel_time_since(now, &it->expires); | |
249 | expired = delta_ms <= sleep_accuracy_ms; | |
250 | if (expired) { | |
251 | timespec_add_msec(&it->expires, it->interval_ms); | |
252 | delta_ms = rel_time_since(now, &it->expires); | |
253 | if (delta_ms < it->interval_ms - sleep_accuracy_ms || | |
254 | delta_ms > it->interval_ms + sleep_accuracy_ms) { | |
255 | dprint(FD_HELPERTHREAD, | |
256 | "%s: delta = %" PRIi64 " <> %u. Clock jump?\n", | |
257 | it->name, delta_ms, it->interval_ms); | |
258 | delta_ms = it->interval_ms; | |
259 | it->expires = *now; | |
260 | timespec_add_msec(&it->expires, it->interval_ms); | |
261 | } | |
262 | } | |
263 | *msec_to_next_event = min((unsigned int)delta_ms, *msec_to_next_event); | |
264 | return expired ? it->func() : 0; | |
3da71e37 VF |
265 | } |
266 | ||
a39fb9ea JA |
267 | static void *helper_thread_main(void *data) |
268 | { | |
269 | struct helper_data *hd = data; | |
df9bd7d4 BVA |
270 | unsigned int msec_to_next_event, next_log; |
271 | struct interval_timer timer[] = { | |
272 | { | |
273 | .name = "disk_util", | |
274 | .interval_ms = DISK_UTIL_MSEC, | |
275 | .func = update_io_ticks, | |
276 | }, | |
277 | { | |
278 | .name = "status_interval", | |
279 | .interval_ms = status_interval, | |
280 | .func = __show_running_run_stats, | |
281 | }, | |
282 | { | |
283 | .name = "steadystate", | |
90e678ba | 284 | .interval_ms = steadystate_enabled ? ss_check_interval : |
df9bd7d4 BVA |
285 | 0, |
286 | .func = steadystate_check, | |
287 | } | |
288 | }; | |
289 | struct timespec ts; | |
3d0d549a BP |
290 | long clk_tck; |
291 | int ret = 0; | |
df9bd7d4 | 292 | |
3d0d549a BP |
293 | os_clk_tck(&clk_tck); |
294 | ||
295 | dprint(FD_HELPERTHREAD, "clk_tck = %ld\n", clk_tck); | |
df9bd7d4 BVA |
296 | assert(clk_tck > 0); |
297 | sleep_accuracy_ms = (1000 + clk_tck - 1) / clk_tck; | |
a39fb9ea | 298 | |
696378af BVA |
299 | #ifdef CONFIG_HAVE_TIMERFD_CREATE |
300 | timerfd = timerfd_create(CLOCK_MONOTONIC, TFD_NONBLOCK); | |
301 | assert(timerfd >= 0); | |
302 | sleep_accuracy_ms = 1; | |
303 | #endif | |
304 | ||
a39fb9ea JA |
305 | sk_out_assign(hd->sk_out); |
306 | ||
c31092b8 | 307 | /* Let another thread handle signals. */ |
2575407f | 308 | block_signals(); |
c31092b8 | 309 | |
69212fc4 | 310 | fio_get_mono_time(&ts); |
59f94d26 | 311 | msec_to_next_event = reset_timers(timer, FIO_ARRAY_SIZE(timer), &ts); |
a39fb9ea | 312 | |
971caeb1 | 313 | fio_sem_up(hd->startup_sem); |
a39fb9ea | 314 | |
a39fb9ea | 315 | while (!ret && !hd->exit) { |
335210df | 316 | uint8_t action; |
df9bd7d4 | 317 | int i; |
335210df BVA |
318 | |
319 | action = wait_for_action(hd->pipe[0], msec_to_next_event); | |
320 | if (action == A_EXIT) | |
321 | break; | |
a39fb9ea | 322 | |
69212fc4 | 323 | fio_get_mono_time(&ts); |
a39fb9ea | 324 | |
df9bd7d4 BVA |
325 | msec_to_next_event = INT_MAX; |
326 | ||
327 | if (action == A_RESET) | |
328 | msec_to_next_event = reset_timers(timer, | |
59f94d26 | 329 | FIO_ARRAY_SIZE(timer), &ts); |
a39fb9ea | 330 | |
59f94d26 | 331 | for (i = 0; i < FIO_ARRAY_SIZE(timer); ++i) |
df9bd7d4 | 332 | ret = eval_timer(&timer[i], &ts, &msec_to_next_event); |
a39fb9ea | 333 | |
52a552e2 | 334 | if (action == A_DO_STAT) |
a39fb9ea | 335 | __show_running_run_stats(); |
a39fb9ea JA |
336 | |
337 | next_log = calc_log_samples(); | |
338 | if (!next_log) | |
339 | next_log = DISK_UTIL_MSEC; | |
340 | ||
3da71e37 | 341 | msec_to_next_event = min(next_log, msec_to_next_event); |
df9bd7d4 BVA |
342 | dprint(FD_HELPERTHREAD, |
343 | "next_log: %u, msec_to_next_event: %u\n", | |
344 | next_log, msec_to_next_event); | |
a39fb9ea JA |
345 | |
346 | if (!is_backend) | |
347 | print_thread_status(); | |
348 | } | |
349 | ||
696378af BVA |
350 | if (timerfd >= 0) { |
351 | close(timerfd); | |
352 | timerfd = -1; | |
353 | } | |
354 | ||
a39fb9ea JA |
355 | fio_writeout_logs(false); |
356 | ||
357 | sk_out_drop(); | |
358 | return NULL; | |
359 | } | |
360 | ||
52a552e2 BVA |
361 | /* |
362 | * Connect two sockets to each other to emulate the pipe() system call on Windows. | |
363 | */ | |
364 | int pipe_over_loopback(int fd[2]) | |
365 | { | |
366 | struct sockaddr_in addr = { .sin_family = AF_INET }; | |
367 | socklen_t len = sizeof(addr); | |
368 | int res; | |
369 | ||
370 | addr.sin_addr.s_addr = htonl(INADDR_LOOPBACK); | |
371 | ||
372 | sock_init(); | |
373 | ||
374 | fd[0] = socket(AF_INET, SOCK_STREAM, 0); | |
375 | if (fd[0] < 0) | |
376 | goto err; | |
377 | fd[1] = socket(AF_INET, SOCK_STREAM, 0); | |
378 | if (fd[1] < 0) | |
379 | goto close_fd_0; | |
380 | res = bind(fd[0], (struct sockaddr *)&addr, len); | |
381 | if (res < 0) | |
382 | goto close_fd_1; | |
383 | res = getsockname(fd[0], (struct sockaddr *)&addr, &len); | |
384 | if (res < 0) | |
385 | goto close_fd_1; | |
386 | res = listen(fd[0], 1); | |
387 | if (res < 0) | |
388 | goto close_fd_1; | |
389 | res = connect(fd[1], (struct sockaddr *)&addr, len); | |
390 | if (res < 0) | |
391 | goto close_fd_1; | |
392 | res = accept(fd[0], NULL, NULL); | |
393 | if (res < 0) | |
394 | goto close_fd_1; | |
395 | close(fd[0]); | |
396 | fd[0] = res; | |
397 | return 0; | |
398 | ||
399 | close_fd_1: | |
400 | close(fd[1]); | |
401 | ||
402 | close_fd_0: | |
403 | close(fd[0]); | |
404 | ||
405 | err: | |
406 | return -1; | |
407 | } | |
408 | ||
971caeb1 | 409 | int helper_thread_create(struct fio_sem *startup_sem, struct sk_out *sk_out) |
a39fb9ea JA |
410 | { |
411 | struct helper_data *hd; | |
412 | int ret; | |
413 | ||
b3090ff4 | 414 | hd = scalloc(1, sizeof(*hd)); |
a39fb9ea JA |
415 | |
416 | setup_disk_util(); | |
16e56d25 | 417 | steadystate_setup(); |
a39fb9ea JA |
418 | |
419 | hd->sk_out = sk_out; | |
34febb23 | 420 | |
52a552e2 BVA |
421 | #if defined(CONFIG_PIPE2) |
422 | ret = pipe2(hd->pipe, O_CLOEXEC); | |
423 | #elif defined(CONFIG_PIPE) | |
424 | ret = pipe(hd->pipe); | |
425 | #else | |
426 | ret = pipe_over_loopback(hd->pipe); | |
427 | #endif | |
34febb23 | 428 | if (ret) |
f9e5b5ee | 429 | return 1; |
34febb23 | 430 | |
52a552e2 BVA |
431 | ret = make_nonblocking(hd->pipe[0]); |
432 | assert(ret >= 0); | |
433 | ||
971caeb1 | 434 | hd->startup_sem = startup_sem; |
a39fb9ea | 435 | |
4f37732a BVA |
436 | DRD_IGNORE_VAR(helper_data); |
437 | ||
a39fb9ea JA |
438 | ret = pthread_create(&hd->thread, NULL, helper_thread_main, hd); |
439 | if (ret) { | |
440 | log_err("Can't create helper thread: %s\n", strerror(ret)); | |
441 | return 1; | |
442 | } | |
443 | ||
444 | helper_data = hd; | |
445 | ||
971caeb1 BVA |
446 | dprint(FD_MUTEX, "wait on startup_sem\n"); |
447 | fio_sem_down(startup_sem); | |
448 | dprint(FD_MUTEX, "done waiting on startup_sem\n"); | |
a39fb9ea JA |
449 | return 0; |
450 | } |