client: pass back server side error to client exit value
[fio.git] / client.c
CommitLineData
132159a5
JA
1#include <stdio.h>
2#include <stdlib.h>
3#include <unistd.h>
4#include <limits.h>
5#include <errno.h>
6#include <fcntl.h>
7#include <sys/poll.h>
8#include <sys/types.h>
9#include <sys/stat.h>
10#include <sys/wait.h>
d05c4a03 11#include <sys/socket.h>
87aa8f19 12#include <sys/un.h>
132159a5
JA
13#include <netinet/in.h>
14#include <arpa/inet.h>
15#include <netdb.h>
9e22ecb0 16#include <signal.h>
132159a5
JA
17
18#include "fio.h"
19#include "server.h"
b66570dc 20#include "flist.h"
3c5f57e3 21#include "hash.h"
132159a5 22
82c1ed38
JA
23struct client_eta {
24 struct jobs_eta eta;
25 unsigned int pending;
26};
27
b66570dc
JA
28struct fio_client {
29 struct flist_head list;
bebe6398 30 struct flist_head hash_list;
3f3a4542 31 struct flist_head arg_list;
b66570dc 32 struct sockaddr_in addr;
87aa8f19 33 struct sockaddr_un addr_un;
b66570dc 34 char *hostname;
bebe6398 35 int port;
b66570dc 36 int fd;
81179eec 37
b5296ddb
JA
38 char *name;
39
81179eec 40 int state;
af9c9fb3 41
17dd1764 42 int skip_newline;
87aa8f19 43 int is_sock;
d09a64a0 44 int disk_stats_shown;
11e950bd
JA
45 unsigned int jobs;
46 int error;
82c1ed38
JA
47
48 struct flist_head eta_list;
49 struct client_eta *eta_in_flight;
81179eec 50
89c1707c
JA
51 struct flist_head cmd_list;
52
81179eec
JA
53 uint16_t argc;
54 char **argv;
55};
56
/* Time the last ETA request round was started */
static struct timeval eta_tv;

/* Values stored in fio_client->state */
enum {
	Client_created		= 0,
	Client_connected	= 1,
	Client_started		= 2,
	Client_running		= 3,
	Client_stopped		= 4,
	Client_exited		= 5,
};
67
68static FLIST_HEAD(client_list);
82c1ed38 69static FLIST_HEAD(eta_list);
b66570dc 70
3f3a4542
JA
71static FLIST_HEAD(arg_list);
72
37f0c1ae
JA
73static struct thread_stat client_ts;
74static struct group_run_stats client_gs;
75static int sum_stat_clients;
76static int sum_stat_nr;
77
3c5f57e3
JA
78#define FIO_CLIENT_HASH_BITS 7
79#define FIO_CLIENT_HASH_SZ (1 << FIO_CLIENT_HASH_BITS)
80#define FIO_CLIENT_HASH_MASK (FIO_CLIENT_HASH_SZ - 1)
bebe6398 81static struct flist_head client_hash[FIO_CLIENT_HASH_SZ];
3c5f57e3 82
e951bdc4 83static int handle_client(struct fio_client *client);
82c1ed38 84static void dec_jobs_eta(struct client_eta *eta);
0b8f30a5 85
bebe6398 86static void fio_client_add_hash(struct fio_client *client)
3c5f57e3
JA
87{
88 int bucket = hash_long(client->fd, FIO_CLIENT_HASH_BITS);
89
90 bucket &= FIO_CLIENT_HASH_MASK;
bebe6398 91 flist_add(&client->hash_list, &client_hash[bucket]);
3c5f57e3
JA
92}
93
bebe6398 94static void fio_client_remove_hash(struct fio_client *client)
3c5f57e3 95{
bebe6398
JA
96 if (!flist_empty(&client->hash_list))
97 flist_del_init(&client->hash_list);
3c5f57e3
JA
98}
99
100static void fio_init fio_client_hash_init(void)
101{
102 int i;
103
bebe6398
JA
104 for (i = 0; i < FIO_CLIENT_HASH_SZ; i++)
105 INIT_FLIST_HEAD(&client_hash[i]);
3c5f57e3
JA
106}
107
b66570dc
JA
108static struct fio_client *find_client_by_fd(int fd)
109{
3c5f57e3 110 int bucket = hash_long(fd, FIO_CLIENT_HASH_BITS) & FIO_CLIENT_HASH_MASK;
b66570dc
JA
111 struct fio_client *client;
112 struct flist_head *entry;
113
bebe6398
JA
114 flist_for_each(entry, &client_hash[bucket]) {
115 client = flist_entry(entry, struct fio_client, hash_list);
b66570dc
JA
116
117 if (client->fd == fd)
118 return client;
119 }
120
121 return NULL;
122}
123
b66570dc
JA
124static void remove_client(struct fio_client *client)
125{
39e8e016 126 dprint(FD_NET, "client: removed <%s>\n", client->hostname);
b66570dc 127 flist_del(&client->list);
3c5f57e3 128
bebe6398 129 fio_client_remove_hash(client);
81179eec 130
82c1ed38
JA
131 if (!flist_empty(&client->eta_list)) {
132 flist_del_init(&client->eta_list);
133 dec_jobs_eta(client->eta_in_flight);
134 }
af9c9fb3 135
b66570dc 136 free(client->hostname);
81179eec
JA
137 if (client->argv)
138 free(client->argv);
b5296ddb
JA
139 if (client->name)
140 free(client->name);
81179eec 141
b66570dc 142 free(client);
3c5f57e3 143 nr_clients--;
5fd0acbd 144 sum_stat_clients--;
b66570dc 145}
132159a5 146
fa2ea806
JA
147static void __fio_client_add_cmd_option(struct fio_client *client,
148 const char *opt)
81179eec 149{
39e8e016
JA
150 int index;
151
152 index = client->argc++;
81179eec 153 client->argv = realloc(client->argv, sizeof(char *) * client->argc);
39e8e016
JA
154 client->argv[index] = strdup(opt);
155 dprint(FD_NET, "client: add cmd %d: %s\n", index, opt);
81179eec
JA
156}
157
fa2ea806 158void fio_client_add_cmd_option(void *cookie, const char *opt)
81179eec 159{
bebe6398 160 struct fio_client *client = cookie;
3f3a4542 161 struct flist_head *entry;
81179eec 162
bebe6398 163 if (!client || !opt)
fa2ea806 164 return;
81179eec 165
fa2ea806 166 __fio_client_add_cmd_option(client, opt);
3f3a4542
JA
167
168 /*
169 * Duplicate arguments to shared client group
170 */
171 flist_for_each(entry, &arg_list) {
172 client = flist_entry(entry, struct fio_client, arg_list);
173
174 __fio_client_add_cmd_option(client, opt);
175 }
81179eec
JA
176}
177
bebe6398 178int fio_client_add(const char *hostname, void **cookie)
132159a5 179{
3f3a4542 180 struct fio_client *existing = *cookie;
b66570dc 181 struct fio_client *client;
132159a5 182
3f3a4542
JA
183 if (existing) {
184 /*
185 * We always add our "exec" name as the option, hence 1
186 * means empty.
187 */
188 if (existing->argc == 1)
189 flist_add_tail(&existing->arg_list, &arg_list);
190 else {
191 while (!flist_empty(&arg_list))
192 flist_del_init(arg_list.next);
193 }
194 }
195
b66570dc 196 client = malloc(sizeof(*client));
a37f69b7 197 memset(client, 0, sizeof(*client));
81179eec 198
3c5f57e3 199 INIT_FLIST_HEAD(&client->list);
bebe6398 200 INIT_FLIST_HEAD(&client->hash_list);
3f3a4542 201 INIT_FLIST_HEAD(&client->arg_list);
82c1ed38 202 INIT_FLIST_HEAD(&client->eta_list);
89c1707c 203 INIT_FLIST_HEAD(&client->cmd_list);
3c5f57e3 204
bebe6398
JA
205 if (fio_server_parse_string(hostname, &client->hostname,
206 &client->is_sock, &client->port,
207 &client->addr.sin_addr))
208 return -1;
87aa8f19 209
bebe6398 210 client->fd = -1;
3c5f57e3 211
81179eec
JA
212 __fio_client_add_cmd_option(client, "fio");
213
a37f69b7
JA
214 flist_add(&client->list, &client_list);
215 nr_clients++;
bebe6398
JA
216 dprint(FD_NET, "client: added <%s>\n", client->hostname);
217 *cookie = client;
218 return 0;
a37f69b7
JA
219}
220
87aa8f19 221static int fio_client_connect_ip(struct fio_client *client)
a37f69b7
JA
222{
223 int fd;
132159a5 224
b66570dc 225 client->addr.sin_family = AF_INET;
bebe6398 226 client->addr.sin_port = htons(client->port);
132159a5
JA
227
228 fd = socket(AF_INET, SOCK_STREAM, 0);
229 if (fd < 0) {
230 log_err("fio: socket: %s\n", strerror(errno));
87aa8f19 231 return -1;
132159a5
JA
232 }
233
b66570dc 234 if (connect(fd, (struct sockaddr *) &client->addr, sizeof(client->addr)) < 0) {
132159a5 235 log_err("fio: connect: %s\n", strerror(errno));
a7de0a11
JA
236 log_err("fio: failed to connect to %s:%u\n", client->hostname,
237 client->port);
b94cba47 238 close(fd);
87aa8f19
JA
239 return -1;
240 }
241
242 return fd;
243}
244
245static int fio_client_connect_sock(struct fio_client *client)
246{
247 struct sockaddr_un *addr = &client->addr_un;
248 fio_socklen_t len;
249 int fd;
250
251 memset(addr, 0, sizeof(*addr));
252 addr->sun_family = AF_UNIX;
253 strcpy(addr->sun_path, client->hostname);
254
255 fd = socket(AF_UNIX, SOCK_STREAM, 0);
256 if (fd < 0) {
257 log_err("fio: socket: %s\n", strerror(errno));
258 return -1;
259 }
260
261 len = sizeof(addr->sun_family) + strlen(addr->sun_path) + 1;
262 if (connect(fd, (struct sockaddr *) addr, len) < 0) {
263 log_err("fio: connect; %s\n", strerror(errno));
b94cba47 264 close(fd);
87aa8f19 265 return -1;
132159a5
JA
266 }
267
87aa8f19
JA
268 return fd;
269}
270
271static int fio_client_connect(struct fio_client *client)
272{
273 int fd;
274
275 dprint(FD_NET, "client: connect to host %s\n", client->hostname);
276
87aa8f19
JA
277 if (client->is_sock)
278 fd = fio_client_connect_sock(client);
279 else
280 fd = fio_client_connect_ip(client);
281
89c1707c
JA
282 dprint(FD_NET, "client: %s connected %d\n", client->hostname, fd);
283
87aa8f19
JA
284 if (fd < 0)
285 return 1;
286
b66570dc 287 client->fd = fd;
bebe6398 288 fio_client_add_hash(client);
81179eec 289 client->state = Client_connected;
132159a5
JA
290 return 0;
291}
292
cc0df00a
JA
293void fio_clients_terminate(void)
294{
295 struct flist_head *entry;
296 struct fio_client *client;
297
60efd14e
JA
298 dprint(FD_NET, "client: terminate clients\n");
299
cc0df00a
JA
300 flist_for_each(entry, &client_list) {
301 client = flist_entry(entry, struct fio_client, list);
302
89c1707c 303 fio_net_send_simple_cmd(client->fd, FIO_NET_CMD_QUIT, 0, NULL);
cc0df00a
JA
304 }
305}
306
307static void sig_int(int sig)
308{
bebe6398 309 dprint(FD_NET, "client: got signal %d\n", sig);
cc0df00a
JA
310 fio_clients_terminate();
311}
312
313static void client_signal_handler(void)
314{
315 struct sigaction act;
316
317 memset(&act, 0, sizeof(act));
318 act.sa_handler = sig_int;
319 act.sa_flags = SA_RESTART;
320 sigaction(SIGINT, &act, NULL);
321
322 memset(&act, 0, sizeof(act));
323 act.sa_handler = sig_int;
324 act.sa_flags = SA_RESTART;
325 sigaction(SIGTERM, &act, NULL);
326}
327
0b8f30a5
JA
328static void probe_client(struct fio_client *client)
329{
60efd14e
JA
330 dprint(FD_NET, "client: send probe\n");
331
89c1707c 332 fio_net_send_simple_cmd(client->fd, FIO_NET_CMD_PROBE, 0, &client->cmd_list);
0b8f30a5
JA
333}
334
81179eec
JA
335static int send_client_cmd_line(struct fio_client *client)
336{
fa2ea806
JA
337 struct cmd_single_line_pdu *cslp;
338 struct cmd_line_pdu *clp;
339 unsigned long offset;
7f868316 340 unsigned int *lens;
fa2ea806
JA
341 void *pdu;
342 size_t mem;
81179eec
JA
343 int i, ret;
344
39e8e016 345 dprint(FD_NET, "client: send cmdline %d\n", client->argc);
60efd14e 346
7f868316
JA
347 lens = malloc(client->argc * sizeof(unsigned int));
348
fa2ea806
JA
349 /*
350 * Find out how much mem we need
351 */
7f868316
JA
352 for (i = 0, mem = 0; i < client->argc; i++) {
353 lens[i] = strlen(client->argv[i]) + 1;
354 mem += lens[i];
355 }
fa2ea806
JA
356
357 /*
358 * We need one cmd_line_pdu, and argc number of cmd_single_line_pdu
359 */
360 mem += sizeof(*clp) + (client->argc * sizeof(*cslp));
361
362 pdu = malloc(mem);
363 clp = pdu;
364 offset = sizeof(*clp);
365
366 for (i = 0; i < client->argc; i++) {
7f868316 367 uint16_t arg_len = lens[i];
fa2ea806
JA
368
369 cslp = pdu + offset;
370 strcpy((char *) cslp->text, client->argv[i]);
371 cslp->len = cpu_to_le16(arg_len);
372 offset += sizeof(*cslp) + arg_len;
373 }
81179eec 374
7f868316 375 free(lens);
fa2ea806 376 clp->lines = cpu_to_le16(client->argc);
af9c9fb3 377 ret = fio_net_send_cmd(client->fd, FIO_NET_CMD_JOBLINE, pdu, mem, 0);
81179eec
JA
378 free(pdu);
379 return ret;
380}
381
a37f69b7
JA
382int fio_clients_connect(void)
383{
384 struct fio_client *client;
385 struct flist_head *entry, *tmp;
386 int ret;
387
60efd14e
JA
388 dprint(FD_NET, "client: connect all\n");
389
cc0df00a
JA
390 client_signal_handler();
391
a37f69b7
JA
392 flist_for_each_safe(entry, tmp, &client_list) {
393 client = flist_entry(entry, struct fio_client, list);
394
395 ret = fio_client_connect(client);
0b8f30a5 396 if (ret) {
a37f69b7 397 remove_client(client);
0b8f30a5
JA
398 continue;
399 }
400
401 probe_client(client);
81179eec
JA
402
403 if (client->argc > 1)
404 send_client_cmd_line(client);
a37f69b7
JA
405 }
406
407 return !nr_clients;
408}
409
132159a5
JA
410/*
411 * Send file contents to server backend. We could use sendfile(), but to remain
412 * more portable lets just read/write the darn thing.
413 */
a37f69b7 414static int fio_client_send_ini(struct fio_client *client, const char *filename)
132159a5
JA
415{
416 struct stat sb;
417 char *p, *buf;
418 off_t len;
419 int fd, ret;
420
46c48f1f
JA
421 dprint(FD_NET, "send ini %s to %s\n", filename, client->hostname);
422
132159a5
JA
423 fd = open(filename, O_RDONLY);
424 if (fd < 0) {
e951bdc4 425 log_err("fio: job file <%s> open: %s\n", filename, strerror(errno));
132159a5
JA
426 return 1;
427 }
428
429 if (fstat(fd, &sb) < 0) {
430 log_err("fio: job file stat: %s\n", strerror(errno));
b94cba47 431 close(fd);
132159a5
JA
432 return 1;
433 }
434
435 buf = malloc(sb.st_size);
436
437 len = sb.st_size;
438 p = buf;
439 do {
440 ret = read(fd, p, len);
441 if (ret > 0) {
442 len -= ret;
443 if (!len)
444 break;
445 p += ret;
446 continue;
447 } else if (!ret)
448 break;
449 else if (errno == EAGAIN || errno == EINTR)
450 continue;
451 } while (1);
452
0b8f30a5
JA
453 if (len) {
454 log_err("fio: failed reading job file %s\n", filename);
b94cba47 455 close(fd);
c524ef72 456 free(buf);
0b8f30a5
JA
457 return 1;
458 }
459
af9c9fb3 460 ret = fio_net_send_cmd(client->fd, FIO_NET_CMD_JOB, buf, sb.st_size, 0);
132159a5 461 free(buf);
b94cba47 462 close(fd);
132159a5
JA
463 return ret;
464}
37db14fe 465
a37f69b7
JA
466int fio_clients_send_ini(const char *filename)
467{
468 struct fio_client *client;
469 struct flist_head *entry, *tmp;
470
471 flist_for_each_safe(entry, tmp, &client_list) {
472 client = flist_entry(entry, struct fio_client, list);
473
474 if (fio_client_send_ini(client, filename))
475 remove_client(client);
476 }
477
478 return !nr_clients;
479}
480
a64e88da
JA
481static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
482{
483 dst->max_val = le64_to_cpu(src->max_val);
484 dst->min_val = le64_to_cpu(src->min_val);
485 dst->samples = le64_to_cpu(src->samples);
802ad4a8
JA
486
487 /*
488 * Floats arrive as IEEE 754 encoded uint64_t, convert back to double
489 */
490 dst->mean.u.f = fio_uint64_to_double(le64_to_cpu(dst->mean.u.i));
491 dst->S.u.f = fio_uint64_to_double(le64_to_cpu(dst->S.u.i));
a64e88da
JA
492}
493
494static void convert_ts(struct thread_stat *dst, struct thread_stat *src)
495{
496 int i, j;
497
498 dst->error = le32_to_cpu(src->error);
499 dst->groupid = le32_to_cpu(src->groupid);
500 dst->pid = le32_to_cpu(src->pid);
501 dst->members = le32_to_cpu(src->members);
502
503 for (i = 0; i < 2; i++) {
504 convert_io_stat(&dst->clat_stat[i], &src->clat_stat[i]);
505 convert_io_stat(&dst->slat_stat[i], &src->slat_stat[i]);
506 convert_io_stat(&dst->lat_stat[i], &src->lat_stat[i]);
507 convert_io_stat(&dst->bw_stat[i], &src->bw_stat[i]);
508 }
509
510 dst->usr_time = le64_to_cpu(src->usr_time);
511 dst->sys_time = le64_to_cpu(src->sys_time);
512 dst->ctx = le64_to_cpu(src->ctx);
513 dst->minf = le64_to_cpu(src->minf);
514 dst->majf = le64_to_cpu(src->majf);
515 dst->clat_percentiles = le64_to_cpu(src->clat_percentiles);
802ad4a8
JA
516
517 for (i = 0; i < FIO_IO_U_LIST_MAX_LEN; i++) {
518 fio_fp64_t *fps = &src->percentile_list[i];
519 fio_fp64_t *fpd = &dst->percentile_list[i];
520
521 fpd->u.f = fio_uint64_to_double(le64_to_cpu(fps->u.i));
522 }
a64e88da
JA
523
524 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
525 dst->io_u_map[i] = le32_to_cpu(src->io_u_map[i]);
526 dst->io_u_submit[i] = le32_to_cpu(src->io_u_submit[i]);
527 dst->io_u_complete[i] = le32_to_cpu(src->io_u_complete[i]);
528 }
529
530 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
531 dst->io_u_lat_u[i] = le32_to_cpu(src->io_u_lat_u[i]);
532 dst->io_u_lat_m[i] = le32_to_cpu(src->io_u_lat_m[i]);
533 }
534
535 for (i = 0; i < 2; i++)
536 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
537 dst->io_u_plat[i][j] = le32_to_cpu(src->io_u_plat[i][j]);
538
539 for (i = 0; i < 3; i++) {
540 dst->total_io_u[i] = le64_to_cpu(src->total_io_u[i]);
93eee04a 541 dst->short_io_u[i] = le64_to_cpu(src->short_io_u[i]);
a64e88da
JA
542 }
543
544 dst->total_submit = le64_to_cpu(src->total_submit);
545 dst->total_complete = le64_to_cpu(src->total_complete);
546
547 for (i = 0; i < 2; i++) {
548 dst->io_bytes[i] = le64_to_cpu(src->io_bytes[i]);
549 dst->runtime[i] = le64_to_cpu(src->runtime[i]);
550 }
551
552 dst->total_run_time = le64_to_cpu(src->total_run_time);
553 dst->continue_on_error = le16_to_cpu(src->continue_on_error);
554 dst->total_err_count = le64_to_cpu(src->total_err_count);
ddcc0b69
JA
555 dst->first_error = le32_to_cpu(src->first_error);
556 dst->kb_base = le32_to_cpu(src->kb_base);
a64e88da
JA
557}
558
559static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
560{
561 int i;
562
563 for (i = 0; i < 2; i++) {
564 dst->max_run[i] = le64_to_cpu(src->max_run[i]);
565 dst->min_run[i] = le64_to_cpu(src->min_run[i]);
566 dst->max_bw[i] = le64_to_cpu(src->max_bw[i]);
567 dst->min_bw[i] = le64_to_cpu(src->min_bw[i]);
568 dst->io_kb[i] = le64_to_cpu(src->io_kb[i]);
569 dst->agg[i] = le64_to_cpu(src->agg[i]);
570 }
571
572 dst->kb_base = le32_to_cpu(src->kb_base);
573 dst->groupid = le32_to_cpu(src->groupid);
574}
575
576static void handle_ts(struct fio_net_cmd *cmd)
577{
578 struct cmd_ts_pdu *p = (struct cmd_ts_pdu *) cmd->payload;
579
580 convert_ts(&p->ts, &p->ts);
581 convert_gs(&p->rs, &p->rs);
582
583 show_thread_status(&p->ts, &p->rs);
37f0c1ae
JA
584
585 if (sum_stat_clients == 1)
586 return;
587
588 sum_thread_stats(&client_ts, &p->ts, sum_stat_nr);
589 sum_group_stats(&client_gs, &p->rs);
590
591 client_ts.members++;
592 client_ts.groupid = p->ts.groupid;
593
594 if (++sum_stat_nr == sum_stat_clients) {
595 strcpy(client_ts.name, "All clients");
596 show_thread_status(&client_ts, &client_gs);
597 }
a64e88da
JA
598}
599
600static void handle_gs(struct fio_net_cmd *cmd)
601{
602 struct group_run_stats *gs = (struct group_run_stats *) cmd->payload;
603
604 convert_gs(gs, gs);
605 show_group_stats(gs);
606}
607
d09a64a0
JA
608static void convert_agg(struct disk_util_agg *agg)
609{
610 int i;
611
612 for (i = 0; i < 2; i++) {
613 agg->ios[i] = le32_to_cpu(agg->ios[i]);
614 agg->merges[i] = le32_to_cpu(agg->merges[i]);
615 agg->sectors[i] = le64_to_cpu(agg->sectors[i]);
616 agg->ticks[i] = le32_to_cpu(agg->ticks[i]);
617 }
618
619 agg->io_ticks = le32_to_cpu(agg->io_ticks);
620 agg->time_in_queue = le32_to_cpu(agg->time_in_queue);
621 agg->slavecount = le32_to_cpu(agg->slavecount);
622 agg->max_util.u.f = __le64_to_cpu(fio_uint64_to_double(agg->max_util.u.i));
623}
624
625static void convert_dus(struct disk_util_stat *dus)
626{
627 int i;
628
629 for (i = 0; i < 2; i++) {
630 dus->ios[i] = le32_to_cpu(dus->ios[i]);
631 dus->merges[i] = le32_to_cpu(dus->merges[i]);
632 dus->sectors[i] = le64_to_cpu(dus->sectors[i]);
633 dus->ticks[i] = le32_to_cpu(dus->ticks[i]);
634 }
635
636 dus->io_ticks = le32_to_cpu(dus->io_ticks);
637 dus->time_in_queue = le32_to_cpu(dus->time_in_queue);
638 dus->msec = le64_to_cpu(dus->msec);
639}
640
641static void handle_du(struct fio_client *client, struct fio_net_cmd *cmd)
642{
643 struct cmd_du_pdu *du = (struct cmd_du_pdu *) cmd->payload;
644
645 convert_dus(&du->dus);
646 convert_agg(&du->agg);
647
648 if (!client->disk_stats_shown) {
649 client->disk_stats_shown = 1;
650 log_info("\nDisk stats (read/write):\n");
651 }
652
f2f788dd 653 print_disk_util(&du->dus, &du->agg, terse_output);
d09a64a0
JA
654}
655
48fbb46e 656static void convert_jobs_eta(struct jobs_eta *je)
cf451d1e 657{
cf451d1e
JA
658 int i;
659
660 je->nr_running = le32_to_cpu(je->nr_running);
661 je->nr_ramp = le32_to_cpu(je->nr_ramp);
662 je->nr_pending = le32_to_cpu(je->nr_pending);
663 je->files_open = le32_to_cpu(je->files_open);
664 je->m_rate = le32_to_cpu(je->m_rate);
665 je->t_rate = le32_to_cpu(je->t_rate);
666 je->m_iops = le32_to_cpu(je->m_iops);
667 je->t_iops = le32_to_cpu(je->t_iops);
668
669 for (i = 0; i < 2; i++) {
670 je->rate[i] = le32_to_cpu(je->rate[i]);
671 je->iops[i] = le32_to_cpu(je->iops[i]);
672 }
673
b51eedb7 674 je->elapsed_sec = le64_to_cpu(je->elapsed_sec);
cf451d1e 675 je->eta_sec = le64_to_cpu(je->eta_sec);
48fbb46e
JA
676}
677
af9c9fb3 678static void sum_jobs_eta(struct jobs_eta *dst, struct jobs_eta *je)
48fbb46e 679{
48fbb46e
JA
680 int i;
681
682 dst->nr_running += je->nr_running;
683 dst->nr_ramp += je->nr_ramp;
684 dst->nr_pending += je->nr_pending;
685 dst->files_open += je->files_open;
686 dst->m_rate += je->m_rate;
687 dst->t_rate += je->t_rate;
688 dst->m_iops += je->m_iops;
689 dst->t_iops += je->t_iops;
690
691 for (i = 0; i < 2; i++) {
692 dst->rate[i] += je->rate[i];
693 dst->iops[i] += je->iops[i];
694 }
695
696 dst->elapsed_sec += je->elapsed_sec;
697
698 if (je->eta_sec > dst->eta_sec)
699 dst->eta_sec = je->eta_sec;
700}
701
82c1ed38
JA
702static void dec_jobs_eta(struct client_eta *eta)
703{
704 if (!--eta->pending) {
705 display_thread_status(&eta->eta);
706 free(eta);
707 }
708}
709
89c1707c
JA
710static void remove_reply_cmd(struct fio_client *client, struct fio_net_cmd *cmd)
711{
712 struct fio_net_int_cmd *icmd = NULL;
713 struct flist_head *entry;
714
715 flist_for_each(entry, &client->cmd_list) {
716 icmd = flist_entry(entry, struct fio_net_int_cmd, list);
717
df380934 718 if (cmd->tag == (uintptr_t) icmd)
89c1707c
JA
719 break;
720
721 icmd = NULL;
722 }
723
724 if (!icmd) {
725 log_err("fio: client: unable to find matching tag\n");
726 return;
727 }
728
729 flist_del(&icmd->list);
730 cmd->tag = icmd->saved_tag;
731 free(icmd);
732}
733
82c1ed38 734static void handle_eta(struct fio_client *client, struct fio_net_cmd *cmd)
48fbb46e
JA
735{
736 struct jobs_eta *je = (struct jobs_eta *) cmd->payload;
df380934 737 struct client_eta *eta = (struct client_eta *) (uintptr_t) cmd->tag;
af9c9fb3
JA
738
739 dprint(FD_NET, "client: got eta tag %p, %d\n", eta, eta->pending);
cf451d1e 740
f77d2676
JA
741 assert(client->eta_in_flight == eta);
742
743 client->eta_in_flight = NULL;
82c1ed38
JA
744 flist_del_init(&client->eta_list);
745
48fbb46e 746 convert_jobs_eta(je);
af9c9fb3 747 sum_jobs_eta(&eta->eta, je);
82c1ed38 748 dec_jobs_eta(eta);
cf451d1e
JA
749}
750
b5296ddb 751static void handle_probe(struct fio_client *client, struct fio_net_cmd *cmd)
2e03b4b2
JA
752{
753 struct cmd_probe_pdu *probe = (struct cmd_probe_pdu *) cmd->payload;
d2333358
JA
754 const char *os, *arch;
755 char bit[16];
2e03b4b2 756
cca84643
JA
757 os = fio_get_os_string(probe->os);
758 if (!os)
759 os = "unknown";
760
761 arch = fio_get_arch_string(probe->arch);
762 if (!arch)
763 os = "unknown";
764
d2333358 765 sprintf(bit, "%d-bit", probe->bpp * 8);
38fdef22
JA
766
767 log_info("hostname=%s, be=%u, %s, os=%s, arch=%s, fio=%u.%u.%u\n",
768 probe->hostname, probe->bigendian, bit, os, arch,
769 probe->fio_major, probe->fio_minor, probe->fio_patch);
b5296ddb
JA
770
771 if (!client->name)
772 client->name = strdup((char *) probe->hostname);
2e03b4b2
JA
773}
774
11e950bd
JA
775static void handle_start(struct fio_client *client, struct fio_net_cmd *cmd)
776{
777 struct cmd_start_pdu *pdu = (struct cmd_start_pdu *) cmd->payload;
778
779 client->state = Client_started;
780 client->jobs = le32_to_cpu(pdu->jobs);
781}
782
783static void handle_stop(struct fio_client *client, struct fio_net_cmd *cmd)
784{
785 struct cmd_end_pdu *pdu = (struct cmd_end_pdu *) cmd->payload;
786
787 client->state = Client_stopped;
788 client->error = le32_to_cpu(pdu->error);
498c92c2
JA
789
790 if (client->error)
791 log_info("client <%s>: exited with error %d\n", client->hostname, client->error);
11e950bd
JA
792}
793
e951bdc4 794static int handle_client(struct fio_client *client)
37db14fe
JA
795{
796 struct fio_net_cmd *cmd;
797
60efd14e
JA
798 dprint(FD_NET, "client: handle %s\n", client->hostname);
799
e951bdc4
JA
800 cmd = fio_net_recv_cmd(client->fd);
801 if (!cmd)
802 return 0;
c2c94585 803
89c1707c
JA
804 dprint(FD_NET, "client: got cmd op %s from %s\n",
805 fio_server_op(cmd->opcode), client->hostname);
46c48f1f 806
e951bdc4
JA
807 switch (cmd->opcode) {
808 case FIO_NET_CMD_QUIT:
809 remove_client(client);
810 free(cmd);
811 break;
812 case FIO_NET_CMD_TEXT: {
813 const char *buf = (const char *) cmd->payload;
b5296ddb 814 const char *name;
e951bdc4
JA
815 int fio_unused ret;
816
b5296ddb
JA
817 name = client->name ? client->name : client->hostname;
818
e951bdc4 819 if (!client->skip_newline)
b5296ddb 820 fprintf(f_out, "<%s> ", name);
e951bdc4
JA
821 ret = fwrite(buf, cmd->pdu_len, 1, f_out);
822 fflush(f_out);
823 client->skip_newline = strchr(buf, '\n') == NULL;
824 free(cmd);
825 break;
37db14fe 826 }
d09a64a0
JA
827 case FIO_NET_CMD_DU:
828 handle_du(client, cmd);
829 free(cmd);
830 break;
e951bdc4
JA
831 case FIO_NET_CMD_TS:
832 handle_ts(cmd);
833 free(cmd);
834 break;
835 case FIO_NET_CMD_GS:
836 handle_gs(cmd);
837 free(cmd);
838 break;
839 case FIO_NET_CMD_ETA:
89c1707c 840 remove_reply_cmd(client, cmd);
82c1ed38 841 handle_eta(client, cmd);
e951bdc4
JA
842 free(cmd);
843 break;
844 case FIO_NET_CMD_PROBE:
89c1707c 845 remove_reply_cmd(client, cmd);
b5296ddb 846 handle_probe(client, cmd);
e951bdc4
JA
847 free(cmd);
848 break;
01be038e
JA
849 case FIO_NET_CMD_RUN:
850 client->state = Client_running;
851 free(cmd);
852 break;
e951bdc4 853 case FIO_NET_CMD_START:
11e950bd 854 handle_start(client, cmd);
e951bdc4
JA
855 free(cmd);
856 break;
857 case FIO_NET_CMD_STOP:
11e950bd 858 handle_stop(client, cmd);
e951bdc4
JA
859 free(cmd);
860 break;
861 default:
89c1707c 862 log_err("fio: unknown client op: %s\n", fio_server_op(cmd->opcode));
e951bdc4
JA
863 free(cmd);
864 break;
37db14fe
JA
865 }
866
e951bdc4 867 return 1;
37db14fe 868}
b66570dc 869
af9c9fb3
JA
870static void request_client_etas(void)
871{
872 struct fio_client *client;
873 struct flist_head *entry;
874 struct client_eta *eta;
82c1ed38 875 int skipped = 0;
af9c9fb3
JA
876
877 dprint(FD_NET, "client: request eta (%d)\n", nr_clients);
878
af9c9fb3
JA
879 eta = malloc(sizeof(*eta));
880 memset(&eta->eta, 0, sizeof(eta->eta));
881 eta->pending = nr_clients;
882
883 flist_for_each(entry, &client_list) {
884 client = flist_entry(entry, struct fio_client, list);
885
82c1ed38
JA
886 if (!flist_empty(&client->eta_list)) {
887 skipped++;
888 continue;
889 }
01be038e
JA
890 if (client->state != Client_running)
891 continue;
82c1ed38 892
f77d2676 893 assert(!client->eta_in_flight);
82c1ed38 894 flist_add_tail(&client->eta_list, &eta_list);
f77d2676 895 client->eta_in_flight = eta;
af9c9fb3 896 fio_net_send_simple_cmd(client->fd, FIO_NET_CMD_SEND_ETA,
df380934 897 (uintptr_t) eta, &client->cmd_list);
af9c9fb3
JA
898 }
899
82c1ed38
JA
900 while (skipped--)
901 dec_jobs_eta(eta);
902
af9c9fb3
JA
903 dprint(FD_NET, "client: requested eta tag %p\n", eta);
904}
905
89c1707c
JA
906static int client_check_cmd_timeout(struct fio_client *client,
907 struct timeval *now)
908{
909 struct fio_net_int_cmd *cmd;
910 struct flist_head *entry, *tmp;
911 int ret = 0;
912
913 flist_for_each_safe(entry, tmp, &client->cmd_list) {
914 cmd = flist_entry(entry, struct fio_net_int_cmd, list);
915
916 if (mtime_since(&cmd->tv, now) < FIO_NET_CLIENT_TIMEOUT)
917 continue;
918
919 log_err("fio: client %s, timeout on cmd %s\n", client->hostname,
920 fio_server_op(cmd->cmd.opcode));
921 flist_del(&cmd->list);
922 free(cmd);
923 ret = 1;
924 }
925
926 return flist_empty(&client->cmd_list) && ret;
927}
928
929static int fio_client_timed_out(void)
930{
931 struct fio_client *client;
932 struct flist_head *entry, *tmp;
933 struct timeval tv;
934 int ret = 0;
935
936 gettimeofday(&tv, NULL);
937
938 flist_for_each_safe(entry, tmp, &client_list) {
939 client = flist_entry(entry, struct fio_client, list);
940
941 if (flist_empty(&client->cmd_list))
942 continue;
943
944 if (!client_check_cmd_timeout(client, &tv))
945 continue;
946
947 log_err("fio: client %s timed out\n", client->hostname);
948 remove_client(client);
949 ret = 1;
950 }
951
952 return ret;
953}
954
b66570dc
JA
955int fio_handle_clients(void)
956{
957 struct fio_client *client;
958 struct flist_head *entry;
959 struct pollfd *pfds;
498c92c2 960 int i, ret = 0, retval = 0;
b66570dc 961
af9c9fb3
JA
962 gettimeofday(&eta_tv, NULL);
963
b66570dc
JA
964 pfds = malloc(nr_clients * sizeof(struct pollfd));
965
37f0c1ae
JA
966 sum_stat_clients = nr_clients;
967 init_thread_stat(&client_ts);
968 init_group_run_stat(&client_gs);
969
82a4be1b
JA
970 while (!exit_backend && nr_clients) {
971 i = 0;
972 flist_for_each(entry, &client_list) {
973 client = flist_entry(entry, struct fio_client, list);
b66570dc 974
82a4be1b
JA
975 pfds[i].fd = client->fd;
976 pfds[i].events = POLLIN;
977 i++;
978 }
979
980 assert(i == nr_clients);
b66570dc 981
5c2857f9 982 do {
af9c9fb3
JA
983 struct timeval tv;
984
985 gettimeofday(&tv, NULL);
986 if (mtime_since(&eta_tv, &tv) >= 900) {
987 request_client_etas();
988 memcpy(&eta_tv, &tv, sizeof(tv));
89c1707c
JA
989
990 if (fio_client_timed_out())
991 break;
af9c9fb3
JA
992 }
993
5c2857f9
JA
994 ret = poll(pfds, nr_clients, 100);
995 if (ret < 0) {
996 if (errno == EINTR)
997 continue;
998 log_err("fio: poll clients: %s\n", strerror(errno));
999 break;
1000 } else if (!ret)
b66570dc 1001 continue;
5c2857f9 1002 } while (ret <= 0);
b66570dc
JA
1003
1004 for (i = 0; i < nr_clients; i++) {
1005 if (!(pfds[i].revents & POLLIN))
1006 continue;
1007
1008 client = find_client_by_fd(pfds[i].fd);
1009 if (!client) {
3c5f57e3 1010 log_err("fio: unknown client fd %d\n", pfds[i].fd);
b66570dc
JA
1011 continue;
1012 }
e951bdc4 1013 if (!handle_client(client)) {
28d3ab07
JA
1014 log_info("client: host=%s disconnected\n",
1015 client->hostname);
1016 remove_client(client);
498c92c2 1017 retval = 1;
28d3ab07 1018 }
498c92c2
JA
1019 if (client->error)
1020 retval = 1;
b66570dc
JA
1021 }
1022 }
1023
1024 free(pfds);
498c92c2 1025 return retval;
b66570dc 1026}