server: more debug dumping
[fio.git] / client.c
CommitLineData
132159a5
JA
1#include <stdio.h>
2#include <stdlib.h>
3#include <unistd.h>
4#include <limits.h>
5#include <errno.h>
6#include <fcntl.h>
7#include <sys/poll.h>
8#include <sys/types.h>
9#include <sys/stat.h>
10#include <sys/wait.h>
11#include <sys/mman.h>
12#include <netinet/in.h>
13#include <arpa/inet.h>
14#include <netdb.h>
15
16#include "fio.h"
17#include "server.h"
18#include "crc/crc32.h"
b66570dc 19#include "flist.h"
132159a5 20
b66570dc
JA
21struct fio_client {
22 struct flist_head list;
23 struct sockaddr_in addr;
24 char *hostname;
25 int fd;
81179eec
JA
26
27 int state;
17dd1764 28 int skip_newline;
81179eec
JA
29
30 uint16_t argc;
31 char **argv;
32};
33
/*
 * Values stored in fio_client->state. The numbering starts at zero and
 * increases by one per entry.
 */
enum {
	Client_created,		/* 0 */
	Client_connected,	/* 1 */
	Client_started,		/* 2 */
	Client_stopped,		/* 3 */
	Client_exited,		/* 4 */
};
41
/* Every known client, linked through fio_client->list. */
static FLIST_HEAD(client_list);

/* Declared early because probe_client() calls it before its definition. */
static int handle_client(struct fio_client *client, int one);
45
b66570dc
JA
46static struct fio_client *find_client_by_fd(int fd)
47{
48 struct fio_client *client;
49 struct flist_head *entry;
50
51 flist_for_each(entry, &client_list) {
52 client = flist_entry(entry, struct fio_client, list);
53
54 if (client->fd == fd)
55 return client;
56 }
57
58 return NULL;
59}
60
61static struct fio_client *find_client_by_name(const char *name)
62{
63 struct fio_client *client;
64 struct flist_head *entry;
65
66 flist_for_each(entry, &client_list) {
67 client = flist_entry(entry, struct fio_client, list);
68
69 if (!strcmp(name, client->hostname))
70 return client;
71 }
72
73 return NULL;
74}
75
76static void remove_client(struct fio_client *client)
77{
39e8e016 78 dprint(FD_NET, "client: removed <%s>\n", client->hostname);
b66570dc
JA
79 flist_del(&client->list);
80 nr_clients--;
81179eec 81
b66570dc 82 free(client->hostname);
81179eec
JA
83 if (client->argv)
84 free(client->argv);
85
b66570dc
JA
86 free(client);
87}
132159a5 88
81179eec
JA
89static void __fio_client_add_cmd_option(struct fio_client *client,
90 const char *opt)
91{
39e8e016
JA
92 int index;
93
94 index = client->argc++;
81179eec 95 client->argv = realloc(client->argv, sizeof(char *) * client->argc);
39e8e016
JA
96 client->argv[index] = strdup(opt);
97 dprint(FD_NET, "client: add cmd %d: %s\n", index, opt);
81179eec
JA
98}
99
/*
 * Add command line option 'opt' to the client registered as 'hostname'.
 * A NULL hostname or option is ignored silently; an unknown hostname is
 * reported through log_err().
 */
void fio_client_add_cmd_option(const char *hostname, const char *opt)
{
	struct fio_client *target;

	if (hostname && opt) {
		target = find_client_by_name(hostname);
		if (target)
			__fio_client_add_cmd_option(target, opt);
		else
			log_err("fio: unknown client %s\n", hostname);
	}
}
115
a37f69b7 116void fio_client_add(const char *hostname)
132159a5 117{
b66570dc 118 struct fio_client *client;
132159a5 119
39e8e016 120 dprint(FD_NET, "client: added <%s>\n", hostname);
b66570dc 121 client = malloc(sizeof(*client));
a37f69b7 122 memset(client, 0, sizeof(*client));
81179eec 123
a37f69b7
JA
124 client->hostname = strdup(hostname);
125 client->fd = -1;
81179eec
JA
126
127 __fio_client_add_cmd_option(client, "fio");
128
a37f69b7
JA
129 flist_add(&client->list, &client_list);
130 nr_clients++;
131}
132
133static int fio_client_connect(struct fio_client *client)
134{
135 int fd;
132159a5 136
39e8e016 137 dprint(FD_NET, "client: connect to host %s\n", client->hostname);
46c48f1f 138
b66570dc
JA
139 memset(&client->addr, 0, sizeof(client->addr));
140 client->addr.sin_family = AF_INET;
141 client->addr.sin_port = htons(fio_net_port);
142
a37f69b7 143 if (inet_aton(client->hostname, &client->addr.sin_addr) != 1) {
132159a5
JA
144 struct hostent *hent;
145
a37f69b7 146 hent = gethostbyname(client->hostname);
132159a5
JA
147 if (!hent) {
148 log_err("fio: gethostbyname: %s\n", strerror(errno));
149 return 1;
150 }
151
b66570dc 152 memcpy(&client->addr.sin_addr, hent->h_addr, 4);
132159a5
JA
153 }
154
155 fd = socket(AF_INET, SOCK_STREAM, 0);
156 if (fd < 0) {
157 log_err("fio: socket: %s\n", strerror(errno));
158 return 1;
159 }
160
b66570dc 161 if (connect(fd, (struct sockaddr *) &client->addr, sizeof(client->addr)) < 0) {
132159a5 162 log_err("fio: connect: %s\n", strerror(errno));
cdf54d85 163 log_err("fio: failed to connect to %s\n", client->hostname);
132159a5
JA
164 return 1;
165 }
166
b66570dc 167 client->fd = fd;
81179eec 168 client->state = Client_connected;
132159a5
JA
169 return 0;
170}
171
cc0df00a
JA
172void fio_clients_terminate(void)
173{
174 struct flist_head *entry;
175 struct fio_client *client;
176
60efd14e
JA
177 dprint(FD_NET, "client: terminate clients\n");
178
cc0df00a
JA
179 flist_for_each(entry, &client_list) {
180 client = flist_entry(entry, struct fio_client, list);
181
182 fio_net_send_simple_cmd(client->fd, FIO_NET_CMD_QUIT, 0);
183 }
184}
185
186static void sig_int(int sig)
187{
60efd14e 188 dprint(FD_NET, "client: got sign %d\n", sig);
cc0df00a
JA
189 fio_clients_terminate();
190}
191
192static void client_signal_handler(void)
193{
194 struct sigaction act;
195
196 memset(&act, 0, sizeof(act));
197 act.sa_handler = sig_int;
198 act.sa_flags = SA_RESTART;
199 sigaction(SIGINT, &act, NULL);
200
201 memset(&act, 0, sizeof(act));
202 act.sa_handler = sig_int;
203 act.sa_flags = SA_RESTART;
204 sigaction(SIGTERM, &act, NULL);
205}
206
0b8f30a5
JA
207static void probe_client(struct fio_client *client)
208{
60efd14e
JA
209 dprint(FD_NET, "client: send probe\n");
210
0b8f30a5
JA
211 fio_net_send_simple_cmd(client->fd, FIO_NET_CMD_PROBE, 0);
212 handle_client(client, 1);
213}
214
81179eec
JA
215static int send_client_cmd_line(struct fio_client *client)
216{
217 struct cmd_line_pdu *pdu;
218 int i, ret;
219
39e8e016 220 dprint(FD_NET, "client: send cmdline %d\n", client->argc);
60efd14e 221
81179eec
JA
222 pdu = malloc(sizeof(*pdu));
223 for (i = 0; i < client->argc; i++)
224 strcpy((char *) pdu->argv[i], client->argv[i]);
225
226 pdu->argc = cpu_to_le16(client->argc);
227 ret = fio_net_send_cmd(client->fd, FIO_NET_CMD_JOBLINE, pdu, sizeof(*pdu));
228 free(pdu);
229 return ret;
230}
231
a37f69b7
JA
232int fio_clients_connect(void)
233{
234 struct fio_client *client;
235 struct flist_head *entry, *tmp;
236 int ret;
237
60efd14e
JA
238 dprint(FD_NET, "client: connect all\n");
239
cc0df00a
JA
240 client_signal_handler();
241
a37f69b7
JA
242 flist_for_each_safe(entry, tmp, &client_list) {
243 client = flist_entry(entry, struct fio_client, list);
244
245 ret = fio_client_connect(client);
0b8f30a5 246 if (ret) {
a37f69b7 247 remove_client(client);
0b8f30a5
JA
248 continue;
249 }
250
251 probe_client(client);
81179eec
JA
252
253 if (client->argc > 1)
254 send_client_cmd_line(client);
a37f69b7
JA
255 }
256
257 return !nr_clients;
258}
259
132159a5
JA
260/*
261 * Send file contents to server backend. We could use sendfile(), but to remain
262 * more portable lets just read/write the darn thing.
263 */
a37f69b7 264static int fio_client_send_ini(struct fio_client *client, const char *filename)
132159a5
JA
265{
266 struct stat sb;
267 char *p, *buf;
268 off_t len;
269 int fd, ret;
270
46c48f1f
JA
271 dprint(FD_NET, "send ini %s to %s\n", filename, client->hostname);
272
132159a5
JA
273 fd = open(filename, O_RDONLY);
274 if (fd < 0) {
275 log_err("fio: job file open: %s\n", strerror(errno));
276 return 1;
277 }
278
279 if (fstat(fd, &sb) < 0) {
280 log_err("fio: job file stat: %s\n", strerror(errno));
281 return 1;
282 }
283
284 buf = malloc(sb.st_size);
285
286 len = sb.st_size;
287 p = buf;
288 do {
289 ret = read(fd, p, len);
290 if (ret > 0) {
291 len -= ret;
292 if (!len)
293 break;
294 p += ret;
295 continue;
296 } else if (!ret)
297 break;
298 else if (errno == EAGAIN || errno == EINTR)
299 continue;
300 } while (1);
301
0b8f30a5
JA
302 if (len) {
303 log_err("fio: failed reading job file %s\n", filename);
304 return 1;
305 }
306
81179eec 307 ret = fio_net_send_cmd(client->fd, FIO_NET_CMD_JOB, buf, sb.st_size);
132159a5
JA
308 free(buf);
309 return ret;
310}
37db14fe 311
a37f69b7
JA
312int fio_clients_send_ini(const char *filename)
313{
314 struct fio_client *client;
315 struct flist_head *entry, *tmp;
316
317 flist_for_each_safe(entry, tmp, &client_list) {
318 client = flist_entry(entry, struct fio_client, list);
319
320 if (fio_client_send_ini(client, filename))
321 remove_client(client);
322 }
323
324 return !nr_clients;
325}
326
a64e88da
JA
327static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
328{
329 dst->max_val = le64_to_cpu(src->max_val);
330 dst->min_val = le64_to_cpu(src->min_val);
331 dst->samples = le64_to_cpu(src->samples);
332 /* FIXME */
ddcc0b69
JA
333 dst->mean = __le64_to_cpu(src->mean);
334 dst->S = __le64_to_cpu(src->S);
a64e88da
JA
335}
336
337static void convert_ts(struct thread_stat *dst, struct thread_stat *src)
338{
339 int i, j;
340
341 dst->error = le32_to_cpu(src->error);
342 dst->groupid = le32_to_cpu(src->groupid);
343 dst->pid = le32_to_cpu(src->pid);
344 dst->members = le32_to_cpu(src->members);
345
346 for (i = 0; i < 2; i++) {
347 convert_io_stat(&dst->clat_stat[i], &src->clat_stat[i]);
348 convert_io_stat(&dst->slat_stat[i], &src->slat_stat[i]);
349 convert_io_stat(&dst->lat_stat[i], &src->lat_stat[i]);
350 convert_io_stat(&dst->bw_stat[i], &src->bw_stat[i]);
351 }
352
353 dst->usr_time = le64_to_cpu(src->usr_time);
354 dst->sys_time = le64_to_cpu(src->sys_time);
355 dst->ctx = le64_to_cpu(src->ctx);
356 dst->minf = le64_to_cpu(src->minf);
357 dst->majf = le64_to_cpu(src->majf);
358 dst->clat_percentiles = le64_to_cpu(src->clat_percentiles);
359 dst->percentile_list = NULL;
360
361 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
362 dst->io_u_map[i] = le32_to_cpu(src->io_u_map[i]);
363 dst->io_u_submit[i] = le32_to_cpu(src->io_u_submit[i]);
364 dst->io_u_complete[i] = le32_to_cpu(src->io_u_complete[i]);
365 }
366
367 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
368 dst->io_u_lat_u[i] = le32_to_cpu(src->io_u_lat_u[i]);
369 dst->io_u_lat_m[i] = le32_to_cpu(src->io_u_lat_m[i]);
370 }
371
372 for (i = 0; i < 2; i++)
373 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
374 dst->io_u_plat[i][j] = le32_to_cpu(src->io_u_plat[i][j]);
375
376 for (i = 0; i < 3; i++) {
377 dst->total_io_u[i] = le64_to_cpu(src->total_io_u[i]);
93eee04a 378 dst->short_io_u[i] = le64_to_cpu(src->short_io_u[i]);
a64e88da
JA
379 }
380
381 dst->total_submit = le64_to_cpu(src->total_submit);
382 dst->total_complete = le64_to_cpu(src->total_complete);
383
384 for (i = 0; i < 2; i++) {
385 dst->io_bytes[i] = le64_to_cpu(src->io_bytes[i]);
386 dst->runtime[i] = le64_to_cpu(src->runtime[i]);
387 }
388
389 dst->total_run_time = le64_to_cpu(src->total_run_time);
390 dst->continue_on_error = le16_to_cpu(src->continue_on_error);
391 dst->total_err_count = le64_to_cpu(src->total_err_count);
ddcc0b69
JA
392 dst->first_error = le32_to_cpu(src->first_error);
393 dst->kb_base = le32_to_cpu(src->kb_base);
a64e88da
JA
394}
395
396static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
397{
398 int i;
399
400 for (i = 0; i < 2; i++) {
401 dst->max_run[i] = le64_to_cpu(src->max_run[i]);
402 dst->min_run[i] = le64_to_cpu(src->min_run[i]);
403 dst->max_bw[i] = le64_to_cpu(src->max_bw[i]);
404 dst->min_bw[i] = le64_to_cpu(src->min_bw[i]);
405 dst->io_kb[i] = le64_to_cpu(src->io_kb[i]);
406 dst->agg[i] = le64_to_cpu(src->agg[i]);
407 }
408
409 dst->kb_base = le32_to_cpu(src->kb_base);
410 dst->groupid = le32_to_cpu(src->groupid);
411}
412
413static void handle_ts(struct fio_net_cmd *cmd)
414{
415 struct cmd_ts_pdu *p = (struct cmd_ts_pdu *) cmd->payload;
416
417 convert_ts(&p->ts, &p->ts);
418 convert_gs(&p->rs, &p->rs);
419
420 show_thread_status(&p->ts, &p->rs);
421}
422
423static void handle_gs(struct fio_net_cmd *cmd)
424{
425 struct group_run_stats *gs = (struct group_run_stats *) cmd->payload;
426
427 convert_gs(gs, gs);
428 show_group_stats(gs);
429}
430
cf451d1e
JA
431static void handle_eta(struct fio_net_cmd *cmd)
432{
433 struct jobs_eta *je = (struct jobs_eta *) cmd->payload;
434 int i;
435
436 je->nr_running = le32_to_cpu(je->nr_running);
437 je->nr_ramp = le32_to_cpu(je->nr_ramp);
438 je->nr_pending = le32_to_cpu(je->nr_pending);
439 je->files_open = le32_to_cpu(je->files_open);
440 je->m_rate = le32_to_cpu(je->m_rate);
441 je->t_rate = le32_to_cpu(je->t_rate);
442 je->m_iops = le32_to_cpu(je->m_iops);
443 je->t_iops = le32_to_cpu(je->t_iops);
444
445 for (i = 0; i < 2; i++) {
446 je->rate[i] = le32_to_cpu(je->rate[i]);
447 je->iops[i] = le32_to_cpu(je->iops[i]);
448 }
449
450 je->elapsed_sec = le32_to_cpu(je->nr_running);
451 je->eta_sec = le64_to_cpu(je->eta_sec);
452
453 display_thread_status(je);
454}
455
2e03b4b2
JA
456static void handle_probe(struct fio_net_cmd *cmd)
457{
458 struct cmd_probe_pdu *probe = (struct cmd_probe_pdu *) cmd->payload;
459
0b8f30a5
JA
460 log_info("Probe: hostname=%s, fio ver %u.%u.%u\n", probe->hostname,
461 probe->fio_major, probe->fio_minor, probe->fio_patch);
2e03b4b2
JA
462}
463
0b8f30a5 464static int handle_client(struct fio_client *client, int one)
37db14fe
JA
465{
466 struct fio_net_cmd *cmd;
a450e492 467 int done = 0;
37db14fe 468
60efd14e
JA
469 dprint(FD_NET, "client: handle %s\n", client->hostname);
470
70e0c316 471 while ((cmd = fio_net_recv_cmd(client->fd, 1)) != NULL) {
46c48f1f
JA
472 dprint(FD_NET, "%s: got cmd op %d\n", client->hostname,
473 cmd->opcode);
474
a64e88da 475 switch (cmd->opcode) {
a64e88da 476 case FIO_NET_CMD_QUIT:
b66570dc 477 remove_client(client);
437377e1 478 free(cmd);
a450e492 479 done = 1;
437377e1 480 break;
17dd1764
JA
481 case FIO_NET_CMD_TEXT: {
482 const char *buf = (const char *) cmd->payload;
483
484 if (!client->skip_newline)
485 fprintf(f_out, "Client <%s>: ", client->hostname);
486 fwrite(buf, cmd->pdu_len, 1, f_out);
0b8f30a5 487 fflush(f_out);
17dd1764 488 client->skip_newline = strchr(buf, '\n') == NULL;
37db14fe 489 free(cmd);
a64e88da 490 break;
17dd1764 491 }
a64e88da
JA
492 case FIO_NET_CMD_TS:
493 handle_ts(cmd);
494 free(cmd);
495 break;
496 case FIO_NET_CMD_GS:
497 handle_gs(cmd);
498 free(cmd);
499 break;
cf451d1e
JA
500 case FIO_NET_CMD_ETA:
501 handle_eta(cmd);
502 free(cmd);
503 break;
2e03b4b2
JA
504 case FIO_NET_CMD_PROBE:
505 handle_probe(cmd);
506 free(cmd);
507 break;
81179eec
JA
508 case FIO_NET_CMD_START:
509 client->state = Client_started;
510 free(cmd);
511 break;
512 case FIO_NET_CMD_STOP:
513 client->state = Client_stopped;
514 free(cmd);
515 break;
a64e88da
JA
516 default:
517 log_err("fio: unknown client op: %d\n", cmd->opcode);
518 free(cmd);
519 break;
37db14fe 520 }
a450e492 521
0b8f30a5 522 if (done || one)
a450e492 523 break;
37db14fe
JA
524 }
525
526 return 0;
527}
b66570dc
JA
528
529int fio_handle_clients(void)
530{
531 struct fio_client *client;
532 struct flist_head *entry;
533 struct pollfd *pfds;
82a4be1b 534 int i, ret = 0;
b66570dc
JA
535
536 pfds = malloc(nr_clients * sizeof(struct pollfd));
537
82a4be1b
JA
538 while (!exit_backend && nr_clients) {
539 i = 0;
540 flist_for_each(entry, &client_list) {
541 client = flist_entry(entry, struct fio_client, list);
b66570dc 542
82a4be1b
JA
543 pfds[i].fd = client->fd;
544 pfds[i].events = POLLIN;
545 i++;
546 }
547
548 assert(i == nr_clients);
b66570dc 549
5c2857f9
JA
550 do {
551 ret = poll(pfds, nr_clients, 100);
552 if (ret < 0) {
553 if (errno == EINTR)
554 continue;
555 log_err("fio: poll clients: %s\n", strerror(errno));
556 break;
557 } else if (!ret)
b66570dc 558 continue;
5c2857f9 559 } while (ret <= 0);
b66570dc
JA
560
561 for (i = 0; i < nr_clients; i++) {
562 if (!(pfds[i].revents & POLLIN))
563 continue;
564
565 client = find_client_by_fd(pfds[i].fd);
566 if (!client) {
567 log_err("fio: unknown client\n");
568 continue;
569 }
0b8f30a5 570 handle_client(client, 0);
b66570dc
JA
571 }
572 }
573
574 free(pfds);
b66570dc
JA
575 return 0;
576}