server: more debug dumping
[fio.git] / server.c
... / ...
CommitLineData
1#include <stdio.h>
2#include <stdlib.h>
3#include <stdarg.h>
4#include <unistd.h>
5#include <limits.h>
6#include <errno.h>
7#include <fcntl.h>
8#include <sys/poll.h>
9#include <sys/types.h>
10#include <sys/wait.h>
11#include <sys/mman.h>
12#include <netinet/in.h>
13#include <arpa/inet.h>
14#include <netdb.h>
15#include <syslog.h>
16
17#include "fio.h"
18#include "server.h"
19#include "crc/crc16.h"
20
/* TCP port that fio_server() binds its listening socket to */
21int fio_net_port = 8765;
22
/*
 * Set to 1 by the EXIT command and by the SIGINT/SIGTERM handler; the
 * send, receive, connection and accept loops in this file test it to
 * decide when to stop.
 */
23int exit_backend = 0;
24
/* Socket of the client accepted by accept_loop(), -1 while there is none */
25static int server_fd = -1;
26
27int fio_send_data(int sk, const void *p, unsigned int len)
28{
29 assert(len <= sizeof(struct fio_net_cmd) + FIO_SERVER_MAX_PDU);
30
31 do {
32 int ret = send(sk, p, len, 0);
33
34 if (ret > 0) {
35 len -= ret;
36 if (!len)
37 break;
38 p += ret;
39 continue;
40 } else if (!ret)
41 break;
42 else if (errno == EAGAIN || errno == EINTR)
43 continue;
44 } while (!exit_backend);
45
46 if (!len)
47 return 0;
48
49 return 1;
50}
51
52int fio_recv_data(int sk, void *p, unsigned int len)
53{
54 do {
55 int ret = recv(sk, p, len, MSG_WAITALL);
56
57 if (ret > 0) {
58 len -= ret;
59 if (!len)
60 break;
61 p += ret;
62 continue;
63 } else if (!ret)
64 break;
65 else if (errno == EAGAIN || errno == EINTR)
66 continue;
67 } while (!exit_backend);
68
69 if (!len)
70 return 0;
71
72 return -1;
73}
74
75static int verify_convert_cmd(struct fio_net_cmd *cmd)
76{
77 uint16_t crc;
78
79 cmd->cmd_crc16 = le16_to_cpu(cmd->cmd_crc16);
80 cmd->pdu_crc16 = le16_to_cpu(cmd->pdu_crc16);
81
82 crc = crc16(cmd, FIO_NET_CMD_CRC_SZ);
83 if (crc != cmd->cmd_crc16) {
84 log_err("fio: server bad crc on command (got %x, wanted %x)\n",
85 cmd->cmd_crc16, crc);
86 return 1;
87 }
88
89 cmd->version = le16_to_cpu(cmd->version);
90 cmd->opcode = le16_to_cpu(cmd->opcode);
91 cmd->flags = le32_to_cpu(cmd->flags);
92 cmd->serial = le64_to_cpu(cmd->serial);
93 cmd->pdu_len = le32_to_cpu(cmd->pdu_len);
94
95 switch (cmd->version) {
96 case FIO_SERVER_VER1:
97 break;
98 default:
99 log_err("fio: bad server cmd version %d\n", cmd->version);
100 return 1;
101 }
102
103 if (cmd->pdu_len > FIO_SERVER_MAX_PDU) {
104 log_err("fio: command payload too large: %u\n", cmd->pdu_len);
105 return 1;
106 }
107
108 return 0;
109}
110
111/*
112 * Read (and defragment, if necessary) incoming commands
113 */
114struct fio_net_cmd *fio_net_recv_cmd(int sk, int block)
115{
116 struct fio_net_cmd cmd, *cmdret = NULL;
117 size_t cmd_size = 0, pdu_offset = 0;
118 uint16_t crc;
119 int ret, first = 1;
120 void *pdu = NULL;
121
122 do {
123 struct pollfd pfd;
124
125 pfd.fd = sk;
126 pfd.events = POLLIN;
127 ret = 0;
128 do {
129 int timeo = block ? 100 : 10;
130
131 ret = poll(&pfd, 1, timeo);
132 if (ret < 0) {
133 if (errno == EINTR)
134 break;
135 log_err("fio: poll: %s\n", strerror(errno));
136 break;
137 } else if (!ret) {
138 if (!block)
139 return NULL;
140 continue;
141 }
142
143 if (pfd.revents & POLLIN)
144 break;
145 if (pfd.revents & (POLLERR|POLLHUP)) {
146 ret = 1;
147 break;
148 }
149 } while (ret >= 0 && block);
150
151 if (ret < 0)
152 break;
153
154 ret = fio_recv_data(sk, &cmd, sizeof(cmd));
155 if (ret)
156 break;
157
158 /* We have a command, verify it and swap if need be */
159 ret = verify_convert_cmd(&cmd);
160 if (ret)
161 break;
162
163 if (first) {
164 /* if this is text, add room for \0 at the end */
165 cmd_size = sizeof(cmd) + cmd.pdu_len + 1;
166 assert(!cmdret);
167 } else
168 cmd_size += cmd.pdu_len;
169
170 cmdret = realloc(cmdret, cmd_size);
171
172 if (first)
173 memcpy(cmdret, &cmd, sizeof(cmd));
174 else
175 assert(cmdret->opcode == cmd.opcode);
176
177 if (!cmd.pdu_len)
178 break;
179
180 /* There's payload, get it */
181 pdu = (void *) cmdret->payload + pdu_offset;
182 ret = fio_recv_data(sk, pdu, cmd.pdu_len);
183 if (ret)
184 break;
185
186 /* Verify payload crc */
187 crc = crc16(pdu, cmd.pdu_len);
188 if (crc != cmd.pdu_crc16) {
189 log_err("fio: server bad crc on payload ");
190 log_err("(got %x, wanted %x)\n", cmd.pdu_crc16, crc);
191 ret = 1;
192 break;
193 }
194
195 pdu_offset += cmd.pdu_len;
196 if (!first)
197 cmdret->pdu_len += cmd.pdu_len;
198 first = 0;
199 } while (cmd.flags & FIO_NET_CMD_F_MORE);
200
201 if (ret) {
202 free(cmdret);
203 cmdret = NULL;
204 } else if (cmdret) {
205 /* zero-terminate text input */
206 if (cmdret->pdu_len && (cmdret->opcode == FIO_NET_CMD_TEXT ||
207 cmdret->opcode == FIO_NET_CMD_JOB)) {
208 char *buf = (char *) cmdret->payload;
209
210 buf[cmdret->pdu_len ] = '\0';
211 }
212 /* frag flag is internal */
213 cmdret->flags &= ~FIO_NET_CMD_F_MORE;
214 }
215
216 return cmdret;
217}
218
219void fio_net_cmd_crc(struct fio_net_cmd *cmd)
220{
221 uint32_t pdu_len;
222
223 cmd->cmd_crc16 = __cpu_to_le16(crc16(cmd, FIO_NET_CMD_CRC_SZ));
224
225 pdu_len = le32_to_cpu(cmd->pdu_len);
226 if (pdu_len)
227 cmd->pdu_crc16 = __cpu_to_le16(crc16(cmd->payload, pdu_len));
228}
229
230int fio_net_send_cmd(int fd, uint16_t opcode, const void *buf, off_t size)
231{
232 struct fio_net_cmd *cmd;
233 size_t this_len;
234 int ret;
235
236 do {
237 this_len = size;
238 if (this_len > FIO_SERVER_MAX_PDU)
239 this_len = FIO_SERVER_MAX_PDU;
240
241 cmd = malloc(sizeof(*cmd) + this_len);
242
243 fio_init_net_cmd(cmd, opcode, buf, this_len);
244
245 if (this_len < size)
246 cmd->flags = __cpu_to_le32(FIO_NET_CMD_F_MORE);
247
248 fio_net_cmd_crc(cmd);
249
250 ret = fio_send_data(fd, cmd, sizeof(*cmd) + this_len);
251 free(cmd);
252 size -= this_len;
253 buf += this_len;
254 } while (!ret && size);
255
256 return ret;
257}
258
259int fio_net_send_simple_cmd(int sk, uint16_t opcode, uint64_t serial)
260{
261 struct fio_net_cmd cmd = {
262 .version = __cpu_to_le16(FIO_SERVER_VER1),
263 .opcode = cpu_to_le16(opcode),
264 .serial = cpu_to_le64(serial),
265 };
266
267 fio_net_cmd_crc(&cmd);
268
269 return fio_send_data(sk, &cmd, sizeof(cmd));
270}
271
272static int fio_server_send_quit_cmd(void)
273{
274 dprint(FD_NET, "server: sending quit\n");
275 return fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_QUIT, 0);
276}
277
278static int handle_job_cmd(struct fio_net_cmd *cmd)
279{
280 char *buf = (char *) cmd->payload;
281 int ret;
282
283 if (parse_jobs_ini(buf, 1, 0))
284 return -1;
285
286 fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_START, 0);
287
288 ret = exec_run();
289 fio_server_send_quit_cmd();
290 reset_fio_state();
291 return ret;
292}
293
294static int handle_jobline_cmd(struct fio_net_cmd *cmd)
295{
296 struct cmd_line_pdu *pdu = (struct cmd_line_pdu *) cmd->payload;
297 char *argv[FIO_NET_CMD_JOBLINE_ARGV];
298 int ret, i;
299
300 pdu->argc = le16_to_cpu(pdu->argc);
301
302 dprint(FD_NET, "server: %d command line args\n", pdu->argc);
303
304 for (i = 0; i < pdu->argc; i++) {
305 argv[i] = (char *) pdu->argv[i];
306 dprint(FD_NET, "server: %d: %s\n", i, argv[i]);
307 }
308
309 if (parse_cmd_line(pdu->argc, argv))
310 return -1;
311
312 fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_START, 0);
313
314 ret = exec_run();
315 fio_server_send_quit_cmd();
316 reset_fio_state();
317 return ret;
318}
319
320static int handle_probe_cmd(struct fio_net_cmd *cmd)
321{
322 struct cmd_probe_pdu probe;
323
324 memset(&probe, 0, sizeof(probe));
325 gethostname((char *) probe.hostname, sizeof(probe.hostname));
326 probe.fio_major = FIO_MAJOR;
327 probe.fio_minor = FIO_MINOR;
328 probe.fio_patch = FIO_PATCH;
329
330 return fio_net_send_cmd(server_fd, FIO_NET_CMD_PROBE, &probe, sizeof(probe));
331}
332
333static int handle_command(struct fio_net_cmd *cmd)
334{
335 int ret;
336
337 dprint(FD_NET, "server: got opcode %d\n", cmd->opcode);
338
339 switch (cmd->opcode) {
340 case FIO_NET_CMD_QUIT:
341 fio_terminate_threads(TERMINATE_ALL);
342 return -1;
343 case FIO_NET_CMD_EXIT:
344 exit_backend = 1;
345 return -1;
346 case FIO_NET_CMD_JOB:
347 ret = handle_job_cmd(cmd);
348 break;
349 case FIO_NET_CMD_JOBLINE:
350 ret = handle_jobline_cmd(cmd);
351 break;
352 case FIO_NET_CMD_PROBE:
353 ret = handle_probe_cmd(cmd);
354 break;
355 default:
356 log_err("fio: unknown opcode: %d\n", cmd->opcode);
357 ret = 1;
358 }
359
360 return ret;
361}
362
363static int handle_connection(int sk, int block)
364{
365 struct fio_net_cmd *cmd = NULL;
366 int ret = 0;
367
368 /* read forever */
369 while (!exit_backend) {
370 cmd = fio_net_recv_cmd(sk, block);
371 if (!cmd) {
372 ret = -1;
373 break;
374 }
375
376 ret = handle_command(cmd);
377 if (ret)
378 break;
379
380 free(cmd);
381 cmd = NULL;
382 }
383
384 if (cmd)
385 free(cmd);
386
387 return ret;
388}
389
390void fio_server_idle_loop(void)
391{
392 if (server_fd != -1)
393 handle_connection(server_fd, 0);
394}
395
396static int accept_loop(int listen_sk)
397{
398 struct sockaddr addr;
399 unsigned int len = sizeof(addr);
400 struct pollfd pfd;
401 int ret, sk, flags, exitval = 0;
402
403 dprint(FD_NET, "server enter accept loop\n");
404
405 flags = fcntl(listen_sk, F_GETFL);
406 flags |= O_NONBLOCK;
407 fcntl(listen_sk, F_SETFL, flags);
408again:
409 pfd.fd = listen_sk;
410 pfd.events = POLLIN;
411 do {
412 ret = poll(&pfd, 1, 100);
413 if (ret < 0) {
414 if (errno == EINTR)
415 break;
416 log_err("fio: poll: %s\n", strerror(errno));
417 goto out;
418 } else if (!ret)
419 continue;
420
421 if (pfd.revents & POLLIN)
422 break;
423 } while (!exit_backend);
424
425 if (exit_backend)
426 goto out;
427
428 sk = accept(listen_sk, &addr, &len);
429 if (sk < 0) {
430 log_err("fio: accept: %s\n", strerror(errno));
431 return -1;
432 }
433
434 dprint(FD_NET, "server got a connection\n");
435
436 server_fd = sk;
437
438 exitval = handle_connection(sk, 1);
439
440 server_fd = -1;
441 close(sk);
442
443 if (!exit_backend)
444 goto again;
445
446out:
447 return exitval;
448}
449
450int fio_server_text_output(const char *buf, unsigned int len)
451{
452 if (server_fd != -1)
453 return fio_net_send_cmd(server_fd, FIO_NET_CMD_TEXT, buf, len);
454
455 return 0;
456}
457
458static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
459{
460 dst->max_val = cpu_to_le64(src->max_val);
461 dst->min_val = cpu_to_le64(src->min_val);
462 dst->samples = cpu_to_le64(src->samples);
463 /* FIXME */
464 dst->mean = __cpu_to_le64(src->mean);
465 dst->S = __cpu_to_le64(src->S);
466}
467
468static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
469{
470 int i;
471
472 for (i = 0; i < 2; i++) {
473 dst->max_run[i] = cpu_to_le64(src->max_run[i]);
474 dst->min_run[i] = cpu_to_le64(src->min_run[i]);
475 dst->max_bw[i] = cpu_to_le64(src->max_bw[i]);
476 dst->min_bw[i] = cpu_to_le64(src->min_bw[i]);
477 dst->io_kb[i] = cpu_to_le64(src->io_kb[i]);
478 dst->agg[i] = cpu_to_le64(src->agg[i]);
479 }
480
481 dst->kb_base = cpu_to_le32(src->kb_base);
482 dst->groupid = cpu_to_le32(src->groupid);
483}
484
485/*
486 * Send a CMD_TS, which packs struct thread_stat and group_run_stats
487 * into a single payload.
488 */
489void fio_server_send_ts(struct thread_stat *ts, struct group_run_stats *rs)
490{
491 struct cmd_ts_pdu p;
492 int i, j;
493
494 dprint(FD_NET, "server sending end stats\n");
495
496 memset(&p, 0, sizeof(p));
497
498 strcpy(p.ts.name, ts->name);
499 strcpy(p.ts.verror, ts->verror);
500 strcpy(p.ts.description, ts->description);
501
502 p.ts.error = cpu_to_le32(ts->error);
503 p.ts.groupid = cpu_to_le32(ts->groupid);
504 p.ts.pid = cpu_to_le32(ts->pid);
505 p.ts.members = cpu_to_le32(ts->members);
506
507 for (i = 0; i < 2; i++) {
508 convert_io_stat(&p.ts.clat_stat[i], &ts->clat_stat[i]);
509 convert_io_stat(&p.ts.slat_stat[i], &ts->slat_stat[i]);
510 convert_io_stat(&p.ts.lat_stat[i], &ts->lat_stat[i]);
511 convert_io_stat(&p.ts.bw_stat[i], &ts->bw_stat[i]);
512 }
513
514 p.ts.usr_time = cpu_to_le64(ts->usr_time);
515 p.ts.sys_time = cpu_to_le64(ts->sys_time);
516 p.ts.ctx = cpu_to_le64(ts->ctx);
517 p.ts.minf = cpu_to_le64(ts->minf);
518 p.ts.majf = cpu_to_le64(ts->majf);
519 p.ts.clat_percentiles = cpu_to_le64(ts->clat_percentiles);
520 p.ts.percentile_list = NULL;
521
522 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
523 p.ts.io_u_map[i] = cpu_to_le32(ts->io_u_map[i]);
524 p.ts.io_u_submit[i] = cpu_to_le32(ts->io_u_submit[i]);
525 p.ts.io_u_complete[i] = cpu_to_le32(ts->io_u_complete[i]);
526 }
527
528 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
529 p.ts.io_u_lat_u[i] = cpu_to_le32(ts->io_u_lat_u[i]);
530 p.ts.io_u_lat_m[i] = cpu_to_le32(ts->io_u_lat_m[i]);
531 }
532
533 for (i = 0; i < 2; i++)
534 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
535 p.ts.io_u_plat[i][j] = cpu_to_le32(ts->io_u_plat[i][j]);
536
537 for (i = 0; i < 3; i++) {
538 p.ts.total_io_u[i] = cpu_to_le64(ts->total_io_u[i]);
539 p.ts.short_io_u[i] = cpu_to_le64(ts->short_io_u[i]);
540 }
541
542 p.ts.total_submit = cpu_to_le64(ts->total_submit);
543 p.ts.total_complete = cpu_to_le64(ts->total_complete);
544
545 for (i = 0; i < 2; i++) {
546 p.ts.io_bytes[i] = cpu_to_le64(ts->io_bytes[i]);
547 p.ts.runtime[i] = cpu_to_le64(ts->runtime[i]);
548 }
549
550 p.ts.total_run_time = cpu_to_le64(ts->total_run_time);
551 p.ts.continue_on_error = cpu_to_le16(ts->continue_on_error);
552 p.ts.total_err_count = cpu_to_le64(ts->total_err_count);
553 p.ts.first_error = cpu_to_le32(ts->first_error);
554 p.ts.kb_base = cpu_to_le32(ts->kb_base);
555
556 convert_gs(&p.rs, rs);
557
558 fio_net_send_cmd(server_fd, FIO_NET_CMD_TS, &p, sizeof(p));
559}
560
561void fio_server_send_gs(struct group_run_stats *rs)
562{
563 struct group_run_stats gs;
564
565 dprint(FD_NET, "server sending group run stats\n");
566
567 convert_gs(&gs, rs);
568 fio_net_send_cmd(server_fd, FIO_NET_CMD_GS, &gs, sizeof(gs));
569}
570
571void fio_server_send_status(void)
572{
573 struct jobs_eta *je;
574 size_t size;
575 void *buf;
576 int i;
577
578 size = sizeof(*je) + thread_number * sizeof(char);
579 buf = malloc(size);
580 memset(buf, 0, size);
581 je = buf;
582
583 if (!calc_thread_status(je)) {
584 free(je);
585 return;
586 }
587
588 dprint(FD_NET, "server sending status\n");
589
590 je->nr_running = cpu_to_le32(je->nr_running);
591 je->nr_ramp = cpu_to_le32(je->nr_ramp);
592 je->nr_pending = cpu_to_le32(je->nr_pending);
593 je->files_open = cpu_to_le32(je->files_open);
594 je->m_rate = cpu_to_le32(je->m_rate);
595 je->t_rate = cpu_to_le32(je->t_rate);
596 je->m_iops = cpu_to_le32(je->m_iops);
597 je->t_iops = cpu_to_le32(je->t_iops);
598
599 for (i = 0; i < 2; i++) {
600 je->rate[i] = cpu_to_le32(je->rate[i]);
601 je->iops[i] = cpu_to_le32(je->iops[i]);
602 }
603
604 je->elapsed_sec = cpu_to_le32(je->nr_running);
605 je->eta_sec = cpu_to_le64(je->eta_sec);
606
607 fio_net_send_cmd(server_fd, FIO_NET_CMD_ETA, buf, size);
608 free(je);
609}
610
611int fio_server_log(const char *format, ...)
612{
613 char buffer[1024];
614 va_list args;
615 size_t len;
616
617 dprint(FD_NET, "server log\n");
618
619 va_start(args, format);
620 len = vsnprintf(buffer, sizeof(buffer), format, args);
621 va_end(args);
622
623 return fio_server_text_output(buffer, len);
624}
625
626static int fio_server(void)
627{
628 struct sockaddr_in saddr_in;
629 struct sockaddr addr;
630 unsigned int len;
631 int sk, opt, ret;
632
633 dprint(FD_NET, "starting server\n");
634
635 sk = socket(AF_INET, SOCK_STREAM, 0);
636 if (sk < 0) {
637 log_err("fio: socket: %s\n", strerror(errno));
638 return -1;
639 }
640
641 opt = 1;
642 if (setsockopt(sk, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)) < 0) {
643 log_err("fio: setsockopt: %s\n", strerror(errno));
644 return -1;
645 }
646#ifdef SO_REUSEPORT
647 if (setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)) < 0) {
648 log_err("fio: setsockopt: %s\n", strerror(errno));
649 return -1;
650 }
651#endif
652
653 saddr_in.sin_family = AF_INET;
654 saddr_in.sin_addr.s_addr = htonl(INADDR_ANY);
655 saddr_in.sin_port = htons(fio_net_port);
656
657 if (bind(sk, (struct sockaddr *) &saddr_in, sizeof(saddr_in)) < 0) {
658 log_err("fio: bind: %s\n", strerror(errno));
659 return -1;
660 }
661
662 if (listen(sk, 1) < 0) {
663 log_err("fio: listen: %s\n", strerror(errno));
664 return -1;
665 }
666
667 len = sizeof(addr);
668 if (getsockname(sk, &addr, &len) < 0) {
669 log_err("fio: getsockname: %s\n", strerror(errno));
670 return -1;
671 }
672
673 ret = accept_loop(sk);
674 close(sk);
675 return ret;
676}
677
678static void sig_int(int sig)
679{
680 fio_terminate_threads(TERMINATE_ALL);
681 exit_backend = 1;
682}
683
684static void server_signal_handler(void)
685{
686 struct sigaction act;
687
688 memset(&act, 0, sizeof(act));
689 act.sa_handler = sig_int;
690 act.sa_flags = SA_RESTART;
691 sigaction(SIGINT, &act, NULL);
692
693 memset(&act, 0, sizeof(act));
694 act.sa_handler = sig_int;
695 act.sa_flags = SA_RESTART;
696 sigaction(SIGTERM, &act, NULL);
697}
698
699int fio_start_server(int daemonize)
700{
701 pid_t pid;
702
703 server_signal_handler();
704
705 if (!daemonize)
706 return fio_server();
707
708 openlog("fio", LOG_NDELAY|LOG_NOWAIT|LOG_PID, LOG_USER);
709 pid = fork();
710 if (pid < 0) {
711 syslog(LOG_ERR, "failed server fork");
712 return -1;
713 } else if (pid)
714 exit(0);
715
716 setsid();
717 close(STDIN_FILENO);
718 close(STDOUT_FILENO);
719 close(STDERR_FILENO);
720 f_out = NULL;
721 f_err = NULL;
722 log_syslog = 1;
723 return fio_server();
724}