server: quit on !block and backend exit
[fio.git] / server.c
... / ...
CommitLineData
1#include <stdio.h>
2#include <stdlib.h>
3#include <stdarg.h>
4#include <unistd.h>
5#include <limits.h>
6#include <errno.h>
7#include <fcntl.h>
8#include <sys/poll.h>
9#include <sys/types.h>
10#include <sys/wait.h>
11#include <sys/socket.h>
12#include <netinet/in.h>
13#include <arpa/inet.h>
14#include <netdb.h>
15#include <syslog.h>
16#include <signal.h>
17
18#include "fio.h"
19#include "server.h"
20#include "crc/crc16.h"
21#include "ieee754.h"
22
/* TCP port the server's listening socket is bound to (see fio_server()). */
int fio_net_port = 8765;

/*
 * Set non-zero to make the server loops wind down; written by the
 * SIGINT/SIGTERM handler and by the FIO_NET_CMD_EXIT command.
 */
int exit_backend = 0;

/* Socket of the currently connected client, or -1 when no client is attached. */
static int server_fd = -1;
28
29int fio_send_data(int sk, const void *p, unsigned int len)
30{
31 assert(len <= sizeof(struct fio_net_cmd) + FIO_SERVER_MAX_PDU);
32
33 do {
34 int ret = send(sk, p, len, 0);
35
36 if (ret > 0) {
37 len -= ret;
38 if (!len)
39 break;
40 p += ret;
41 continue;
42 } else if (!ret)
43 break;
44 else if (errno == EAGAIN || errno == EINTR)
45 continue;
46 } while (!exit_backend);
47
48 if (!len)
49 return 0;
50
51 return 1;
52}
53
54int fio_recv_data(int sk, void *p, unsigned int len)
55{
56 do {
57 int ret = recv(sk, p, len, MSG_WAITALL);
58
59 if (ret > 0) {
60 len -= ret;
61 if (!len)
62 break;
63 p += ret;
64 continue;
65 } else if (!ret)
66 break;
67 else if (errno == EAGAIN || errno == EINTR)
68 continue;
69 } while (!exit_backend);
70
71 if (!len)
72 return 0;
73
74 return -1;
75}
76
77static int verify_convert_cmd(struct fio_net_cmd *cmd)
78{
79 uint16_t crc;
80
81 cmd->cmd_crc16 = le16_to_cpu(cmd->cmd_crc16);
82 cmd->pdu_crc16 = le16_to_cpu(cmd->pdu_crc16);
83
84 crc = crc16(cmd, FIO_NET_CMD_CRC_SZ);
85 if (crc != cmd->cmd_crc16) {
86 log_err("fio: server bad crc on command (got %x, wanted %x)\n",
87 cmd->cmd_crc16, crc);
88 return 1;
89 }
90
91 cmd->version = le16_to_cpu(cmd->version);
92 cmd->opcode = le16_to_cpu(cmd->opcode);
93 cmd->flags = le32_to_cpu(cmd->flags);
94 cmd->serial = le64_to_cpu(cmd->serial);
95 cmd->pdu_len = le32_to_cpu(cmd->pdu_len);
96
97 switch (cmd->version) {
98 case FIO_SERVER_VER1:
99 break;
100 default:
101 log_err("fio: bad server cmd version %d\n", cmd->version);
102 return 1;
103 }
104
105 if (cmd->pdu_len > FIO_SERVER_MAX_PDU) {
106 log_err("fio: command payload too large: %u\n", cmd->pdu_len);
107 return 1;
108 }
109
110 return 0;
111}
112
113/*
114 * Read (and defragment, if necessary) incoming commands
115 */
116struct fio_net_cmd *fio_net_recv_cmd(int sk)
117{
118 struct fio_net_cmd cmd, *cmdret = NULL;
119 size_t cmd_size = 0, pdu_offset = 0;
120 uint16_t crc;
121 int ret, first = 1;
122 void *pdu = NULL;
123
124 do {
125 ret = fio_recv_data(sk, &cmd, sizeof(cmd));
126 if (ret)
127 break;
128
129 /* We have a command, verify it and swap if need be */
130 ret = verify_convert_cmd(&cmd);
131 if (ret)
132 break;
133
134 if (first) {
135 /* if this is text, add room for \0 at the end */
136 cmd_size = sizeof(cmd) + cmd.pdu_len + 1;
137 assert(!cmdret);
138 } else
139 cmd_size += cmd.pdu_len;
140
141 cmdret = realloc(cmdret, cmd_size);
142
143 if (first)
144 memcpy(cmdret, &cmd, sizeof(cmd));
145 else
146 assert(cmdret->opcode == cmd.opcode);
147
148 if (!cmd.pdu_len)
149 break;
150
151 /* There's payload, get it */
152 pdu = (void *) cmdret->payload + pdu_offset;
153 ret = fio_recv_data(sk, pdu, cmd.pdu_len);
154 if (ret)
155 break;
156
157 /* Verify payload crc */
158 crc = crc16(pdu, cmd.pdu_len);
159 if (crc != cmd.pdu_crc16) {
160 log_err("fio: server bad crc on payload ");
161 log_err("(got %x, wanted %x)\n", cmd.pdu_crc16, crc);
162 ret = 1;
163 break;
164 }
165
166 pdu_offset += cmd.pdu_len;
167 if (!first)
168 cmdret->pdu_len += cmd.pdu_len;
169 first = 0;
170 } while (cmd.flags & FIO_NET_CMD_F_MORE);
171
172 if (ret) {
173 free(cmdret);
174 cmdret = NULL;
175 } else if (cmdret) {
176 /* zero-terminate text input */
177 if (cmdret->pdu_len && (cmdret->opcode == FIO_NET_CMD_TEXT ||
178 cmdret->opcode == FIO_NET_CMD_JOB)) {
179 char *buf = (char *) cmdret->payload;
180
181 buf[cmdret->pdu_len ] = '\0';
182 }
183 /* frag flag is internal */
184 cmdret->flags &= ~FIO_NET_CMD_F_MORE;
185 }
186
187 return cmdret;
188}
189
190void fio_net_cmd_crc(struct fio_net_cmd *cmd)
191{
192 uint32_t pdu_len;
193
194 cmd->cmd_crc16 = __cpu_to_le16(crc16(cmd, FIO_NET_CMD_CRC_SZ));
195
196 pdu_len = le32_to_cpu(cmd->pdu_len);
197 if (pdu_len)
198 cmd->pdu_crc16 = __cpu_to_le16(crc16(cmd->payload, pdu_len));
199}
200
201int fio_net_send_cmd(int fd, uint16_t opcode, const void *buf, off_t size)
202{
203 struct fio_net_cmd *cmd;
204 size_t this_len;
205 int ret;
206
207 do {
208 this_len = size;
209 if (this_len > FIO_SERVER_MAX_PDU)
210 this_len = FIO_SERVER_MAX_PDU;
211
212 cmd = malloc(sizeof(*cmd) + this_len);
213
214 fio_init_net_cmd(cmd, opcode, buf, this_len);
215
216 if (this_len < size)
217 cmd->flags = __cpu_to_le32(FIO_NET_CMD_F_MORE);
218
219 fio_net_cmd_crc(cmd);
220
221 ret = fio_send_data(fd, cmd, sizeof(*cmd) + this_len);
222 free(cmd);
223 size -= this_len;
224 buf += this_len;
225 } while (!ret && size);
226
227 return ret;
228}
229
230int fio_net_send_simple_cmd(int sk, uint16_t opcode, uint64_t serial)
231{
232 struct fio_net_cmd cmd = {
233 .version = __cpu_to_le16(FIO_SERVER_VER1),
234 .opcode = cpu_to_le16(opcode),
235 .serial = cpu_to_le64(serial),
236 };
237
238 fio_net_cmd_crc(&cmd);
239
240 return fio_send_data(sk, &cmd, sizeof(cmd));
241}
242
243static int fio_server_send_quit_cmd(void)
244{
245 dprint(FD_NET, "server: sending quit\n");
246 return fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_QUIT, 0);
247}
248
249static int handle_job_cmd(struct fio_net_cmd *cmd)
250{
251 char *buf = (char *) cmd->payload;
252 int ret;
253
254 if (parse_jobs_ini(buf, 1, 0)) {
255 fio_server_send_quit_cmd();
256 return -1;
257 }
258
259 fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_START, 0);
260
261 ret = exec_run();
262 fio_server_send_quit_cmd();
263 reset_fio_state();
264 return ret;
265}
266
267static int handle_jobline_cmd(struct fio_net_cmd *cmd)
268{
269 struct cmd_line_pdu *pdu = (struct cmd_line_pdu *) cmd->payload;
270 char *argv[FIO_NET_CMD_JOBLINE_ARGV];
271 int ret, i;
272
273 pdu->argc = le16_to_cpu(pdu->argc);
274
275 dprint(FD_NET, "server: %d command line args\n", pdu->argc);
276
277 for (i = 0; i < pdu->argc; i++) {
278 argv[i] = (char *) pdu->argv[i];
279 dprint(FD_NET, "server: %d: %s\n", i, argv[i]);
280 }
281
282 if (parse_cmd_line(pdu->argc, argv)) {
283 fio_server_send_quit_cmd();
284 return -1;
285 }
286
287 fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_START, 0);
288
289 ret = exec_run();
290 fio_server_send_quit_cmd();
291 reset_fio_state();
292 return ret;
293}
294
295static int handle_probe_cmd(struct fio_net_cmd *cmd)
296{
297 struct cmd_probe_pdu probe;
298
299 memset(&probe, 0, sizeof(probe));
300 gethostname((char *) probe.hostname, sizeof(probe.hostname));
301#ifdef FIO_BIG_ENDIAN
302 probe.bigendian = 1;
303#endif
304 probe.fio_major = FIO_MAJOR;
305 probe.fio_minor = FIO_MINOR;
306 probe.fio_patch = FIO_PATCH;
307
308 return fio_net_send_cmd(server_fd, FIO_NET_CMD_PROBE, &probe, sizeof(probe));
309}
310
311static int handle_command(struct fio_net_cmd *cmd)
312{
313 int ret;
314
315 dprint(FD_NET, "server: got opcode %d\n", cmd->opcode);
316
317 switch (cmd->opcode) {
318 case FIO_NET_CMD_QUIT:
319 fio_terminate_threads(TERMINATE_ALL);
320 return -1;
321 case FIO_NET_CMD_EXIT:
322 exit_backend = 1;
323 return -1;
324 case FIO_NET_CMD_JOB:
325 ret = handle_job_cmd(cmd);
326 break;
327 case FIO_NET_CMD_JOBLINE:
328 ret = handle_jobline_cmd(cmd);
329 break;
330 case FIO_NET_CMD_PROBE:
331 ret = handle_probe_cmd(cmd);
332 break;
333 default:
334 log_err("fio: unknown opcode: %d\n", cmd->opcode);
335 ret = 1;
336 }
337
338 return ret;
339}
340
341static int handle_connection(int sk, int block)
342{
343 struct fio_net_cmd *cmd = NULL;
344 int ret = 0;
345
346 /* read forever */
347 while (!exit_backend) {
348 struct pollfd pfd = {
349 .fd = sk,
350 .events = POLLIN,
351 };
352
353 ret = 0;
354 do {
355 ret = poll(&pfd, 1, 100);
356 if (ret < 0) {
357 if (errno == EINTR)
358 break;
359 log_err("fio: poll: %s\n", strerror(errno));
360 break;
361 } else if (!ret) {
362 if (!block)
363 return 0;
364 continue;
365 }
366
367 if (pfd.revents & POLLIN)
368 break;
369 if (pfd.revents & (POLLERR|POLLHUP)) {
370 ret = 1;
371 break;
372 }
373 } while (!exit_backend);
374
375 if (ret < 0)
376 break;
377
378 cmd = fio_net_recv_cmd(sk);
379 if (!cmd) {
380 ret = -1;
381 break;
382 }
383
384 ret = handle_command(cmd);
385 if (ret)
386 break;
387
388 free(cmd);
389 cmd = NULL;
390 }
391
392 if (cmd)
393 free(cmd);
394
395 return ret;
396}
397
398void fio_server_idle_loop(void)
399{
400 if (server_fd != -1)
401 handle_connection(server_fd, 0);
402}
403
404static int accept_loop(int listen_sk)
405{
406 struct sockaddr_in addr;
407 fio_socklen_t len = sizeof(addr);
408 struct pollfd pfd;
409 int ret, sk, flags, exitval = 0;
410
411 dprint(FD_NET, "server enter accept loop\n");
412
413 flags = fcntl(listen_sk, F_GETFL);
414 flags |= O_NONBLOCK;
415 fcntl(listen_sk, F_SETFL, flags);
416again:
417 pfd.fd = listen_sk;
418 pfd.events = POLLIN;
419 do {
420 ret = poll(&pfd, 1, 100);
421 if (ret < 0) {
422 if (errno == EINTR)
423 break;
424 log_err("fio: poll: %s\n", strerror(errno));
425 goto out;
426 } else if (!ret)
427 continue;
428
429 if (pfd.revents & POLLIN)
430 break;
431 } while (!exit_backend);
432
433 if (exit_backend)
434 goto out;
435
436 sk = accept(listen_sk, (struct sockaddr *) &addr, &len);
437 if (sk < 0) {
438 log_err("fio: accept: %s\n", strerror(errno));
439 return -1;
440 }
441
442 dprint(FD_NET, "server: connect from %s\n", inet_ntoa(addr.sin_addr));
443
444 server_fd = sk;
445
446 exitval = handle_connection(sk, 1);
447
448 server_fd = -1;
449 close(sk);
450
451 if (!exit_backend)
452 goto again;
453
454out:
455 return exitval;
456}
457
458int fio_server_text_output(const char *buf, unsigned int len)
459{
460 if (server_fd != -1)
461 return fio_net_send_cmd(server_fd, FIO_NET_CMD_TEXT, buf, len);
462
463 return fwrite(buf, len, 1, f_err);
464}
465
466static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
467{
468 dst->max_val = cpu_to_le64(src->max_val);
469 dst->min_val = cpu_to_le64(src->min_val);
470 dst->samples = cpu_to_le64(src->samples);
471
472 /*
473 * Encode to IEEE 754 for network transfer
474 */
475 dst->mean.u.i = __cpu_to_le64(fio_double_to_uint64(src->mean.u.f));
476 dst->S.u.i = __cpu_to_le64(fio_double_to_uint64(src->S.u.f));
477}
478
479static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
480{
481 int i;
482
483 for (i = 0; i < 2; i++) {
484 dst->max_run[i] = cpu_to_le64(src->max_run[i]);
485 dst->min_run[i] = cpu_to_le64(src->min_run[i]);
486 dst->max_bw[i] = cpu_to_le64(src->max_bw[i]);
487 dst->min_bw[i] = cpu_to_le64(src->min_bw[i]);
488 dst->io_kb[i] = cpu_to_le64(src->io_kb[i]);
489 dst->agg[i] = cpu_to_le64(src->agg[i]);
490 }
491
492 dst->kb_base = cpu_to_le32(src->kb_base);
493 dst->groupid = cpu_to_le32(src->groupid);
494}
495
496/*
497 * Send a CMD_TS, which packs struct thread_stat and group_run_stats
498 * into a single payload.
499 */
500void fio_server_send_ts(struct thread_stat *ts, struct group_run_stats *rs)
501{
502 struct cmd_ts_pdu p;
503 int i, j;
504
505 dprint(FD_NET, "server sending end stats\n");
506
507 memset(&p, 0, sizeof(p));
508
509 strcpy(p.ts.name, ts->name);
510 strcpy(p.ts.verror, ts->verror);
511 strcpy(p.ts.description, ts->description);
512
513 p.ts.error = cpu_to_le32(ts->error);
514 p.ts.groupid = cpu_to_le32(ts->groupid);
515 p.ts.pid = cpu_to_le32(ts->pid);
516 p.ts.members = cpu_to_le32(ts->members);
517
518 for (i = 0; i < 2; i++) {
519 convert_io_stat(&p.ts.clat_stat[i], &ts->clat_stat[i]);
520 convert_io_stat(&p.ts.slat_stat[i], &ts->slat_stat[i]);
521 convert_io_stat(&p.ts.lat_stat[i], &ts->lat_stat[i]);
522 convert_io_stat(&p.ts.bw_stat[i], &ts->bw_stat[i]);
523 }
524
525 p.ts.usr_time = cpu_to_le64(ts->usr_time);
526 p.ts.sys_time = cpu_to_le64(ts->sys_time);
527 p.ts.ctx = cpu_to_le64(ts->ctx);
528 p.ts.minf = cpu_to_le64(ts->minf);
529 p.ts.majf = cpu_to_le64(ts->majf);
530 p.ts.clat_percentiles = cpu_to_le64(ts->clat_percentiles);
531
532 for (i = 0; i < FIO_IO_U_LIST_MAX_LEN; i++) {
533 fio_fp64_t *fp = &p.ts.percentile_list[i];
534
535 fp->u.i = __cpu_to_le64(fio_double_to_uint64(fp->u.f));
536 }
537
538 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
539 p.ts.io_u_map[i] = cpu_to_le32(ts->io_u_map[i]);
540 p.ts.io_u_submit[i] = cpu_to_le32(ts->io_u_submit[i]);
541 p.ts.io_u_complete[i] = cpu_to_le32(ts->io_u_complete[i]);
542 }
543
544 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
545 p.ts.io_u_lat_u[i] = cpu_to_le32(ts->io_u_lat_u[i]);
546 p.ts.io_u_lat_m[i] = cpu_to_le32(ts->io_u_lat_m[i]);
547 }
548
549 for (i = 0; i < 2; i++)
550 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
551 p.ts.io_u_plat[i][j] = cpu_to_le32(ts->io_u_plat[i][j]);
552
553 for (i = 0; i < 3; i++) {
554 p.ts.total_io_u[i] = cpu_to_le64(ts->total_io_u[i]);
555 p.ts.short_io_u[i] = cpu_to_le64(ts->short_io_u[i]);
556 }
557
558 p.ts.total_submit = cpu_to_le64(ts->total_submit);
559 p.ts.total_complete = cpu_to_le64(ts->total_complete);
560
561 for (i = 0; i < 2; i++) {
562 p.ts.io_bytes[i] = cpu_to_le64(ts->io_bytes[i]);
563 p.ts.runtime[i] = cpu_to_le64(ts->runtime[i]);
564 }
565
566 p.ts.total_run_time = cpu_to_le64(ts->total_run_time);
567 p.ts.continue_on_error = cpu_to_le16(ts->continue_on_error);
568 p.ts.total_err_count = cpu_to_le64(ts->total_err_count);
569 p.ts.first_error = cpu_to_le32(ts->first_error);
570 p.ts.kb_base = cpu_to_le32(ts->kb_base);
571
572 convert_gs(&p.rs, rs);
573
574 fio_net_send_cmd(server_fd, FIO_NET_CMD_TS, &p, sizeof(p));
575}
576
577void fio_server_send_gs(struct group_run_stats *rs)
578{
579 struct group_run_stats gs;
580
581 dprint(FD_NET, "server sending group run stats\n");
582
583 convert_gs(&gs, rs);
584 fio_net_send_cmd(server_fd, FIO_NET_CMD_GS, &gs, sizeof(gs));
585}
586
587void fio_server_send_status(void)
588{
589 struct jobs_eta *je;
590 size_t size;
591 void *buf;
592 int i;
593
594 size = sizeof(*je) + thread_number * sizeof(char);
595 buf = malloc(size);
596 memset(buf, 0, size);
597 je = buf;
598
599 if (!calc_thread_status(je)) {
600 free(je);
601 return;
602 }
603
604 dprint(FD_NET, "server sending status\n");
605
606 je->nr_running = cpu_to_le32(je->nr_running);
607 je->nr_ramp = cpu_to_le32(je->nr_ramp);
608 je->nr_pending = cpu_to_le32(je->nr_pending);
609 je->files_open = cpu_to_le32(je->files_open);
610 je->m_rate = cpu_to_le32(je->m_rate);
611 je->t_rate = cpu_to_le32(je->t_rate);
612 je->m_iops = cpu_to_le32(je->m_iops);
613 je->t_iops = cpu_to_le32(je->t_iops);
614
615 for (i = 0; i < 2; i++) {
616 je->rate[i] = cpu_to_le32(je->rate[i]);
617 je->iops[i] = cpu_to_le32(je->iops[i]);
618 }
619
620 je->elapsed_sec = cpu_to_le32(je->nr_running);
621 je->eta_sec = cpu_to_le64(je->eta_sec);
622
623 fio_net_send_cmd(server_fd, FIO_NET_CMD_ETA, buf, size);
624 free(je);
625}
626
627int fio_server_log(const char *format, ...)
628{
629 char buffer[1024];
630 va_list args;
631 size_t len;
632
633 dprint(FD_NET, "server log\n");
634
635 va_start(args, format);
636 len = vsnprintf(buffer, sizeof(buffer), format, args);
637 va_end(args);
638
639 return fio_server_text_output(buffer, len);
640}
641
642static int fio_server(void)
643{
644 struct sockaddr_in saddr_in;
645 struct sockaddr addr;
646 fio_socklen_t len;
647 int sk, opt, ret;
648
649 dprint(FD_NET, "starting server\n");
650
651 sk = socket(AF_INET, SOCK_STREAM, 0);
652 if (sk < 0) {
653 log_err("fio: socket: %s\n", strerror(errno));
654 return -1;
655 }
656
657 opt = 1;
658 if (setsockopt(sk, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)) < 0) {
659 log_err("fio: setsockopt: %s\n", strerror(errno));
660 return -1;
661 }
662#ifdef SO_REUSEPORT
663 if (setsockopt(sk, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)) < 0) {
664 log_err("fio: setsockopt: %s\n", strerror(errno));
665 return -1;
666 }
667#endif
668
669 saddr_in.sin_family = AF_INET;
670 saddr_in.sin_addr.s_addr = htonl(INADDR_ANY);
671 saddr_in.sin_port = htons(fio_net_port);
672
673 if (bind(sk, (struct sockaddr *) &saddr_in, sizeof(saddr_in)) < 0) {
674 log_err("fio: bind: %s\n", strerror(errno));
675 return -1;
676 }
677
678 if (listen(sk, 1) < 0) {
679 log_err("fio: listen: %s\n", strerror(errno));
680 return -1;
681 }
682
683 len = sizeof(addr);
684 if (getsockname(sk, &addr, &len) < 0) {
685 log_err("fio: getsockname: %s\n", strerror(errno));
686 return -1;
687 }
688
689 ret = accept_loop(sk);
690 close(sk);
691 return ret;
692}
693
694static void sig_int(int sig)
695{
696 fio_terminate_threads(TERMINATE_ALL);
697 exit_backend = 1;
698}
699
700static void server_signal_handler(void)
701{
702 struct sigaction act;
703
704 memset(&act, 0, sizeof(act));
705 act.sa_handler = sig_int;
706 act.sa_flags = SA_RESTART;
707 sigaction(SIGINT, &act, NULL);
708
709 memset(&act, 0, sizeof(act));
710 act.sa_handler = sig_int;
711 act.sa_flags = SA_RESTART;
712 sigaction(SIGTERM, &act, NULL);
713}
714
715int fio_start_server(int daemonize)
716{
717 pid_t pid;
718
719 server_signal_handler();
720
721 if (!daemonize)
722 return fio_server();
723
724 openlog("fio", LOG_NDELAY|LOG_NOWAIT|LOG_PID, LOG_USER);
725 pid = fork();
726 if (pid < 0) {
727 syslog(LOG_ERR, "failed server fork");
728 return -1;
729 } else if (pid)
730 exit(0);
731
732 setsid();
733 close(STDIN_FILENO);
734 close(STDOUT_FILENO);
735 close(STDERR_FILENO);
736 f_out = NULL;
737 f_err = NULL;
738 log_syslog = 1;
739 return fio_server();
740}