Fio 1.99.1
[fio.git] / server.c
... / ...
CommitLineData
1#include <stdio.h>
2#include <stdlib.h>
3#include <stdarg.h>
4#include <unistd.h>
5#include <limits.h>
6#include <errno.h>
7#include <fcntl.h>
8#include <sys/poll.h>
9#include <sys/types.h>
10#include <sys/wait.h>
11#include <sys/socket.h>
12#include <netinet/in.h>
13#include <arpa/inet.h>
14#include <netdb.h>
15#include <syslog.h>
16#include <signal.h>
17
18#include "fio.h"
19#include "server.h"
20#include "crc/crc16.h"
21#include "ieee754.h"
22
/* TCP port the server binds its listening socket to */
int fio_net_port = 8765;

/* Set to non-zero to make the server's send/recv/poll loops stop */
int exit_backend = 0;

/* Socket of the currently connected client, or -1 when there is none */
static int server_fd = -1;
28
29int fio_send_data(int sk, const void *p, unsigned int len)
30{
31 assert(len <= sizeof(struct fio_net_cmd) + FIO_SERVER_MAX_PDU);
32
33 do {
34 int ret = send(sk, p, len, 0);
35
36 if (ret > 0) {
37 len -= ret;
38 if (!len)
39 break;
40 p += ret;
41 continue;
42 } else if (!ret)
43 break;
44 else if (errno == EAGAIN || errno == EINTR)
45 continue;
46 } while (!exit_backend);
47
48 if (!len)
49 return 0;
50
51 return 1;
52}
53
54int fio_recv_data(int sk, void *p, unsigned int len)
55{
56 do {
57 int ret = recv(sk, p, len, MSG_WAITALL);
58
59 if (ret > 0) {
60 len -= ret;
61 if (!len)
62 break;
63 p += ret;
64 continue;
65 } else if (!ret)
66 break;
67 else if (errno == EAGAIN || errno == EINTR)
68 continue;
69 } while (!exit_backend);
70
71 if (!len)
72 return 0;
73
74 return -1;
75}
76
77static int verify_convert_cmd(struct fio_net_cmd *cmd)
78{
79 uint16_t crc;
80
81 cmd->cmd_crc16 = le16_to_cpu(cmd->cmd_crc16);
82 cmd->pdu_crc16 = le16_to_cpu(cmd->pdu_crc16);
83
84 crc = crc16(cmd, FIO_NET_CMD_CRC_SZ);
85 if (crc != cmd->cmd_crc16) {
86 log_err("fio: server bad crc on command (got %x, wanted %x)\n",
87 cmd->cmd_crc16, crc);
88 return 1;
89 }
90
91 cmd->version = le16_to_cpu(cmd->version);
92 cmd->opcode = le16_to_cpu(cmd->opcode);
93 cmd->flags = le32_to_cpu(cmd->flags);
94 cmd->serial = le64_to_cpu(cmd->serial);
95 cmd->pdu_len = le32_to_cpu(cmd->pdu_len);
96
97 switch (cmd->version) {
98 case FIO_SERVER_VER2:
99 break;
100 default:
101 log_err("fio: bad server cmd version %d\n", cmd->version);
102 return 1;
103 }
104
105 if (cmd->pdu_len > FIO_SERVER_MAX_PDU) {
106 log_err("fio: command payload too large: %u\n", cmd->pdu_len);
107 return 1;
108 }
109
110 return 0;
111}
112
113/*
114 * Read (and defragment, if necessary) incoming commands
115 */
116struct fio_net_cmd *fio_net_recv_cmd(int sk)
117{
118 struct fio_net_cmd cmd, *cmdret = NULL;
119 size_t cmd_size = 0, pdu_offset = 0;
120 uint16_t crc;
121 int ret, first = 1;
122 void *pdu = NULL;
123
124 do {
125 ret = fio_recv_data(sk, &cmd, sizeof(cmd));
126 if (ret)
127 break;
128
129 /* We have a command, verify it and swap if need be */
130 ret = verify_convert_cmd(&cmd);
131 if (ret)
132 break;
133
134 if (first) {
135 /* if this is text, add room for \0 at the end */
136 cmd_size = sizeof(cmd) + cmd.pdu_len + 1;
137 assert(!cmdret);
138 } else
139 cmd_size += cmd.pdu_len;
140
141 cmdret = realloc(cmdret, cmd_size);
142
143 if (first)
144 memcpy(cmdret, &cmd, sizeof(cmd));
145 else
146 assert(cmdret->opcode == cmd.opcode);
147
148 if (!cmd.pdu_len)
149 break;
150
151 /* There's payload, get it */
152 pdu = (void *) cmdret->payload + pdu_offset;
153 ret = fio_recv_data(sk, pdu, cmd.pdu_len);
154 if (ret)
155 break;
156
157 /* Verify payload crc */
158 crc = crc16(pdu, cmd.pdu_len);
159 if (crc != cmd.pdu_crc16) {
160 log_err("fio: server bad crc on payload ");
161 log_err("(got %x, wanted %x)\n", cmd.pdu_crc16, crc);
162 ret = 1;
163 break;
164 }
165
166 pdu_offset += cmd.pdu_len;
167 if (!first)
168 cmdret->pdu_len += cmd.pdu_len;
169 first = 0;
170 } while (cmd.flags & FIO_NET_CMD_F_MORE);
171
172 if (ret) {
173 free(cmdret);
174 cmdret = NULL;
175 } else if (cmdret) {
176 /* zero-terminate text input */
177 if (cmdret->pdu_len && (cmdret->opcode == FIO_NET_CMD_TEXT ||
178 cmdret->opcode == FIO_NET_CMD_JOB)) {
179 char *buf = (char *) cmdret->payload;
180
181 buf[cmdret->pdu_len ] = '\0';
182 }
183 /* frag flag is internal */
184 cmdret->flags &= ~FIO_NET_CMD_F_MORE;
185 }
186
187 return cmdret;
188}
189
190void fio_net_cmd_crc(struct fio_net_cmd *cmd)
191{
192 uint32_t pdu_len;
193
194 cmd->cmd_crc16 = __cpu_to_le16(crc16(cmd, FIO_NET_CMD_CRC_SZ));
195
196 pdu_len = le32_to_cpu(cmd->pdu_len);
197 if (pdu_len)
198 cmd->pdu_crc16 = __cpu_to_le16(crc16(cmd->payload, pdu_len));
199}
200
201int fio_net_send_cmd(int fd, uint16_t opcode, const void *buf, off_t size)
202{
203 struct fio_net_cmd *cmd;
204 size_t this_len;
205 int ret;
206
207 do {
208 this_len = size;
209 if (this_len > FIO_SERVER_MAX_PDU)
210 this_len = FIO_SERVER_MAX_PDU;
211
212 cmd = malloc(sizeof(*cmd) + this_len);
213
214 fio_init_net_cmd(cmd, opcode, buf, this_len);
215
216 if (this_len < size)
217 cmd->flags = __cpu_to_le32(FIO_NET_CMD_F_MORE);
218
219 fio_net_cmd_crc(cmd);
220
221 ret = fio_send_data(fd, cmd, sizeof(*cmd) + this_len);
222 free(cmd);
223 size -= this_len;
224 buf += this_len;
225 } while (!ret && size);
226
227 return ret;
228}
229
230int fio_net_send_simple_cmd(int sk, uint16_t opcode, uint64_t serial)
231{
232 struct fio_net_cmd cmd;
233
234 fio_init_net_cmd(&cmd, opcode, NULL, 0);
235 fio_net_cmd_crc(&cmd);
236
237 return fio_send_data(sk, &cmd, sizeof(cmd));
238}
239
240static int fio_server_send_quit_cmd(void)
241{
242 dprint(FD_NET, "server: sending quit\n");
243 return fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_QUIT, 0);
244}
245
246static int handle_job_cmd(struct fio_net_cmd *cmd)
247{
248 char *buf = (char *) cmd->payload;
249 int ret;
250
251 if (parse_jobs_ini(buf, 1, 0)) {
252 fio_server_send_quit_cmd();
253 return -1;
254 }
255
256 fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_START, 0);
257
258 ret = exec_run();
259 fio_server_send_quit_cmd();
260 reset_fio_state();
261 return ret;
262}
263
264static int handle_jobline_cmd(struct fio_net_cmd *cmd)
265{
266 struct cmd_line_pdu *pdu = (struct cmd_line_pdu *) cmd->payload;
267 char *argv[FIO_NET_CMD_JOBLINE_ARGV];
268 int ret, i;
269
270 pdu->argc = le16_to_cpu(pdu->argc);
271
272 dprint(FD_NET, "server: %d command line args\n", pdu->argc);
273
274 for (i = 0; i < pdu->argc; i++) {
275 argv[i] = (char *) pdu->argv[i];
276 dprint(FD_NET, "server: %d: %s\n", i, argv[i]);
277 }
278
279 if (parse_cmd_line(pdu->argc, argv)) {
280 fio_server_send_quit_cmd();
281 return -1;
282 }
283
284 fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_START, 0);
285
286 ret = exec_run();
287 fio_server_send_quit_cmd();
288 reset_fio_state();
289 return ret;
290}
291
292static int handle_probe_cmd(struct fio_net_cmd *cmd)
293{
294 struct cmd_probe_pdu probe;
295
296 memset(&probe, 0, sizeof(probe));
297 gethostname((char *) probe.hostname, sizeof(probe.hostname));
298#ifdef FIO_BIG_ENDIAN
299 probe.bigendian = 1;
300#endif
301 probe.fio_major = FIO_MAJOR;
302 probe.fio_minor = FIO_MINOR;
303 probe.fio_patch = FIO_PATCH;
304
305 return fio_net_send_cmd(server_fd, FIO_NET_CMD_PROBE, &probe, sizeof(probe));
306}
307
308static int handle_command(struct fio_net_cmd *cmd)
309{
310 int ret;
311
312 dprint(FD_NET, "server: got opcode %d\n", cmd->opcode);
313
314 switch (cmd->opcode) {
315 case FIO_NET_CMD_QUIT:
316 fio_terminate_threads(TERMINATE_ALL);
317 return -1;
318 case FIO_NET_CMD_EXIT:
319 exit_backend = 1;
320 return -1;
321 case FIO_NET_CMD_JOB:
322 ret = handle_job_cmd(cmd);
323 break;
324 case FIO_NET_CMD_JOBLINE:
325 ret = handle_jobline_cmd(cmd);
326 break;
327 case FIO_NET_CMD_PROBE:
328 ret = handle_probe_cmd(cmd);
329 break;
330 default:
331 log_err("fio: unknown opcode: %d\n", cmd->opcode);
332 ret = 1;
333 }
334
335 return ret;
336}
337
338static int handle_connection(int sk, int block)
339{
340 struct fio_net_cmd *cmd = NULL;
341 int ret = 0;
342
343 /* read forever */
344 while (!exit_backend) {
345 struct pollfd pfd = {
346 .fd = sk,
347 .events = POLLIN,
348 };
349
350 ret = 0;
351 do {
352 ret = poll(&pfd, 1, 100);
353 if (ret < 0) {
354 if (errno == EINTR)
355 break;
356 log_err("fio: poll: %s\n", strerror(errno));
357 break;
358 } else if (!ret) {
359 if (!block)
360 return 0;
361 continue;
362 }
363
364 if (pfd.revents & POLLIN)
365 break;
366 if (pfd.revents & (POLLERR|POLLHUP)) {
367 ret = 1;
368 break;
369 }
370 } while (!exit_backend);
371
372 if (ret < 0)
373 break;
374
375 cmd = fio_net_recv_cmd(sk);
376 if (!cmd) {
377 ret = -1;
378 break;
379 }
380
381 ret = handle_command(cmd);
382 if (ret)
383 break;
384
385 free(cmd);
386 cmd = NULL;
387 }
388
389 if (cmd)
390 free(cmd);
391
392 return ret;
393}
394
395void fio_server_idle_loop(void)
396{
397 if (server_fd != -1)
398 handle_connection(server_fd, 0);
399}
400
401static int accept_loop(int listen_sk)
402{
403 struct sockaddr_in addr;
404 fio_socklen_t len = sizeof(addr);
405 struct pollfd pfd;
406 int ret, sk, flags, exitval = 0;
407
408 dprint(FD_NET, "server enter accept loop\n");
409
410 flags = fcntl(listen_sk, F_GETFL);
411 flags |= O_NONBLOCK;
412 fcntl(listen_sk, F_SETFL, flags);
413again:
414 pfd.fd = listen_sk;
415 pfd.events = POLLIN;
416 do {
417 ret = poll(&pfd, 1, 100);
418 if (ret < 0) {
419 if (errno == EINTR)
420 break;
421 log_err("fio: poll: %s\n", strerror(errno));
422 goto out;
423 } else if (!ret)
424 continue;
425
426 if (pfd.revents & POLLIN)
427 break;
428 } while (!exit_backend);
429
430 if (exit_backend)
431 goto out;
432
433 sk = accept(listen_sk, (struct sockaddr *) &addr, &len);
434 if (sk < 0) {
435 log_err("fio: accept: %s\n", strerror(errno));
436 return -1;
437 }
438
439 dprint(FD_NET, "server: connect from %s\n", inet_ntoa(addr.sin_addr));
440
441 server_fd = sk;
442
443 exitval = handle_connection(sk, 1);
444
445 server_fd = -1;
446 close(sk);
447
448 if (!exit_backend)
449 goto again;
450
451out:
452 return exitval;
453}
454
455int fio_server_text_output(const char *buf, unsigned int len)
456{
457 if (server_fd != -1)
458 return fio_net_send_cmd(server_fd, FIO_NET_CMD_TEXT, buf, len);
459
460 return fwrite(buf, len, 1, f_err);
461}
462
463static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
464{
465 dst->max_val = cpu_to_le64(src->max_val);
466 dst->min_val = cpu_to_le64(src->min_val);
467 dst->samples = cpu_to_le64(src->samples);
468
469 /*
470 * Encode to IEEE 754 for network transfer
471 */
472 dst->mean.u.i = __cpu_to_le64(fio_double_to_uint64(src->mean.u.f));
473 dst->S.u.i = __cpu_to_le64(fio_double_to_uint64(src->S.u.f));
474}
475
476static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
477{
478 int i;
479
480 for (i = 0; i < 2; i++) {
481 dst->max_run[i] = cpu_to_le64(src->max_run[i]);
482 dst->min_run[i] = cpu_to_le64(src->min_run[i]);
483 dst->max_bw[i] = cpu_to_le64(src->max_bw[i]);
484 dst->min_bw[i] = cpu_to_le64(src->min_bw[i]);
485 dst->io_kb[i] = cpu_to_le64(src->io_kb[i]);
486 dst->agg[i] = cpu_to_le64(src->agg[i]);
487 }
488
489 dst->kb_base = cpu_to_le32(src->kb_base);
490 dst->groupid = cpu_to_le32(src->groupid);
491}
492
493/*
494 * Send a CMD_TS, which packs struct thread_stat and group_run_stats
495 * into a single payload.
496 */
497void fio_server_send_ts(struct thread_stat *ts, struct group_run_stats *rs)
498{
499 struct cmd_ts_pdu p;
500 int i, j;
501
502 dprint(FD_NET, "server sending end stats\n");
503
504 memset(&p, 0, sizeof(p));
505
506 strcpy(p.ts.name, ts->name);
507 strcpy(p.ts.verror, ts->verror);
508 strcpy(p.ts.description, ts->description);
509
510 p.ts.error = cpu_to_le32(ts->error);
511 p.ts.groupid = cpu_to_le32(ts->groupid);
512 p.ts.pid = cpu_to_le32(ts->pid);
513 p.ts.members = cpu_to_le32(ts->members);
514
515 for (i = 0; i < 2; i++) {
516 convert_io_stat(&p.ts.clat_stat[i], &ts->clat_stat[i]);
517 convert_io_stat(&p.ts.slat_stat[i], &ts->slat_stat[i]);
518 convert_io_stat(&p.ts.lat_stat[i], &ts->lat_stat[i]);
519 convert_io_stat(&p.ts.bw_stat[i], &ts->bw_stat[i]);
520 }
521
522 p.ts.usr_time = cpu_to_le64(ts->usr_time);
523 p.ts.sys_time = cpu_to_le64(ts->sys_time);
524 p.ts.ctx = cpu_to_le64(ts->ctx);
525 p.ts.minf = cpu_to_le64(ts->minf);
526 p.ts.majf = cpu_to_le64(ts->majf);
527 p.ts.clat_percentiles = cpu_to_le64(ts->clat_percentiles);
528
529 for (i = 0; i < FIO_IO_U_LIST_MAX_LEN; i++) {
530 fio_fp64_t *fp = &p.ts.percentile_list[i];
531
532 fp->u.i = __cpu_to_le64(fio_double_to_uint64(fp->u.f));
533 }
534
535 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
536 p.ts.io_u_map[i] = cpu_to_le32(ts->io_u_map[i]);
537 p.ts.io_u_submit[i] = cpu_to_le32(ts->io_u_submit[i]);
538 p.ts.io_u_complete[i] = cpu_to_le32(ts->io_u_complete[i]);
539 }
540
541 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
542 p.ts.io_u_lat_u[i] = cpu_to_le32(ts->io_u_lat_u[i]);
543 p.ts.io_u_lat_m[i] = cpu_to_le32(ts->io_u_lat_m[i]);
544 }
545
546 for (i = 0; i < 2; i++)
547 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
548 p.ts.io_u_plat[i][j] = cpu_to_le32(ts->io_u_plat[i][j]);
549
550 for (i = 0; i < 3; i++) {
551 p.ts.total_io_u[i] = cpu_to_le64(ts->total_io_u[i]);
552 p.ts.short_io_u[i] = cpu_to_le64(ts->short_io_u[i]);
553 }
554
555 p.ts.total_submit = cpu_to_le64(ts->total_submit);
556 p.ts.total_complete = cpu_to_le64(ts->total_complete);
557
558 for (i = 0; i < 2; i++) {
559 p.ts.io_bytes[i] = cpu_to_le64(ts->io_bytes[i]);
560 p.ts.runtime[i] = cpu_to_le64(ts->runtime[i]);
561 }
562
563 p.ts.total_run_time = cpu_to_le64(ts->total_run_time);
564 p.ts.continue_on_error = cpu_to_le16(ts->continue_on_error);
565 p.ts.total_err_count = cpu_to_le64(ts->total_err_count);
566 p.ts.first_error = cpu_to_le32(ts->first_error);
567 p.ts.kb_base = cpu_to_le32(ts->kb_base);
568
569 convert_gs(&p.rs, rs);
570
571 fio_net_send_cmd(server_fd, FIO_NET_CMD_TS, &p, sizeof(p));
572}
573
574void fio_server_send_gs(struct group_run_stats *rs)
575{
576 struct group_run_stats gs;
577
578 dprint(FD_NET, "server sending group run stats\n");
579
580 convert_gs(&gs, rs);
581 fio_net_send_cmd(server_fd, FIO_NET_CMD_GS, &gs, sizeof(gs));
582}
583
584void fio_server_send_status(void)
585{
586 struct jobs_eta *je;
587 size_t size;
588 void *buf;
589 int i;
590
591 size = sizeof(*je) + thread_number * sizeof(char);
592 buf = malloc(size);
593 memset(buf, 0, size);
594 je = buf;
595
596 if (!calc_thread_status(je)) {
597 free(je);
598 return;
599 }
600
601 dprint(FD_NET, "server sending status\n");
602
603 je->nr_running = cpu_to_le32(je->nr_running);
604 je->nr_ramp = cpu_to_le32(je->nr_ramp);
605 je->nr_pending = cpu_to_le32(je->nr_pending);
606 je->files_open = cpu_to_le32(je->files_open);
607 je->m_rate = cpu_to_le32(je->m_rate);
608 je->t_rate = cpu_to_le32(je->t_rate);
609 je->m_iops = cpu_to_le32(je->m_iops);
610 je->t_iops = cpu_to_le32(je->t_iops);
611
612 for (i = 0; i < 2; i++) {
613 je->rate[i] = cpu_to_le32(je->rate[i]);
614 je->iops[i] = cpu_to_le32(je->iops[i]);
615 }
616
617 je->elapsed_sec = cpu_to_le32(je->nr_running);
618 je->eta_sec = cpu_to_le64(je->eta_sec);
619
620 fio_net_send_cmd(server_fd, FIO_NET_CMD_ETA, buf, size);
621 free(je);
622}
623
624int fio_server_log(const char *format, ...)
625{
626 char buffer[1024];
627 va_list args;
628 size_t len;
629
630 dprint(FD_NET, "server log\n");
631
632 va_start(args, format);
633 len = vsnprintf(buffer, sizeof(buffer), format, args);
634 va_end(args);
635
636 return fio_server_text_output(buffer, len);
637}
638
639static int fio_server(void)
640{
641 struct sockaddr_in saddr_in;
642 struct sockaddr addr;
643 fio_socklen_t len;
644 int sk, opt, ret;
645
646 dprint(FD_NET, "starting server\n");
647
648 sk = socket(AF_INET, SOCK_STREAM, 0);
649 if (sk < 0) {
650 log_err("fio: socket: %s\n", strerror(errno));
651 return -1;
652 }
653
654 opt = 1;
655 if (setsockopt(sk, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)) < 0) {
656 log_err("fio: setsockopt: %s\n", strerror(errno));
657 return -1;
658 }
659#ifdef SO_REUSEPORT
660 if (setsockopt(sk, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)) < 0) {
661 log_err("fio: setsockopt: %s\n", strerror(errno));
662 return -1;
663 }
664#endif
665
666 saddr_in.sin_family = AF_INET;
667 saddr_in.sin_addr.s_addr = htonl(INADDR_ANY);
668 saddr_in.sin_port = htons(fio_net_port);
669
670 if (bind(sk, (struct sockaddr *) &saddr_in, sizeof(saddr_in)) < 0) {
671 log_err("fio: bind: %s\n", strerror(errno));
672 return -1;
673 }
674
675 if (listen(sk, 1) < 0) {
676 log_err("fio: listen: %s\n", strerror(errno));
677 return -1;
678 }
679
680 len = sizeof(addr);
681 if (getsockname(sk, &addr, &len) < 0) {
682 log_err("fio: getsockname: %s\n", strerror(errno));
683 return -1;
684 }
685
686 ret = accept_loop(sk);
687 close(sk);
688 return ret;
689}
690
691static void sig_int(int sig)
692{
693 fio_terminate_threads(TERMINATE_ALL);
694 exit_backend = 1;
695}
696
697static void server_signal_handler(void)
698{
699 struct sigaction act;
700
701 memset(&act, 0, sizeof(act));
702 act.sa_handler = sig_int;
703 act.sa_flags = SA_RESTART;
704 sigaction(SIGINT, &act, NULL);
705
706 memset(&act, 0, sizeof(act));
707 act.sa_handler = sig_int;
708 act.sa_flags = SA_RESTART;
709 sigaction(SIGTERM, &act, NULL);
710}
711
712int fio_start_server(int daemonize)
713{
714 pid_t pid;
715
716 server_signal_handler();
717
718 if (!daemonize)
719 return fio_server();
720
721 openlog("fio", LOG_NDELAY|LOG_NOWAIT|LOG_PID, LOG_USER);
722 pid = fork();
723 if (pid < 0) {
724 syslog(LOG_ERR, "failed server fork");
725 return -1;
726 } else if (pid)
727 exit(0);
728
729 setsid();
730 close(STDIN_FILENO);
731 close(STDOUT_FILENO);
732 close(STDERR_FILENO);
733 f_out = NULL;
734 f_err = NULL;
735 log_syslog = 1;
736 return fio_server();
737}