server: attempt to handle client ctrl-c
[fio.git] / server.c
CommitLineData
50d16976
JA
1#include <stdio.h>
2#include <stdlib.h>
142575e6 3#include <stdarg.h>
50d16976
JA
4#include <unistd.h>
5#include <limits.h>
50d16976
JA
6#include <errno.h>
7#include <fcntl.h>
8#include <sys/poll.h>
50d16976
JA
9#include <sys/types.h>
10#include <sys/wait.h>
50d16976 11#include <sys/mman.h>
50d16976
JA
12#include <netinet/in.h>
13#include <arpa/inet.h>
14#include <netdb.h>
e46d8091 15#include <syslog.h>
50d16976
JA
16
17#include "fio.h"
132159a5 18#include "server.h"
fcee5ff6 19#include "crc/crc16.h"
50d16976 20
/* TCP port the server binds its listening socket to */
int fio_net_port = 8765;

/* Checked by the send/receive/accept loops; non-zero makes them stop */
int exit_backend = 0;

/* Socket of the client currently being served, -1 when there is none */
static int server_fd = -1;
37db14fe 26
132159a5
JA
27int fio_send_data(int sk, const void *p, unsigned int len)
28{
794d69ca
JA
29 assert(len <= sizeof(struct fio_net_cmd) + FIO_SERVER_MAX_PDU);
30
132159a5
JA
31 do {
32 int ret = send(sk, p, len, 0);
33
34 if (ret > 0) {
35 len -= ret;
36 if (!len)
37 break;
38 p += ret;
39 continue;
40 } else if (!ret)
41 break;
42 else if (errno == EAGAIN || errno == EINTR)
43 continue;
44 } while (!exit_backend);
45
46 if (!len)
47 return 0;
48
49 return 1;
50}
51
52int fio_recv_data(int sk, void *p, unsigned int len)
53{
54 do {
55 int ret = recv(sk, p, len, MSG_WAITALL);
56
57 if (ret > 0) {
58 len -= ret;
59 if (!len)
60 break;
61 p += ret;
62 continue;
63 } else if (!ret)
64 break;
65 else if (errno == EAGAIN || errno == EINTR)
66 continue;
67 } while (!exit_backend);
68
69 if (!len)
70 return 0;
71
72 return -1;
73}
74
75static int verify_convert_cmd(struct fio_net_cmd *cmd)
76{
fcee5ff6 77 uint16_t crc;
132159a5 78
fcee5ff6
JA
79 cmd->cmd_crc16 = le16_to_cpu(cmd->cmd_crc16);
80 cmd->pdu_crc16 = le16_to_cpu(cmd->pdu_crc16);
132159a5 81
fcee5ff6
JA
82 crc = crc16(cmd, FIO_NET_CMD_CRC_SZ);
83 if (crc != cmd->cmd_crc16) {
132159a5 84 log_err("fio: server bad crc on command (got %x, wanted %x)\n",
fcee5ff6 85 cmd->cmd_crc16, crc);
132159a5
JA
86 return 1;
87 }
88
89 cmd->version = le16_to_cpu(cmd->version);
90 cmd->opcode = le16_to_cpu(cmd->opcode);
91 cmd->flags = le32_to_cpu(cmd->flags);
92 cmd->serial = le64_to_cpu(cmd->serial);
93 cmd->pdu_len = le32_to_cpu(cmd->pdu_len);
94
95 switch (cmd->version) {
96 case FIO_SERVER_VER1:
97 break;
98 default:
99 log_err("fio: bad server cmd version %d\n", cmd->version);
100 return 1;
101 }
102
103 if (cmd->pdu_len > FIO_SERVER_MAX_PDU) {
104 log_err("fio: command payload too large: %u\n", cmd->pdu_len);
105 return 1;
106 }
107
108 return 0;
109}
110
a64e88da
JA
111/*
112 * Read (and defragment, if necessary) incoming commands
113 */
114struct fio_net_cmd *fio_net_recv_cmd(int sk)
132159a5 115{
a64e88da
JA
116 struct fio_net_cmd cmd, *cmdret = NULL;
117 size_t cmd_size = 0, pdu_offset = 0;
fcee5ff6 118 uint16_t crc;
a64e88da
JA
119 int ret, first = 1;
120 void *pdu = NULL;
132159a5 121
a64e88da 122 do {
cc0df00a
JA
123 struct pollfd pfd;
124
125 pfd.fd = sk;
126 pfd.events = POLLIN;
127 ret = 0;
128 do {
129 ret = poll(&pfd, 1, 100);
130 if (ret < 0) {
131 log_err("fio: poll: %s\n", strerror(errno));
132 break;
133 } else if (!ret)
134 continue;
135
136 if (pfd.revents & POLLIN)
137 break;
138 if (pfd.revents & (POLLERR|POLLHUP)) {
139 ret = 1;
140 break;
141 }
142 } while (ret >= 0);
143
144 if (ret < 0)
145 break;
146
a64e88da
JA
147 ret = fio_recv_data(sk, &cmd, sizeof(cmd));
148 if (ret)
149 break;
132159a5 150
a64e88da
JA
151 /* We have a command, verify it and swap if need be */
152 ret = verify_convert_cmd(&cmd);
153 if (ret)
154 break;
132159a5 155
a64e88da
JA
156 if (first)
157 cmd_size = sizeof(cmd) + cmd.pdu_len;
158 else
159 cmd_size += cmd.pdu_len;
132159a5 160
a64e88da 161 cmdret = realloc(cmdret, cmd_size);
132159a5 162
a64e88da
JA
163 if (first)
164 memcpy(cmdret, &cmd, sizeof(cmd));
165 else
166 assert(cmdret->opcode == cmd.opcode);
167
168 if (!cmd.pdu_len)
169 break;
170
171 /* There's payload, get it */
172 pdu = (void *) cmdret->payload + pdu_offset;
173 ret = fio_recv_data(sk, pdu, cmd.pdu_len);
174 if (ret)
175 break;
176
177 /* Verify payload crc */
178 crc = crc16(pdu, cmd.pdu_len);
179 if (crc != cmd.pdu_crc16) {
180 log_err("fio: server bad crc on payload ");
181 log_err("(got %x, wanted %x)\n", cmd.pdu_crc16, crc);
182 ret = 1;
183 break;
184 }
185
186 pdu_offset += cmd.pdu_len;
817f06bb
JA
187 if (!first)
188 cmdret->pdu_len += cmd.pdu_len;
a64e88da
JA
189 first = 0;
190 } while (cmd.flags & FIO_NET_CMD_F_MORE);
132159a5 191
a64e88da
JA
192 if (ret) {
193 free(cmdret);
194 cmdret = NULL;
cc0df00a 195 } else if (cmdret)
a64e88da
JA
196 cmdret->flags &= ~FIO_NET_CMD_F_MORE;
197
198 return cmdret;
132159a5
JA
199}
200
201void fio_net_cmd_crc(struct fio_net_cmd *cmd)
202{
203 uint32_t pdu_len;
204
ddcc0b69 205 cmd->cmd_crc16 = __cpu_to_le16(crc16(cmd, FIO_NET_CMD_CRC_SZ));
132159a5
JA
206
207 pdu_len = le32_to_cpu(cmd->pdu_len);
208 if (pdu_len)
ddcc0b69 209 cmd->pdu_crc16 = __cpu_to_le16(crc16(cmd->payload, pdu_len));
132159a5
JA
210}
211
a64e88da 212int fio_net_send_cmd(int fd, uint16_t opcode, const void *buf, off_t size)
794d69ca
JA
213{
214 struct fio_net_cmd *cmd;
215 size_t this_len;
216 int ret;
217
218 do {
219 this_len = size;
220 if (this_len > FIO_SERVER_MAX_PDU)
221 this_len = FIO_SERVER_MAX_PDU;
222
223 cmd = malloc(sizeof(*cmd) + this_len);
224
225 fio_init_net_cmd(cmd, opcode, buf, this_len);
226
227 if (this_len < size)
ddcc0b69 228 cmd->flags = __cpu_to_le32(FIO_NET_CMD_F_MORE);
794d69ca
JA
229
230 fio_net_cmd_crc(cmd);
231
232 ret = fio_send_data(fd, cmd, sizeof(*cmd) + this_len);
233 free(cmd);
234 size -= this_len;
235 buf += this_len;
236 } while (!ret && size);
237
238 return ret;
239}
240
cc0df00a 241int fio_net_send_simple_cmd(int sk, uint16_t opcode, uint64_t serial)
132159a5
JA
242{
243 struct fio_net_cmd cmd = {
ddcc0b69 244 .version = __cpu_to_le16(FIO_SERVER_VER1),
132159a5 245 .opcode = cpu_to_le16(opcode),
bdab4441 246 .serial = cpu_to_le64(serial),
132159a5
JA
247 };
248
249 fio_net_cmd_crc(&cmd);
250
251 return fio_send_data(sk, &cmd, sizeof(cmd));
252}
253
437377e1
JA
254static int send_quit_command(void)
255{
46c48f1f 256 dprint(FD_NET, "server: sending quit\n");
cc0df00a 257 return fio_net_send_simple_cmd(server_fd, FIO_NET_CMD_QUIT, 0);
437377e1
JA
258}
259
794d69ca 260static int handle_cur_job(struct fio_net_cmd *cmd)
132159a5 261{
a64e88da
JA
262 void *buf = cmd->payload;
263 int ret;
132159a5 264
a64e88da 265 parse_jobs_ini(buf, 1, 0);
794d69ca
JA
266 ret = exec_run();
267 send_quit_command();
268 reset_fio_state();
132159a5
JA
269 return ret;
270}
271
272static int handle_command(struct fio_net_cmd *cmd)
273{
274 int ret;
275
46c48f1f
JA
276 dprint(FD_NET, "server: got opcode %d\n", cmd->opcode);
277
132159a5
JA
278 switch (cmd->opcode) {
279 case FIO_NET_CMD_QUIT:
cc0df00a 280 fio_terminate_threads(TERMINATE_ALL);
d7959186
JA
281 return 1;
282 case FIO_NET_CMD_EXIT:
132159a5
JA
283 exit_backend = 1;
284 return 1;
285 case FIO_NET_CMD_ACK:
286 return 0;
287 case FIO_NET_CMD_NAK:
288 return 1;
289 case FIO_NET_CMD_JOB:
794d69ca 290 ret = handle_cur_job(cmd);
132159a5
JA
291 break;
292 default:
293 log_err("fio: unknown opcode: %d\n", cmd->opcode);
294 ret = 1;
295 }
296
297 return ret;
298}
299
300static int handle_connection(int sk)
301{
302 struct fio_net_cmd *cmd = NULL;
303 int ret = 0;
304
305 /* read forever */
306 while (!exit_backend) {
a64e88da 307 cmd = fio_net_recv_cmd(sk);
132159a5
JA
308 if (!cmd) {
309 ret = 1;
310 break;
311 }
312
132159a5
JA
313 ret = handle_command(cmd);
314 if (ret)
315 break;
316
317 free(cmd);
c77a99e7 318 cmd = NULL;
132159a5
JA
319 }
320
321 if (cmd)
322 free(cmd);
323
324 return ret;
325}
326
cc0df00a
JA
327void fio_server_idle_loop(void)
328{
329 if (server_fd != -1)
330 handle_connection(server_fd);
331}
332
50d16976
JA
333static int accept_loop(int listen_sk)
334{
335 struct sockaddr addr;
336 unsigned int len = sizeof(addr);
009b1be4 337 struct pollfd pfd;
132159a5 338 int ret, sk, flags, exitval = 0;
50d16976 339
009b1be4
JA
340 flags = fcntl(listen_sk, F_GETFL);
341 flags |= O_NONBLOCK;
342 fcntl(listen_sk, F_SETFL, flags);
50d16976 343again:
009b1be4
JA
344 pfd.fd = listen_sk;
345 pfd.events = POLLIN;
346 do {
347 ret = poll(&pfd, 1, 100);
348 if (ret < 0) {
349 if (errno == EINTR)
350 break;
fcee5ff6 351 log_err("fio: poll: %s\n", strerror(errno));
009b1be4
JA
352 goto out;
353 } else if (!ret)
354 continue;
355
356 if (pfd.revents & POLLIN)
357 break;
358 } while (!exit_backend);
359
360 if (exit_backend)
361 goto out;
362
50d16976 363 sk = accept(listen_sk, &addr, &len);
50d16976 364 if (sk < 0) {
690e09ae 365 log_err("fio: accept: %s\n", strerror(errno));
50d16976
JA
366 return -1;
367 }
368
46c48f1f
JA
369 dprint(FD_NET, "server got a connection\n");
370
37db14fe
JA
371 server_fd = sk;
372
cc0df00a
JA
373 printf("handle\n");
374
132159a5 375 exitval = handle_connection(sk);
50d16976 376
cc0df00a
JA
377 printf("out, exit %d\n", exitval);
378
37db14fe 379 server_fd = -1;
50d16976 380 close(sk);
5c341e9a 381
009b1be4 382 if (!exit_backend)
5c341e9a
JA
383 goto again;
384
009b1be4 385out:
132159a5 386 return exitval;
50d16976
JA
387}
388
e46d8091 389static int fio_server(void)
50d16976
JA
390{
391 struct sockaddr_in saddr_in;
392 struct sockaddr addr;
393 unsigned int len;
afcf7758 394 int sk, opt, ret;
50d16976 395
46c48f1f
JA
396 dprint(FD_NET, "starting server\n");
397
50d16976
JA
398 sk = socket(AF_INET, SOCK_STREAM, 0);
399 if (sk < 0) {
690e09ae 400 log_err("fio: socket: %s\n", strerror(errno));
50d16976
JA
401 return -1;
402 }
403
404 opt = 1;
405 if (setsockopt(sk, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)) < 0) {
690e09ae 406 log_err("fio: setsockopt: %s\n", strerror(errno));
50d16976
JA
407 return -1;
408 }
409#ifdef SO_REUSEPORT
410 if (setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)) < 0) {
690e09ae 411 log_err("fio: setsockopt: %s\n", strerror(errno));
50d16976
JA
412 return 1;
413 }
414#endif
415
416 saddr_in.sin_family = AF_INET;
417 saddr_in.sin_addr.s_addr = htonl(INADDR_ANY);
132159a5 418 saddr_in.sin_port = htons(fio_net_port);
50d16976
JA
419
420 if (bind(sk, (struct sockaddr *) &saddr_in, sizeof(saddr_in)) < 0) {
690e09ae 421 log_err("fio: bind: %s\n", strerror(errno));
50d16976
JA
422 return -1;
423 }
424
425 if (listen(sk, 1) < 0) {
690e09ae 426 log_err("fio: listen: %s\n", strerror(errno));
50d16976
JA
427 return -1;
428 }
429
430 len = sizeof(addr);
431 if (getsockname(sk, &addr, &len) < 0) {
690e09ae 432 log_err("fio: getsockname: %s\n", strerror(errno));
50d16976
JA
433 return -1;
434 }
435
afcf7758
JA
436 ret = accept_loop(sk);
437 close(sk);
438 return ret;
50d16976 439}
37db14fe 440
142575e6 441int fio_server_text_output(const char *buf, unsigned int len)
37db14fe 442{
337d75a8
JA
443 if (server_fd != -1)
444 return fio_net_send_cmd(server_fd, FIO_NET_CMD_TEXT, buf, len);
445
446 return 0;
142575e6
JA
447}
448
a64e88da
JA
449static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
450{
451 dst->max_val = cpu_to_le64(src->max_val);
452 dst->min_val = cpu_to_le64(src->min_val);
453 dst->samples = cpu_to_le64(src->samples);
454 /* FIXME */
ddcc0b69
JA
455 dst->mean = __cpu_to_le64(src->mean);
456 dst->S = __cpu_to_le64(src->S);
a64e88da
JA
457}
458
459static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
460{
461 int i;
462
463 for (i = 0; i < 2; i++) {
464 dst->max_run[i] = cpu_to_le64(src->max_run[i]);
465 dst->min_run[i] = cpu_to_le64(src->min_run[i]);
466 dst->max_bw[i] = cpu_to_le64(src->max_bw[i]);
467 dst->min_bw[i] = cpu_to_le64(src->min_bw[i]);
468 dst->io_kb[i] = cpu_to_le64(src->io_kb[i]);
469 dst->agg[i] = cpu_to_le64(src->agg[i]);
470 }
471
472 dst->kb_base = cpu_to_le32(src->kb_base);
473 dst->groupid = cpu_to_le32(src->groupid);
474}
475
476/*
477 * Send a CMD_TS, which packs struct thread_stat and group_run_stats
478 * into a single payload.
479 */
480void fio_server_send_ts(struct thread_stat *ts, struct group_run_stats *rs)
481{
482 struct cmd_ts_pdu p;
483 int i, j;
484
485 strcpy(p.ts.name, ts->name);
486 strcpy(p.ts.verror, ts->verror);
487 strcpy(p.ts.description, ts->description);
488
ddcc0b69 489 p.ts.error = cpu_to_le32(ts->error);
a64e88da 490 p.ts.groupid = cpu_to_le32(ts->groupid);
ddcc0b69 491 p.ts.pid = cpu_to_le32(ts->pid);
a64e88da
JA
492 p.ts.members = cpu_to_le32(ts->members);
493
494 for (i = 0; i < 2; i++) {
495 convert_io_stat(&p.ts.clat_stat[i], &ts->clat_stat[i]);
496 convert_io_stat(&p.ts.slat_stat[i], &ts->slat_stat[i]);
497 convert_io_stat(&p.ts.lat_stat[i], &ts->lat_stat[i]);
498 convert_io_stat(&p.ts.bw_stat[i], &ts->bw_stat[i]);
499 }
500
501 p.ts.usr_time = cpu_to_le64(ts->usr_time);
502 p.ts.sys_time = cpu_to_le64(ts->sys_time);
503 p.ts.ctx = cpu_to_le64(ts->ctx);
504 p.ts.minf = cpu_to_le64(ts->minf);
505 p.ts.majf = cpu_to_le64(ts->majf);
506 p.ts.clat_percentiles = cpu_to_le64(ts->clat_percentiles);
507 p.ts.percentile_list = NULL;
508
509 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
510 p.ts.io_u_map[i] = cpu_to_le32(ts->io_u_map[i]);
511 p.ts.io_u_submit[i] = cpu_to_le32(ts->io_u_submit[i]);
512 p.ts.io_u_complete[i] = cpu_to_le32(ts->io_u_complete[i]);
513 }
514
515 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
516 p.ts.io_u_lat_u[i] = cpu_to_le32(ts->io_u_lat_u[i]);
517 p.ts.io_u_lat_m[i] = cpu_to_le32(ts->io_u_lat_m[i]);
518 }
519
520 for (i = 0; i < 2; i++)
521 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
522 p.ts.io_u_plat[i][j] = cpu_to_le32(ts->io_u_plat[i][j]);
523
524 for (i = 0; i < 3; i++) {
525 p.ts.total_io_u[i] = cpu_to_le64(ts->total_io_u[i]);
526 p.ts.short_io_u[i] = cpu_to_le64(ts->total_io_u[i]);
527 }
528
529 p.ts.total_submit = cpu_to_le64(ts->total_submit);
530 p.ts.total_complete = cpu_to_le64(ts->total_complete);
531
532 for (i = 0; i < 2; i++) {
533 p.ts.io_bytes[i] = cpu_to_le64(ts->io_bytes[i]);
534 p.ts.runtime[i] = cpu_to_le64(ts->runtime[i]);
535 }
536
537 p.ts.total_run_time = cpu_to_le64(ts->total_run_time);
538 p.ts.continue_on_error = cpu_to_le16(ts->continue_on_error);
539 p.ts.total_err_count = cpu_to_le64(ts->total_err_count);
ddcc0b69
JA
540 p.ts.first_error = cpu_to_le32(ts->first_error);
541 p.ts.kb_base = cpu_to_le32(ts->kb_base);
a64e88da
JA
542
543 convert_gs(&p.rs, rs);
544
545 fio_net_send_cmd(server_fd, FIO_NET_CMD_TS, &p, sizeof(p));
546}
547
548void fio_server_send_gs(struct group_run_stats *rs)
549{
550 struct group_run_stats gs;
551
552 convert_gs(&gs, rs);
553 fio_net_send_cmd(server_fd, FIO_NET_CMD_GS, &gs, sizeof(gs));
554}
555
cf451d1e
JA
556void fio_server_send_status(void)
557{
1d1f45ae
JA
558 struct jobs_eta *je;
559 size_t size;
560 void *buf;
cf451d1e
JA
561 int i;
562
1d1f45ae
JA
563 size = sizeof(*je) + thread_number * sizeof(char);
564 buf = malloc(size);
565 memset(buf, 0, size);
566 je = buf;
567
568 if (!calc_thread_status(je)) {
569 free(je);
cf451d1e 570 return;
1d1f45ae 571 }
cf451d1e 572
1d1f45ae
JA
573 je->nr_running = cpu_to_le32(je->nr_running);
574 je->nr_ramp = cpu_to_le32(je->nr_ramp);
575 je->nr_pending = cpu_to_le32(je->nr_pending);
576 je->files_open = cpu_to_le32(je->files_open);
577 je->m_rate = cpu_to_le32(je->m_rate);
578 je->t_rate = cpu_to_le32(je->t_rate);
579 je->m_iops = cpu_to_le32(je->m_iops);
580 je->t_iops = cpu_to_le32(je->t_iops);
cf451d1e
JA
581
582 for (i = 0; i < 2; i++) {
1d1f45ae
JA
583 je->rate[i] = cpu_to_le32(je->rate[i]);
584 je->iops[i] = cpu_to_le32(je->iops[i]);
cf451d1e
JA
585 }
586
1d1f45ae
JA
587 je->elapsed_sec = cpu_to_le32(je->nr_running);
588 je->eta_sec = cpu_to_le64(je->eta_sec);
cf451d1e 589
1d1f45ae
JA
590 fio_net_send_cmd(server_fd, FIO_NET_CMD_ETA, buf, size);
591 free(je);
cf451d1e
JA
592}
593
142575e6
JA
/*
 * printf-style logging that forwards the formatted text to the
 * connected client through fio_server_text_output().
 *
 * Output longer than the 1024 byte local buffer is truncated.
 *
 * Returns the result of fio_server_text_output(), or 1 if the text
 * could not be formatted.
 */
int fio_server_log(const char *format, ...)
{
	char buffer[1024];
	va_list args;
	int len;

	va_start(args, format);
	len = vsnprintf(buffer, sizeof(buffer), format, args);
	va_end(args);

	if (len < 0)
		return 1;

	/*
	 * vsnprintf() returns the length the full output would have had;
	 * clamp it to what actually landed in the buffer.
	 */
	if ((size_t) len >= sizeof(buffer))
		len = sizeof(buffer) - 1;

	return fio_server_text_output(buffer, len);
}
e46d8091
JA
606
607int fio_start_server(int daemonize)
608{
609 pid_t pid;
610
611 if (!daemonize)
612 return fio_server();
613
614 openlog("fio", LOG_NDELAY|LOG_NOWAIT|LOG_PID, LOG_USER);
615 pid = fork();
616 if (pid < 0) {
617 syslog(LOG_ERR, "failed server fork");
618 return 1;
619 } else if (pid)
620 exit(0);
621
622 setsid();
623 close(STDIN_FILENO);
624 close(STDOUT_FILENO);
625 close(STDERR_FILENO);
626 f_out = NULL;
627 f_err = NULL;
628 log_syslog = 1;
629 return fio_server();
630}