net: fix accidental overwrite of more than just the address
[fio.git] / engines / net.c
... / ...
CommitLineData
1/*
2 * net engine
3 *
4 * IO engine that reads/writes to/from sockets.
5 *
6 */
7#include <stdio.h>
8#include <stdlib.h>
9#include <unistd.h>
10#include <signal.h>
11#include <errno.h>
12#include <assert.h>
13#include <netinet/in.h>
14#include <netinet/tcp.h>
15#include <arpa/inet.h>
16#include <netdb.h>
17#include <sys/poll.h>
18#include <sys/types.h>
19#include <sys/stat.h>
20#include <sys/socket.h>
21#include <sys/un.h>
22
23#include "../fio.h"
24
/*
 * Per-thread engine state. Allocated, zeroed and attached to
 * td->io_ops->data by fio_netio_setup(); released by fio_netio_cleanup().
 */
struct netio_data {
	/* bound/listening socket; fio_netio_setup() initialises it to -1 */
	int listenfd;
	/* set to 1 by fio_netio_setup_splice() */
	int use_splice;
	/* pipe pair used by the splice helpers; both ends start out as -1 */
	int pipes[2];
	/* IPv4 address used for connect/bind/sendto/recvfrom */
	struct sockaddr_in addr;
	/* IPv6 counterpart of 'addr' */
	struct sockaddr_in6 addr6;
	/* UNIX domain socket address */
	struct sockaddr_un addr_un;
};
33
/*
 * Engine-private options. Most fields are referenced from options[] via
 * offsetof(); 'td' is dereferenced by str_hostname_cb().
 */
struct netio_options {
	struct thread_data *td;
	unsigned int port;
	/* one of the FIO_TYPE_* values */
	unsigned int proto;
	/* non-zero: bind/accept instead of connecting */
	unsigned int listen;
	unsigned int pingpong;
	unsigned int nodelay;
	/* handed to IP_MULTICAST_TTL in fio_netio_connect() */
	unsigned int ttl;
	/* interface IP address string used for multicast setup */
	char *intfc;
};
44
/*
 * Control datagram used on UDP links to announce open and close.
 * Senders convert both fields with htonl(); receivers use ntohl().
 */
struct udp_close_msg {
	/* FIO_LINK_OPEN_CLOSE_MAGIC */
	uint32_t magic;
	/* FIO_LINK_OPEN or FIO_LINK_CLOSE */
	uint32_t cmd;
};
49
enum {
	/* udp_close_msg values; the magic spells "link" in ASCII */
	FIO_LINK_CLOSE = 0x89,
	FIO_LINK_OPEN_CLOSE_MAGIC = 0x6c696e6b,
	FIO_LINK_OPEN = 0x98,

	/* values stored in netio_options.proto by the "protocol" option */
	FIO_TYPE_TCP = 1,
	FIO_TYPE_UDP = 2,
	FIO_TYPE_UNIX = 3,
	FIO_TYPE_TCP_V6 = 4,
	FIO_TYPE_UDP_V6 = 5,
};
61
62static int str_hostname_cb(void *data, const char *input);
63static struct fio_option options[] = {
64 {
65 .name = "hostname",
66 .lname = "net engine hostname",
67 .type = FIO_OPT_STR_STORE,
68 .cb = str_hostname_cb,
69 .help = "Hostname for net IO engine",
70 .category = FIO_OPT_C_ENGINE,
71 .group = FIO_OPT_G_NETIO,
72 },
73 {
74 .name = "port",
75 .lname = "net engine port",
76 .type = FIO_OPT_INT,
77 .off1 = offsetof(struct netio_options, port),
78 .minval = 1,
79 .maxval = 65535,
80 .help = "Port to use for TCP or UDP net connections",
81 .category = FIO_OPT_C_ENGINE,
82 .group = FIO_OPT_G_NETIO,
83 },
84 {
85 .name = "protocol",
86 .lname = "net engine protocol",
87 .alias = "proto",
88 .type = FIO_OPT_STR,
89 .off1 = offsetof(struct netio_options, proto),
90 .help = "Network protocol to use",
91 .def = "tcp",
92 .posval = {
93 { .ival = "tcp",
94 .oval = FIO_TYPE_TCP,
95 .help = "Transmission Control Protocol",
96 },
97#ifdef CONFIG_IPV6
98 { .ival = "tcpv6",
99 .oval = FIO_TYPE_TCP_V6,
100 .help = "Transmission Control Protocol V6",
101 },
102#endif
103 { .ival = "udp",
104 .oval = FIO_TYPE_UDP,
105 .help = "User Datagram Protocol",
106 },
107#ifdef CONFIG_IPV6
108 { .ival = "udpv6",
109 .oval = FIO_TYPE_UDP_V6,
110 .help = "User Datagram Protocol V6",
111 },
112#endif
113 { .ival = "unix",
114 .oval = FIO_TYPE_UNIX,
115 .help = "UNIX domain socket",
116 },
117 },
118 .category = FIO_OPT_C_ENGINE,
119 .group = FIO_OPT_G_NETIO,
120 },
121#ifdef CONFIG_TCP_NODELAY
122 {
123 .name = "nodelay",
124 .type = FIO_OPT_BOOL,
125 .off1 = offsetof(struct netio_options, nodelay),
126 .help = "Use TCP_NODELAY on TCP connections",
127 .category = FIO_OPT_C_ENGINE,
128 .group = FIO_OPT_G_NETIO,
129 },
130#endif
131 {
132 .name = "listen",
133 .lname = "net engine listen",
134 .type = FIO_OPT_STR_SET,
135 .off1 = offsetof(struct netio_options, listen),
136 .help = "Listen for incoming TCP connections",
137 .category = FIO_OPT_C_ENGINE,
138 .group = FIO_OPT_G_NETIO,
139 },
140 {
141 .name = "pingpong",
142 .type = FIO_OPT_STR_SET,
143 .off1 = offsetof(struct netio_options, pingpong),
144 .help = "Ping-pong IO requests",
145 .category = FIO_OPT_C_ENGINE,
146 .group = FIO_OPT_G_NETIO,
147 },
148 {
149 .name = "interface",
150 .lname = "net engine interface",
151 .type = FIO_OPT_STR_STORE,
152 .off1 = offsetof(struct netio_options, intfc),
153 .help = "Network interface to use",
154 .category = FIO_OPT_C_ENGINE,
155 .group = FIO_OPT_G_NETIO,
156 },
157 {
158 .name = "ttl",
159 .lname = "net engine multicast ttl",
160 .type = FIO_OPT_INT,
161 .off1 = offsetof(struct netio_options, ttl),
162 .def = "1",
163 .minval = 0,
164 .help = "Time-to-live value for outgoing UDP multicast packets",
165 .category = FIO_OPT_C_ENGINE,
166 .group = FIO_OPT_G_NETIO,
167 },
168 {
169 .name = NULL,
170 },
171};
172
173static inline int is_udp(struct netio_options *o)
174{
175 return o->proto == FIO_TYPE_UDP || o->proto == FIO_TYPE_UDP_V6;
176}
177
178static inline int is_tcp(struct netio_options *o)
179{
180 return o->proto == FIO_TYPE_TCP || o->proto == FIO_TYPE_TCP_V6;
181}
182
183static inline int is_ipv6(struct netio_options *o)
184{
185 return o->proto == FIO_TYPE_UDP_V6 || o->proto == FIO_TYPE_TCP_V6;
186}
187
188/*
189 * Return -1 for error and 'nr events' for a positive number
190 * of events
191 */
192static int poll_wait(struct thread_data *td, int fd, short events)
193{
194 struct pollfd pfd;
195 int ret;
196
197 while (!td->terminate) {
198 pfd.fd = fd;
199 pfd.events = events;
200 ret = poll(&pfd, 1, -1);
201 if (ret < 0) {
202 if (errno == EINTR)
203 break;
204
205 td_verror(td, errno, "poll");
206 return -1;
207 } else if (!ret)
208 continue;
209
210 break;
211 }
212
213 if (pfd.revents & events)
214 return 1;
215
216 return -1;
217}
218
/*
 * Returns 1 if 'mcaddr' is a dotted IPv4 address in the multicast range
 * 224.0.0.0 - 239.255.255.255, otherwise 0. A NULL or unparsable string
 * yields 0.
 */
static int fio_netio_is_multicast(const char *mcaddr)
{
	in_addr_t addr;

	/* inet_network() must not be handed a NULL pointer */
	if (!mcaddr)
		return 0;

	addr = inet_network(mcaddr);
	if (addr == (in_addr_t) -1)
		return 0;

	if (inet_network("224.0.0.0") <= addr &&
	    inet_network("239.255.255.255") >= addr)
		return 1;

	return 0;
}
231
232
233static int fio_netio_prep(struct thread_data *td, struct io_u *io_u)
234{
235 struct netio_options *o = td->eo;
236
237 /*
238 * Make sure we don't see spurious reads to a receiver, and vice versa
239 */
240 if (is_tcp(o))
241 return 0;
242
243 if ((o->listen && io_u->ddir == DDIR_WRITE) ||
244 (!o->listen && io_u->ddir == DDIR_READ)) {
245 td_verror(td, EINVAL, "bad direction");
246 return 1;
247 }
248
249 return 0;
250}
251
252#ifdef CONFIG_LINUX_SPLICE
/*
 * Move up to 'len' bytes from 'fdin' to 'fdout' with splice(), looping
 * over partial transfers. Returns the number of bytes moved; a negative
 * splice() result is returned only if nothing had been moved before it.
 */
static int splice_io_u(int fdin, int fdout, unsigned int len)
{
	int total = 0;

	for (;;) {
		int n;

		if (!len)
			break;

		n = splice(fdin, NULL, fdout, NULL, len, 0);
		if (n < 0) {
			if (!total)
				total = n;
			break;
		}
		if (!n)
			break;

		total += n;
		len -= n;
	}

	return total;
}
274
275/*
276 * Receive bytes from a socket and fill them into the internal pipe
277 */
278static int splice_in(struct thread_data *td, struct io_u *io_u)
279{
280 struct netio_data *nd = td->io_ops->data;
281
282 return splice_io_u(io_u->file->fd, nd->pipes[1], io_u->xfer_buflen);
283}
284
285/*
286 * Transmit 'len' bytes from the internal pipe
287 */
288static int splice_out(struct thread_data *td, struct io_u *io_u,
289 unsigned int len)
290{
291 struct netio_data *nd = td->io_ops->data;
292
293 return splice_io_u(nd->pipes[0], io_u->file->fd, len);
294}
295
296static int vmsplice_io_u(struct io_u *io_u, int fd, unsigned int len)
297{
298 struct iovec iov = {
299 .iov_base = io_u->xfer_buf,
300 .iov_len = len,
301 };
302 int bytes = 0;
303
304 while (iov.iov_len) {
305 int ret = vmsplice(fd, &iov, 1, SPLICE_F_MOVE);
306
307 if (ret < 0) {
308 if (!bytes)
309 bytes = ret;
310 break;
311 } else if (!ret)
312 break;
313
314 iov.iov_len -= ret;
315 iov.iov_base += ret;
316 bytes += ret;
317 }
318
319 return bytes;
320
321}
322
323/*
324 * vmsplice() pipe to io_u buffer
325 */
326static int vmsplice_io_u_out(struct thread_data *td, struct io_u *io_u,
327 unsigned int len)
328{
329 struct netio_data *nd = td->io_ops->data;
330
331 return vmsplice_io_u(io_u, nd->pipes[0], len);
332}
333
334/*
335 * vmsplice() io_u to pipe
336 */
337static int vmsplice_io_u_in(struct thread_data *td, struct io_u *io_u)
338{
339 struct netio_data *nd = td->io_ops->data;
340
341 return vmsplice_io_u(io_u, nd->pipes[1], io_u->xfer_buflen);
342}
343
/*
 * Splice receive: socket -> pipe with splice(), then pipe -> io_u buffer
 * with vmsplice(). A non-positive first step is returned unchanged.
 */
static int fio_netio_splice_in(struct thread_data *td, struct io_u *io_u)
{
	int spliced = splice_in(td, io_u);

	if (spliced <= 0)
		return spliced;

	return vmsplice_io_u_out(td, io_u, spliced);
}
358
/*
 * Splice transmit: io_u buffer -> pipe with vmsplice(), then pipe ->
 * socket with splice(). A non-positive first step is returned unchanged.
 */
static int fio_netio_splice_out(struct thread_data *td, struct io_u *io_u)
{
	int mapped = vmsplice_io_u_in(td, io_u);

	if (mapped <= 0)
		return mapped;

	return splice_out(td, io_u, mapped);
}
373#else
/*
 * Variant compiled when CONFIG_LINUX_SPLICE is not defined: always fails
 * with errno set to EOPNOTSUPP.
 */
static int fio_netio_splice_in(struct thread_data *td, struct io_u *io_u)
{
	errno = EOPNOTSUPP;
	return -1;
}
379
/*
 * Variant compiled when CONFIG_LINUX_SPLICE is not defined: always fails
 * with errno set to EOPNOTSUPP.
 */
static int fio_netio_splice_out(struct thread_data *td, struct io_u *io_u)
{
	errno = EOPNOTSUPP;
	return -1;
}
385#endif
386
387static int fio_netio_send(struct thread_data *td, struct io_u *io_u)
388{
389 struct netio_data *nd = td->io_ops->data;
390 struct netio_options *o = td->eo;
391 int ret, flags = 0;
392
393 do {
394 if (is_udp(o)) {
395 struct sockaddr *to;
396 socklen_t len;
397
398 if (is_ipv6(o)) {
399 to = (struct sockaddr *) &nd->addr6;
400 len = sizeof(nd->addr6);
401 } else {
402 to = (struct sockaddr *) &nd->addr;
403 len = sizeof(nd->addr);
404 }
405
406 ret = sendto(io_u->file->fd, io_u->xfer_buf,
407 io_u->xfer_buflen, flags, to, len);
408 } else {
409 /*
410 * if we are going to write more, set MSG_MORE
411 */
412#ifdef MSG_MORE
413 if ((td->this_io_bytes[DDIR_WRITE] + io_u->xfer_buflen <
414 td->o.size) && !o->pingpong)
415 flags |= MSG_MORE;
416#endif
417 ret = send(io_u->file->fd, io_u->xfer_buf,
418 io_u->xfer_buflen, flags);
419 }
420 if (ret > 0)
421 break;
422
423 ret = poll_wait(td, io_u->file->fd, POLLOUT);
424 if (ret <= 0)
425 break;
426 } while (1);
427
428 return ret;
429}
430
431static int is_udp_close(struct io_u *io_u, int len)
432{
433 struct udp_close_msg *msg;
434
435 if (len != sizeof(struct udp_close_msg))
436 return 0;
437
438 msg = io_u->xfer_buf;
439 if (ntohl(msg->magic) != FIO_LINK_OPEN_CLOSE_MAGIC)
440 return 0;
441 if (ntohl(msg->cmd) != FIO_LINK_CLOSE)
442 return 0;
443
444 return 1;
445}
446
447static int fio_netio_recv(struct thread_data *td, struct io_u *io_u)
448{
449 struct netio_data *nd = td->io_ops->data;
450 struct netio_options *o = td->eo;
451 int ret, flags = 0;
452
453 do {
454 if (is_udp(o)) {
455 struct sockaddr *from;
456 socklen_t l, *len = &l;
457
458 if (o->listen) {
459 if (!is_ipv6(o)) {
460 from = (struct sockaddr *) &nd->addr;
461 *len = sizeof(nd->addr);
462 } else {
463 from = (struct sockaddr *) &nd->addr6;
464 *len = sizeof(nd->addr6);
465 }
466 } else {
467 from = NULL;
468 len = NULL;
469 }
470
471 ret = recvfrom(io_u->file->fd, io_u->xfer_buf,
472 io_u->xfer_buflen, flags, from, len);
473 if (is_udp_close(io_u, ret)) {
474 td->done = 1;
475 return 0;
476 }
477 } else {
478 ret = recv(io_u->file->fd, io_u->xfer_buf,
479 io_u->xfer_buflen, flags);
480 }
481 if (ret > 0)
482 break;
483 else if (!ret && (flags & MSG_WAITALL))
484 break;
485
486 ret = poll_wait(td, io_u->file->fd, POLLIN);
487 if (ret <= 0)
488 break;
489 flags |= MSG_WAITALL;
490 } while (1);
491
492 return ret;
493}
494
495static int __fio_netio_queue(struct thread_data *td, struct io_u *io_u,
496 enum fio_ddir ddir)
497{
498 struct netio_data *nd = td->io_ops->data;
499 struct netio_options *o = td->eo;
500 int ret;
501
502 if (ddir == DDIR_WRITE) {
503 if (!nd->use_splice || is_udp(o) ||
504 o->proto == FIO_TYPE_UNIX)
505 ret = fio_netio_send(td, io_u);
506 else
507 ret = fio_netio_splice_out(td, io_u);
508 } else if (ddir == DDIR_READ) {
509 if (!nd->use_splice || is_udp(o) ||
510 o->proto == FIO_TYPE_UNIX)
511 ret = fio_netio_recv(td, io_u);
512 else
513 ret = fio_netio_splice_in(td, io_u);
514 } else
515 ret = 0; /* must be a SYNC */
516
517 if (ret != (int) io_u->xfer_buflen) {
518 if (ret >= 0) {
519 io_u->resid = io_u->xfer_buflen - ret;
520 io_u->error = 0;
521 return FIO_Q_COMPLETED;
522 } else {
523 int err = errno;
524
525 if (ddir == DDIR_WRITE && err == EMSGSIZE)
526 return FIO_Q_BUSY;
527
528 io_u->error = err;
529 }
530 }
531
532 if (io_u->error)
533 td_verror(td, io_u->error, "xfer");
534
535 return FIO_Q_COMPLETED;
536}
537
538static int fio_netio_queue(struct thread_data *td, struct io_u *io_u)
539{
540 struct netio_options *o = td->eo;
541 int ret;
542
543 fio_ro_check(td, io_u);
544
545 ret = __fio_netio_queue(td, io_u, io_u->ddir);
546 if (!o->pingpong || ret != FIO_Q_COMPLETED)
547 return ret;
548
549 /*
550 * For ping-pong mode, receive or send reply as needed
551 */
552 if (td_read(td) && io_u->ddir == DDIR_READ)
553 ret = __fio_netio_queue(td, io_u, DDIR_WRITE);
554 else if (td_write(td) && io_u->ddir == DDIR_WRITE)
555 ret = __fio_netio_queue(td, io_u, DDIR_READ);
556
557 return ret;
558}
559
560static int fio_netio_connect(struct thread_data *td, struct fio_file *f)
561{
562 struct netio_data *nd = td->io_ops->data;
563 struct netio_options *o = td->eo;
564 int type, domain;
565
566 if (o->proto == FIO_TYPE_TCP) {
567 domain = AF_INET;
568 type = SOCK_STREAM;
569 } else if (o->proto == FIO_TYPE_TCP_V6) {
570 domain = AF_INET6;
571 type = SOCK_STREAM;
572 } else if (o->proto == FIO_TYPE_UDP) {
573 domain = AF_INET;
574 type = SOCK_DGRAM;
575 } else if (o->proto == FIO_TYPE_UDP_V6) {
576 domain = AF_INET6;
577 type = SOCK_DGRAM;
578 } else if (o->proto == FIO_TYPE_UNIX) {
579 domain = AF_UNIX;
580 type = SOCK_STREAM;
581 } else {
582 log_err("fio: bad network type %d\n", o->proto);
583 f->fd = -1;
584 return 1;
585 }
586
587 f->fd = socket(domain, type, 0);
588 if (f->fd < 0) {
589 td_verror(td, errno, "socket");
590 return 1;
591 }
592
593#ifdef CONFIG_TCP_NODELAY
594 if (o->nodelay && is_tcp(o)) {
595 int optval = 1;
596
597 if (setsockopt(f->fd, IPPROTO_TCP, TCP_NODELAY, (void *) &optval, sizeof(int)) < 0) {
598 log_err("fio: cannot set TCP_NODELAY option on socket (%s), disable with 'nodelay=0'\n", strerror(errno));
599 return 1;
600 }
601 }
602#endif
603
604 if (is_udp(o)) {
605 if (!fio_netio_is_multicast(td->o.filename))
606 return 0;
607 if (is_ipv6(o)) {
608 log_err("fio: multicast not supported on IPv6\n");
609 close(f->fd);
610 return 1;
611 }
612
613 if (o->intfc) {
614 struct in_addr interface_addr;
615
616 if (inet_aton(o->intfc, &interface_addr) == 0) {
617 log_err("fio: interface not valid interface IP\n");
618 close(f->fd);
619 return 1;
620 }
621 if (setsockopt(f->fd, IPPROTO_IP, IP_MULTICAST_IF, (const char*)&interface_addr, sizeof(interface_addr)) < 0) {
622 td_verror(td, errno, "setsockopt IP_MULTICAST_IF");
623 close(f->fd);
624 return 1;
625 }
626 }
627 if (setsockopt(f->fd, IPPROTO_IP, IP_MULTICAST_TTL, (const char*)&o->ttl, sizeof(o->ttl)) < 0) {
628 td_verror(td, errno, "setsockopt IP_MULTICAST_TTL");
629 close(f->fd);
630 return 1;
631 }
632 return 0;
633 } else if (o->proto == FIO_TYPE_TCP) {
634 socklen_t len = sizeof(nd->addr);
635
636 if (connect(f->fd, (struct sockaddr *) &nd->addr, len) < 0) {
637 td_verror(td, errno, "connect");
638 close(f->fd);
639 return 1;
640 }
641 } else if (o->proto == FIO_TYPE_TCP_V6) {
642 socklen_t len = sizeof(nd->addr6);
643
644 if (connect(f->fd, (struct sockaddr *) &nd->addr6, len) < 0) {
645 td_verror(td, errno, "connect");
646 close(f->fd);
647 return 1;
648 }
649
650 } else {
651 struct sockaddr_un *addr = &nd->addr_un;
652 socklen_t len;
653
654 len = sizeof(addr->sun_family) + strlen(addr->sun_path) + 1;
655
656 if (connect(f->fd, (struct sockaddr *) addr, len) < 0) {
657 td_verror(td, errno, "connect");
658 close(f->fd);
659 return 1;
660 }
661 }
662
663 return 0;
664}
665
666static int fio_netio_accept(struct thread_data *td, struct fio_file *f)
667{
668 struct netio_data *nd = td->io_ops->data;
669 struct netio_options *o = td->eo;
670 socklen_t socklen;
671 int state;
672
673 if (is_udp(o)) {
674 f->fd = nd->listenfd;
675 return 0;
676 }
677
678 state = td->runstate;
679 td_set_runstate(td, TD_SETTING_UP);
680
681 log_info("fio: waiting for connection\n");
682
683 if (poll_wait(td, nd->listenfd, POLLIN) < 0)
684 goto err;
685
686 if (o->proto == FIO_TYPE_TCP) {
687 socklen = sizeof(nd->addr);
688 f->fd = accept(nd->listenfd, (struct sockaddr *) &nd->addr, &socklen);
689 } else {
690 socklen = sizeof(nd->addr6);
691 f->fd = accept(nd->listenfd, (struct sockaddr *) &nd->addr6, &socklen);
692 }
693
694 if (f->fd < 0) {
695 td_verror(td, errno, "accept");
696 goto err;
697 }
698
699#ifdef CONFIG_TCP_NODELAY
700 if (o->nodelay && is_tcp(o)) {
701 int optval = 1;
702
703 if (setsockopt(f->fd, IPPROTO_TCP, TCP_NODELAY, (void *) &optval, sizeof(int)) < 0) {
704 log_err("fio: cannot set TCP_NODELAY option on socket (%s), disable with 'nodelay=0'\n", strerror(errno));
705 return 1;
706 }
707 }
708#endif
709
710 reset_all_stats(td);
711 td_set_runstate(td, state);
712 return 0;
713err:
714 td_set_runstate(td, state);
715 return 1;
716}
717
718static void fio_netio_udp_close(struct thread_data *td, struct fio_file *f)
719{
720 struct netio_data *nd = td->io_ops->data;
721 struct netio_options *o = td->eo;
722 struct udp_close_msg msg;
723 struct sockaddr *to;
724 socklen_t len;
725 int ret;
726
727 if (is_ipv6(o)) {
728 to = (struct sockaddr *) &nd->addr6;
729 len = sizeof(nd->addr6);
730 } else {
731 to = (struct sockaddr *) &nd->addr;
732 len = sizeof(nd->addr);
733 }
734
735 msg.magic = htonl(FIO_LINK_OPEN_CLOSE_MAGIC);
736 msg.cmd = htonl(FIO_LINK_CLOSE);
737
738 ret = sendto(f->fd, (void *) &msg, sizeof(msg), MSG_WAITALL, to, len);
739 if (ret < 0)
740 td_verror(td, errno, "sendto udp link close");
741}
742
743static int fio_netio_close_file(struct thread_data *td, struct fio_file *f)
744{
745 struct netio_options *o = td->eo;
746
747 /*
748 * If this is an UDP connection, notify the receiver that we are
749 * closing down the link
750 */
751 if (is_udp(o))
752 fio_netio_udp_close(td, f);
753
754 return generic_close_file(td, f);
755}
756
757static int fio_netio_udp_recv_open(struct thread_data *td, struct fio_file *f)
758{
759 struct netio_data *nd = td->io_ops->data;
760 struct netio_options *o = td->eo;
761 struct udp_close_msg msg;
762 struct sockaddr *to;
763 socklen_t len;
764 int ret;
765
766 if (is_ipv6(o)) {
767 len = sizeof(nd->addr6);
768 to = (struct sockaddr *) &nd->addr6;
769 } else {
770 len = sizeof(nd->addr);
771 to = (struct sockaddr *) &nd->addr;
772 }
773
774 ret = recvfrom(f->fd, (void *) &msg, sizeof(msg), MSG_WAITALL, to, &len);
775 if (ret < 0) {
776 td_verror(td, errno, "recvfrom udp link open");
777 return ret;
778 }
779
780 if (ntohl(msg.magic) != FIO_LINK_OPEN_CLOSE_MAGIC ||
781 ntohl(msg.cmd) != FIO_LINK_OPEN) {
782 log_err("fio: bad udp open magic %x/%x\n", ntohl(msg.magic),
783 ntohl(msg.cmd));
784 return -1;
785 }
786
787 return 0;
788}
789
790static int fio_netio_udp_send_open(struct thread_data *td, struct fio_file *f)
791{
792 struct netio_data *nd = td->io_ops->data;
793 struct netio_options *o = td->eo;
794 struct udp_close_msg msg;
795 struct sockaddr *to;
796 socklen_t len;
797 int ret;
798
799 if (is_ipv6(o)) {
800 len = sizeof(nd->addr6);
801 to = (struct sockaddr *) &nd->addr6;
802 } else {
803 len = sizeof(nd->addr);
804 to = (struct sockaddr *) &nd->addr;
805 }
806
807 msg.magic = htonl(FIO_LINK_OPEN_CLOSE_MAGIC);
808 msg.cmd = htonl(FIO_LINK_OPEN);
809
810 ret = sendto(f->fd, (void *) &msg, sizeof(msg), MSG_WAITALL, to, len);
811 if (ret < 0) {
812 td_verror(td, errno, "sendto udp link open");
813 return ret;
814 }
815
816 return 0;
817}
818
819static int fio_netio_open_file(struct thread_data *td, struct fio_file *f)
820{
821 int ret;
822 struct netio_options *o = td->eo;
823
824 if (o->listen)
825 ret = fio_netio_accept(td, f);
826 else
827 ret = fio_netio_connect(td, f);
828
829 if (ret) {
830 f->fd = -1;
831 return ret;
832 }
833
834 if (is_udp(o)) {
835 if (td_write(td))
836 ret = fio_netio_udp_send_open(td, f);
837 else {
838 int state;
839
840 state = td->runstate;
841 td_set_runstate(td, TD_SETTING_UP);
842 ret = fio_netio_udp_recv_open(td, f);
843 td_set_runstate(td, state);
844 }
845 }
846
847 if (ret)
848 fio_netio_close_file(td, f);
849
850 return ret;
851}
852
/*
 * Resolve 'host' for address family 'af'.
 *
 * If 'host' is a numeric address, it is written straight into 'dst' and
 * '*res' is left untouched. Otherwise getaddrinfo() is used and the
 * result list is returned through 'res'; the caller copies the address
 * out of it and releases it.
 *
 * Returns 0 on success, 1 if name resolution fails (reported through
 * td_verror()).
 */
static int fio_fill_addr(struct thread_data *td, const char *host, int af,
			 void *dst, struct addrinfo **res)
{
	struct netio_options *o = td->eo;
	struct addrinfo hints;
	int ret;

	/*
	 * inet_pton() returns 1 only on a successful conversion; 0 means
	 * "not a numeric address" and -1 means an unsupported family, so
	 * neither of those may be taken as success.
	 */
	if (inet_pton(af, host, dst) == 1)
		return 0;

	memset(&hints, 0, sizeof(hints));

	if (is_tcp(o))
		hints.ai_socktype = SOCK_STREAM;
	else
		hints.ai_socktype = SOCK_DGRAM;

	if (is_ipv6(o))
		hints.ai_family = AF_INET6;
	else
		hints.ai_family = AF_INET;

	ret = getaddrinfo(host, NULL, &hints, res);
	if (ret) {
		int e = EINVAL;
		char str[128];

		/* only EAI_SYSTEM carries a meaningful errno */
		if (ret == EAI_SYSTEM)
			e = errno;

		snprintf(str, sizeof(str), "getaddrinfo: %s", gai_strerror(ret));
		td_verror(td, e, str);
		return 1;
	}

	return 0;
}
890
891static int fio_netio_setup_connect_inet(struct thread_data *td,
892 const char *host, unsigned short port)
893{
894 struct netio_data *nd = td->io_ops->data;
895 struct netio_options *o = td->eo;
896 struct addrinfo *res = NULL;
897 void *dst, *src;
898 int af, len;
899
900 if (!host) {
901 log_err("fio: connect with no host to connect to.\n");
902 if (td_read(td))
903 log_err("fio: did you forget to set 'listen'?\n");
904
905 td_verror(td, EINVAL, "no hostname= set");
906 return 1;
907 }
908
909 nd->addr.sin_family = AF_INET;
910 nd->addr.sin_port = htons(port);
911 nd->addr6.sin6_family = AF_INET6;
912 nd->addr6.sin6_port = htons(port);
913
914 if (is_ipv6(o)) {
915 af = AF_INET6;
916 dst = &nd->addr6.sin6_addr;
917 } else {
918 af = AF_INET;
919 dst = &nd->addr.sin_addr;
920 }
921
922 if (fio_fill_addr(td, host, af, dst, &res))
923 return 1;
924
925 if (!res)
926 return 0;
927
928 if (is_ipv6(o)) {
929 len = sizeof(nd->addr6.sin6_addr);
930 src = &((struct sockaddr_in6 *) res->ai_addr)->sin6_addr;
931 } else {
932 len = sizeof(nd->addr.sin_addr);
933 src = &((struct sockaddr_in *) res->ai_addr)->sin_addr;
934 }
935
936 memcpy(dst, src, len);
937 freeaddrinfo(res);
938 return 0;
939}
940
941static int fio_netio_setup_connect_unix(struct thread_data *td,
942 const char *path)
943{
944 struct netio_data *nd = td->io_ops->data;
945 struct sockaddr_un *soun = &nd->addr_un;
946
947 soun->sun_family = AF_UNIX;
948 strcpy(soun->sun_path, path);
949 return 0;
950}
951
952static int fio_netio_setup_connect(struct thread_data *td)
953{
954 struct netio_options *o = td->eo;
955
956 if (is_udp(o) || is_tcp(o))
957 return fio_netio_setup_connect_inet(td, td->o.filename,o->port);
958 else
959 return fio_netio_setup_connect_unix(td, td->o.filename);
960}
961
962static int fio_netio_setup_listen_unix(struct thread_data *td, const char *path)
963{
964 struct netio_data *nd = td->io_ops->data;
965 struct sockaddr_un *addr = &nd->addr_un;
966 mode_t mode;
967 int len, fd;
968
969 fd = socket(AF_UNIX, SOCK_STREAM, 0);
970 if (fd < 0) {
971 log_err("fio: socket: %s\n", strerror(errno));
972 return -1;
973 }
974
975 mode = umask(000);
976
977 memset(addr, 0, sizeof(*addr));
978 addr->sun_family = AF_UNIX;
979 strcpy(addr->sun_path, path);
980 unlink(path);
981
982 len = sizeof(addr->sun_family) + strlen(path) + 1;
983
984 if (bind(fd, (struct sockaddr *) addr, len) < 0) {
985 log_err("fio: bind: %s\n", strerror(errno));
986 close(fd);
987 return -1;
988 }
989
990 umask(mode);
991 nd->listenfd = fd;
992 return 0;
993}
994
995static int fio_netio_setup_listen_inet(struct thread_data *td, short port)
996{
997 struct netio_data *nd = td->io_ops->data;
998 struct netio_options *o = td->eo;
999 struct ip_mreq mr;
1000 struct sockaddr_in sin;
1001 struct sockaddr_in6 sin6;
1002 struct sockaddr *saddr;
1003 int fd, opt, type, domain;
1004 socklen_t len;
1005
1006 memset(&sin, 0, sizeof(sin));
1007 memset(&sin6, 0, sizeof(sin6));
1008
1009 if (o->proto == FIO_TYPE_TCP) {
1010 type = SOCK_STREAM;
1011 domain = AF_INET;
1012 } else if (o->proto == FIO_TYPE_TCP_V6) {
1013 type = SOCK_STREAM;
1014 domain = AF_INET6;
1015 } else if (o->proto == FIO_TYPE_UDP) {
1016 type = SOCK_DGRAM;
1017 domain = AF_INET;
1018 } else if (o->proto == FIO_TYPE_UDP_V6) {
1019 type = SOCK_DGRAM;
1020 domain = AF_INET6;
1021 } else {
1022 log_err("fio: unknown proto %d\n", o->proto);
1023 return 1;
1024 }
1025
1026 fd = socket(domain, type, 0);
1027 if (fd < 0) {
1028 td_verror(td, errno, "socket");
1029 return 1;
1030 }
1031
1032 opt = 1;
1033 if (setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, (void *) &opt, sizeof(opt)) < 0) {
1034 td_verror(td, errno, "setsockopt");
1035 close(fd);
1036 return 1;
1037 }
1038#ifdef SO_REUSEPORT
1039 if (setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, (void *) &opt, sizeof(opt)) < 0) {
1040 td_verror(td, errno, "setsockopt");
1041 close(fd);
1042 return 1;
1043 }
1044#endif
1045
1046 if (td->o.filename) {
1047 if (!is_udp(o) || !fio_netio_is_multicast(td->o.filename)) {
1048 log_err("fio: hostname not valid for non-multicast inbound network IO\n");
1049 close(fd);
1050 return 1;
1051 }
1052 if (is_ipv6(o)) {
1053 log_err("fio: IPv6 not supported for multicast network IO");
1054 close(fd);
1055 return 1;
1056 }
1057
1058 inet_aton(td->o.filename, &sin.sin_addr);
1059
1060 mr.imr_multiaddr = sin.sin_addr;
1061 if (o->intfc) {
1062 if (inet_aton(o->intfc, &mr.imr_interface) == 0) {
1063 log_err("fio: interface not valid interface IP\n");
1064 close(fd);
1065 return 1;
1066 }
1067 } else {
1068 mr.imr_interface.s_addr = htonl(INADDR_ANY);
1069 }
1070
1071 if (setsockopt(fd, IPPROTO_IP, IP_ADD_MEMBERSHIP, (const char*)&mr, sizeof(mr)) < 0) {
1072 td_verror(td, errno, "setsockopt IP_ADD_MEMBERSHIP");
1073 close(fd);
1074 return 1;
1075 }
1076 }
1077
1078 if (!is_ipv6(o)) {
1079 saddr = (struct sockaddr *) &nd->addr;
1080 len = sizeof(nd->addr);
1081
1082 nd->addr.sin_family = AF_INET;
1083 nd->addr.sin_addr.s_addr = sin.sin_addr.s_addr ? sin.sin_addr.s_addr : htonl(INADDR_ANY);
1084 nd->addr.sin_port = htons(port);
1085 } else {
1086 saddr = (struct sockaddr *) &nd->addr6;
1087 len = sizeof(nd->addr6);
1088
1089 nd->addr6.sin6_family = AF_INET6;
1090 nd->addr6.sin6_addr = sin6.sin6_addr.s6_addr ? sin6.sin6_addr : in6addr_any;
1091 nd->addr6.sin6_port = htons(port);
1092 }
1093
1094 if (bind(fd, saddr, len) < 0) {
1095 td_verror(td, errno, "bind");
1096 return 1;
1097 }
1098
1099 nd->listenfd = fd;
1100 return 0;
1101}
1102
1103static int fio_netio_setup_listen(struct thread_data *td)
1104{
1105 struct netio_data *nd = td->io_ops->data;
1106 struct netio_options *o = td->eo;
1107 int ret;
1108
1109 if (is_udp(o) || is_tcp(o))
1110 ret = fio_netio_setup_listen_inet(td, o->port);
1111 else
1112 ret = fio_netio_setup_listen_unix(td, td->o.filename);
1113
1114 if (ret)
1115 return ret;
1116 if (is_udp(o))
1117 return 0;
1118
1119 if (listen(nd->listenfd, 10) < 0) {
1120 td_verror(td, errno, "listen");
1121 nd->listenfd = -1;
1122 return 1;
1123 }
1124
1125 return 0;
1126}
1127
1128static int fio_netio_init(struct thread_data *td)
1129{
1130 struct netio_options *o = td->eo;
1131 int ret;
1132
1133#ifdef WIN32
1134 WSADATA wsd;
1135 WSAStartup(MAKEWORD(2,2), &wsd);
1136#endif
1137
1138 if (td_random(td)) {
1139 log_err("fio: network IO can't be random\n");
1140 return 1;
1141 }
1142
1143 if (o->proto == FIO_TYPE_UNIX && o->port) {
1144 log_err("fio: network IO port not valid with unix socket\n");
1145 return 1;
1146 } else if (o->proto != FIO_TYPE_UNIX && !o->port) {
1147 log_err("fio: network IO requires port for tcp or udp\n");
1148 return 1;
1149 }
1150
1151 if (!is_tcp(o)) {
1152 if (o->listen) {
1153 log_err("fio: listen only valid for TCP proto IO\n");
1154 return 1;
1155 }
1156 if (td_rw(td)) {
1157 log_err("fio: datagram network connections must be"
1158 " read OR write\n");
1159 return 1;
1160 }
1161 if (o->proto == FIO_TYPE_UNIX && !td->o.filename) {
1162 log_err("fio: UNIX sockets need host/filename\n");
1163 return 1;
1164 }
1165 o->listen = td_read(td);
1166 }
1167
1168 if (o->listen)
1169 ret = fio_netio_setup_listen(td);
1170 else
1171 ret = fio_netio_setup_connect(td);
1172
1173 return ret;
1174}
1175
1176static void fio_netio_cleanup(struct thread_data *td)
1177{
1178 struct netio_data *nd = td->io_ops->data;
1179
1180 if (nd) {
1181 if (nd->listenfd != -1)
1182 close(nd->listenfd);
1183 if (nd->pipes[0] != -1)
1184 close(nd->pipes[0]);
1185 if (nd->pipes[1] != -1)
1186 close(nd->pipes[1]);
1187
1188 free(nd);
1189 }
1190}
1191
1192static int fio_netio_setup(struct thread_data *td)
1193{
1194 struct netio_data *nd;
1195
1196 if (!td->files_index) {
1197 add_file(td, td->o.filename ?: "net", 0);
1198 td->o.nr_files = td->o.nr_files ?: 1;
1199 }
1200
1201 if (!td->io_ops->data) {
1202 nd = malloc(sizeof(*nd));;
1203
1204 memset(nd, 0, sizeof(*nd));
1205 nd->listenfd = -1;
1206 nd->pipes[0] = nd->pipes[1] = -1;
1207 td->io_ops->data = nd;
1208 }
1209
1210 return 0;
1211}
1212
1213static void fio_netio_terminate(struct thread_data *td)
1214{
1215 kill(td->pid, SIGUSR2);
1216}
1217
1218#ifdef CONFIG_LINUX_SPLICE
1219static int fio_netio_setup_splice(struct thread_data *td)
1220{
1221 struct netio_data *nd;
1222
1223 fio_netio_setup(td);
1224
1225 nd = td->io_ops->data;
1226 if (nd) {
1227 if (pipe(nd->pipes) < 0)
1228 return 1;
1229
1230 nd->use_splice = 1;
1231 return 0;
1232 }
1233
1234 return 1;
1235}
1236
/*
 * Engine table registered under the name "netsplice". It shares every
 * hook with the "net" engine except .setup, which additionally creates
 * the pipe and enables the splice transfer paths.
 */
static struct ioengine_ops ioengine_splice = {
	.name			= "netsplice",
	.version		= FIO_IOOPS_VERSION,
	.prep			= fio_netio_prep,
	.queue			= fio_netio_queue,
	.setup			= fio_netio_setup_splice,
	.init			= fio_netio_init,
	.cleanup		= fio_netio_cleanup,
	.open_file		= fio_netio_open_file,
	.close_file		= fio_netio_close_file,
	.terminate		= fio_netio_terminate,
	.options		= options,
	.option_struct_size	= sizeof(struct netio_options),
	.flags			= FIO_SYNCIO | FIO_DISKLESSIO | FIO_UNIDIR |
				  FIO_PIPEIO,
};
1253#endif
1254
/*
 * Engine table registered under the name "net": socket I/O through
 * send()/recv() and their datagram counterparts.
 */
static struct ioengine_ops ioengine_rw = {
	.name			= "net",
	.version		= FIO_IOOPS_VERSION,
	.prep			= fio_netio_prep,
	.queue			= fio_netio_queue,
	.setup			= fio_netio_setup,
	.init			= fio_netio_init,
	.cleanup		= fio_netio_cleanup,
	.open_file		= fio_netio_open_file,
	.close_file		= fio_netio_close_file,
	.terminate		= fio_netio_terminate,
	.options		= options,
	.option_struct_size	= sizeof(struct netio_options),
	.flags			= FIO_SYNCIO | FIO_DISKLESSIO | FIO_UNIDIR |
				  FIO_PIPEIO | FIO_BIT_BASED,
};
1271
1272static int str_hostname_cb(void *data, const char *input)
1273{
1274 struct netio_options *o = data;
1275
1276 if (o->td->o.filename)
1277 free(o->td->o.filename);
1278 o->td->o.filename = strdup(input);
1279 return 0;
1280}
1281
/*
 * Register the "net" engine and, when built with CONFIG_LINUX_SPLICE,
 * the "netsplice" engine.
 */
static void fio_init fio_netio_register(void)
{
	register_ioengine(&ioengine_rw);
#ifdef CONFIG_LINUX_SPLICE
	register_ioengine(&ioengine_splice);
#endif
}
1289
/*
 * Unregister the engines that fio_netio_register() registered.
 */
static void fio_exit fio_netio_unregister(void)
{
	unregister_ioengine(&ioengine_rw);
#ifdef CONFIG_LINUX_SPLICE
	unregister_ioengine(&ioengine_splice);
#endif
}