[PATCH] blktrace: net server stat fixes
[blktrace.git] / blktrace.c
CommitLineData
d0ca268b
JA
1/*
2 * block queue tracing application
3 *
d956a2cd
JA
4 * Copyright (C) 2005 Jens Axboe <axboe@suse.de>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 *
d0ca268b
JA
20 */
21#include <pthread.h>
22#include <sys/types.h>
23#include <sys/stat.h>
24#include <unistd.h>
25#include <locale.h>
26#include <signal.h>
27#include <fcntl.h>
28#include <string.h>
29#include <sys/ioctl.h>
b9d4294e 30#include <sys/param.h>
e3e74029 31#include <sys/statfs.h>
eb3c8108 32#include <sys/poll.h>
b7106311 33#include <sys/mman.h>
8e86c98a 34#include <sys/socket.h>
d0ca268b
JA
35#include <stdio.h>
36#include <stdlib.h>
37#include <sched.h>
d39c04ca
AB
38#include <ctype.h>
39#include <getopt.h>
da39451f 40#include <errno.h>
8e86c98a
JA
41#include <netinet/in.h>
42#include <arpa/inet.h>
43#include <netdb.h>
32f18c48 44#include <sys/sendfile.h>
d0ca268b
JA
45
46#include "blktrace.h"
21f55651 47#include "barrier.h"
d0ca268b 48
static char blktrace_version[] = "0.99";

/*
 * Defaults for the sub-buffer size and count passed to BLKTRACESETUP.
 * You may want to increase these even more, if you are logging at a high
 * rate and see skipped/missed events.
 */
#define BUF_SIZE	(512 * 1024)
#define BUF_NR		(4)

/* size of the stdio buffer attached to each regular output file */
#define OFILE_BUF	(128 * 1024)

/* NOTE(review): presumably the statfs magic of relayfs; not used in this part of the file */
#define RELAYFS_TYPE	0xF0B4A981
61
/* short option string; each letter matches the .val of a long option below */
#define S_OPTS	"d:a:A:r:o:kw:Vb:n:D:lh:p:s"

/*
 * Long options, in struct option member order: name, has_arg, flag, val.
 * The all-zero entry terminates the table.
 */
static struct option l_opts[] = {
	{ "dev",		required_argument,	NULL,	'd' },
	{ "act-mask",		required_argument,	NULL,	'a' },
	{ "set-mask",		required_argument,	NULL,	'A' },
	{ "relay",		required_argument,	NULL,	'r' },
	{ "output",		required_argument,	NULL,	'o' },
	{ "kill",		no_argument,		NULL,	'k' },
	{ "stopwatch",		required_argument,	NULL,	'w' },
	{ "version",		no_argument,		NULL,	'V' },
	{ "buffer-size",	required_argument,	NULL,	'b' },
	{ "num-sub-buffers",	required_argument,	NULL,	'n' },
	{ "output-dir",		required_argument,	NULL,	'D' },
	{ "listen",		no_argument,		NULL,	'l' },
	{ "host",		required_argument,	NULL,	'h' },
	{ "port",		required_argument,	NULL,	'p' },
	{ "sendfile",		no_argument,		NULL,	's' },
	{ NULL,			0,			NULL,	0 }
};
158
/*
 * One chunk of trace data travelling from a reader thread to the writer.
 */
struct tip_subbuf {
	void *buf;		/* copied data; NULL for sendfile chunks */
	unsigned int len;	/* bytes of data in this chunk */
	unsigned int max_len;	/* capacity recorded for buf */
	off_t offset;		/* relay file offset, set for sendfile chunks */
};
165
21f55651
JA
#define FIFO_SIZE	(1024)	/* should be plenty big! */
#define CL_SIZE		(128)	/* cache line, any bigger? */

/*
 * Ring of subbuffer pointers. Entries are added at 'tail' and removed at
 * 'head'; both indices are aligned to CL_SIZE bytes. The index arithmetic
 * masks with FIFO_SIZE - 1, so FIFO_SIZE must stay a power of two.
 */
struct tip_subbuf_fifo {
	int tail __attribute__((aligned(CL_SIZE)));
	int head __attribute__((aligned(CL_SIZE)));
	struct tip_subbuf *q[FIFO_SIZE];
};
174
d0ca268b
JA
175struct thread_information {
176 int cpu;
177 pthread_t thread;
b9d4294e
JA
178
179 int fd;
a3e4d330 180 void *fd_buf;
b9d4294e
JA
181 char fn[MAXPATHLEN + 64];
182
11eedd9b
JA
183 int pfd;
184 size_t *pfd_buf;
185
007c233c
JA
186 FILE *ofile;
187 char *ofile_buffer;
32f18c48 188 off_t ofile_offset;
9db17354 189 int ofile_stdout;
8e86c98a 190 int ofile_mmap;
007c233c 191
0cc7d25e
JA
192 int (*get_subbuf)(struct thread_information *, unsigned int);
193 int (*flush_subbuf)(struct thread_information *, struct tip_subbuf *);
194 int (*read_data)(struct thread_information *, void *, unsigned int);
195
d0ca268b 196 unsigned long events_processed;
b7106311 197 unsigned long long data_read;
e7c9f3ff 198 struct device_information *device;
9db17354
JA
199
200 int exited;
201
b7106311
JA
202 /*
203 * piped fifo buffers
204 */
21f55651 205 struct tip_subbuf_fifo fifo;
7de86b12 206 struct tip_subbuf *leftover_ts;
b7106311
JA
207
208 /*
209 * mmap controlled output files
210 */
211 unsigned long long fs_size;
212 unsigned long long fs_max_size;
213 unsigned long fs_off;
214 void *fs_buf;
215 unsigned long fs_buf_len;
d0ca268b
JA
216};
217
e7c9f3ff
NS
/*
 * State of one traced block device.
 */
struct device_information {
	int fd;					/* descriptor the trace ioctls are issued on */
	char *path;				/* device path */
	char buts_name[32];			/* trace name copied from the setup ioctl */
	volatile int trace_started;		/* see dip_tracing()/dip_set_tracing() */
	unsigned long drop_count;		/* dropped events, read when the trace stops */
	struct thread_information *threads;	/* ncpus entries */
};
d0ca268b 226
e7c9f3ff 227static int ncpus;
d0ca268b 228static struct thread_information *thread_information;
e7c9f3ff
NS
229static int ndevs;
230static struct device_information *device_information;
231
232/* command line option globals */
233static char *relay_path;
d5396421 234static char *output_name;
d1d7f15f 235static char *output_dir;
5c86134e 236static int act_mask = ~0U;
bc39777c 237static int kill_running_trace;
eb3c8108
JA
238static unsigned long buf_size = BUF_SIZE;
239static unsigned long buf_nr = BUF_NR;
b7106311 240static unsigned int page_size;
d39c04ca 241
e7c9f3ff
NS
242#define is_done() (*(volatile int *)(&done))
243static volatile int done;
244
eb3c8108
JA
245#define is_trace_stopped() (*(volatile int *)(&trace_stopped))
246static volatile int trace_stopped;
247
248#define is_stat_shown() (*(volatile int *)(&stat_shown))
249static volatile int stat_shown;
a3e4d330 250
8e86c98a
JA
251int data_is_native = -1;
252
72ca8801
NS
253static void exit_trace(int status);
254
99c1f5ab
JA
255#define dip_tracing(dip) (*(volatile int *)(&(dip)->trace_started))
256#define dip_set_tracing(dip, v) ((dip)->trace_started = (v))
257
258#define __for_each_dip(__d, __i, __e) \
259 for (__i = 0, __d = device_information; __i < __e; __i++, __d++)
260
261#define for_each_dip(__d, __i) __for_each_dip(__d, __i, ndevs)
9db17354
JA
262#define for_each_tip(__d, __t, __j) \
263 for (__j = 0, __t = (__d)->threads; __j < ncpus; __j++, __t++)
99c1f5ab 264
8e86c98a
JA
265/*
266 * networking stuff follows. we include a magic number so we know whether
267 * to endianness convert or not
268 */
269struct blktrace_net_hdr {
270 u32 magic; /* same as trace magic */
22cd0c02 271 char buts_name[32]; /* trace name */
8e86c98a 272 u32 cpu; /* for which cpu */
22cd0c02 273 u32 max_cpus;
8e86c98a
JA
274 u32 len; /* length of following trace data */
275};
276
/* default value of net_port */
#define TRACE_NET_PORT	(8462)

/* values of net_mode */
enum {
	Net_none = 0,
	Net_server,
	Net_client,
};

/*
 * network cmd line params
 */
static char hostname[MAXHOSTNAMELEN];
static int net_port = TRACE_NET_PORT;
static int net_mode = 0;
static int net_sendfile;

/* sockets: read_data_net() reads net_in_fd, the client sends on net_out_fd */
static int net_in_fd = -1;
static int net_out_fd = -1;
295
296static void handle_sigint(__attribute__((__unused__)) int sig)
297{
298 done = 1;
299}
300
eb3c8108
JA
301static int get_dropped_count(const char *buts_name)
302{
303 int fd;
304 char tmp[MAXPATHLEN + 64];
305
306 snprintf(tmp, sizeof(tmp), "%s/block/%s/dropped",
307 relay_path, buts_name);
308
309 fd = open(tmp, O_RDONLY);
310 if (fd < 0) {
311 /*
312 * this may be ok, if the kernel doesn't support dropped counts
313 */
314 if (errno == ENOENT)
315 return 0;
316
317 fprintf(stderr, "Couldn't open dropped file %s\n", tmp);
318 return -1;
319 }
320
321 if (read(fd, tmp, sizeof(tmp)) < 0) {
322 perror(tmp);
323 close(fd);
324 return -1;
325 }
326
327 close(fd);
328
329 return atoi(tmp);
330}
331
11eedd9b
JA
332static size_t get_subbuf_padding(struct thread_information *tip,
333 unsigned subbuf)
334{
335 size_t padding_size = buf_nr * sizeof(size_t);
336 size_t ret;
337
338 if (read(tip->pfd, tip->pfd_buf, padding_size) < 0) {
339 perror("tip pad read");
340 ret = -1;
341 } else
342 ret = tip->pfd_buf[subbuf];
343
344 return ret;
345}
346
e7c9f3ff 347static int start_trace(struct device_information *dip)
d0ca268b
JA
348{
349 struct blk_user_trace_setup buts;
350
1f79c4a0 351 memset(&buts, 0, sizeof(buts));
129aa440
JA
352 buts.buf_size = buf_size;
353 buts.buf_nr = buf_nr;
d39c04ca 354 buts.act_mask = act_mask;
d0ca268b 355
ed71a31e
JA
356 if (ioctl(dip->fd, BLKTRACESETUP, &buts) < 0) {
357 perror("BLKTRACESETUP");
358 return 1;
359 }
360
361 if (ioctl(dip->fd, BLKTRACESTART) < 0) {
362 perror("BLKTRACESTART");
d0ca268b
JA
363 return 1;
364 }
365
e7c9f3ff 366 memcpy(dip->buts_name, buts.name, sizeof(dip->buts_name));
99c1f5ab 367 dip_set_tracing(dip, 1);
d0ca268b
JA
368 return 0;
369}
370
e7c9f3ff 371static void stop_trace(struct device_information *dip)
d0ca268b 372{
99c1f5ab
JA
373 if (dip_tracing(dip) || kill_running_trace) {
374 dip_set_tracing(dip, 0);
cf9208ea 375
ed71a31e
JA
376 if (ioctl(dip->fd, BLKTRACESTOP) < 0)
377 perror("BLKTRACESTOP");
378 if (ioctl(dip->fd, BLKTRACETEARDOWN) < 0)
379 perror("BLKTRACETEARDOWN");
cf9208ea 380
e7c9f3ff 381 close(dip->fd);
cf9208ea 382 dip->fd = -1;
707b0914 383 }
d0ca268b
JA
384}
385
e7c9f3ff
NS
386static void stop_all_traces(void)
387{
388 struct device_information *dip;
389 int i;
390
eb3c8108
JA
391 for_each_dip(dip, i) {
392 dip->drop_count = get_dropped_count(dip->buts_name);
e7c9f3ff 393 stop_trace(dip);
eb3c8108 394 }
e7c9f3ff
NS
395}
396
eb3c8108
JA
397static void wait_for_data(struct thread_information *tip)
398{
399 struct pollfd pfd = { .fd = tip->fd, .events = POLLIN };
400
9db17354 401 do {
b4aabcb3 402 poll(&pfd, 1, 100);
9db17354
JA
403 if (pfd.revents & POLLIN)
404 break;
405 if (tip->ofile_stdout)
406 break;
407 } while (!is_done());
eb3c8108
JA
408}
409
0cc7d25e
JA
410static int read_data_file(struct thread_information *tip, void *buf,
411 unsigned int len)
d0ca268b 412{
ae9f71b3 413 int ret = 0;
bbabf03a 414
9db17354
JA
415 do {
416 wait_for_data(tip);
ae9f71b3 417
9db17354
JA
418 ret = read(tip->fd, buf, len);
419 if (!ret)
420 continue;
421 else if (ret > 0)
422 return ret;
423 else {
bbabf03a 424 if (errno != EAGAIN) {
a3e4d330
JA
425 perror(tip->fn);
426 fprintf(stderr,"Thread %d failed read of %s\n",
427 tip->cpu, tip->fn);
428 break;
429 }
9db17354 430 continue;
bbabf03a 431 }
9db17354 432 } while (!is_done());
8a43bac5 433
bbabf03a 434 return ret;
8e86c98a 435
8a43bac5
JA
436}
437
0cc7d25e
JA
438static int read_data_net(struct thread_information *tip, void *buf,
439 unsigned int len)
8e86c98a
JA
440{
441 unsigned int bytes_left = len;
442 int ret = 0;
443
444 do {
445 ret = recv(net_in_fd, buf, bytes_left, MSG_WAITALL);
446
447 if (!ret)
448 continue;
449 else if (ret < 0) {
450 if (errno != EAGAIN) {
451 perror(tip->fn);
452 fprintf(stderr, "server: failed read\n");
453 return 0;
454 }
455 continue;
456 } else {
457 buf += ret;
458 bytes_left -= ret;
459 }
460 } while (!is_done() && bytes_left);
461
410d7c62 462 return len - bytes_left;
8e86c98a
JA
463}
464
0cc7d25e
JA
465static int read_data(struct thread_information *tip, void *buf,
466 unsigned int len)
8e86c98a 467{
663962f7 468 return tip->read_data(tip, buf, len);
8e86c98a
JA
469}
470
471static inline struct tip_subbuf *
472subbuf_fifo_dequeue(struct thread_information *tip)
a3e4d330 473{
21f55651
JA
474 const int head = tip->fifo.head;
475 const int next = (head + 1) & (FIFO_SIZE - 1);
476
477 if (head != tip->fifo.tail) {
478 struct tip_subbuf *ts = tip->fifo.q[head];
479
480 store_barrier();
481 tip->fifo.head = next;
482 return ts;
483 }
484
485 return NULL;
9db17354 486}
eb3c8108 487
21f55651
JA
488static inline int subbuf_fifo_queue(struct thread_information *tip,
489 struct tip_subbuf *ts)
9db17354 490{
21f55651
JA
491 const int tail = tip->fifo.tail;
492 const int next = (tail + 1) & (FIFO_SIZE - 1);
493
494 if (next != tip->fifo.head) {
495 tip->fifo.q[tail] = ts;
496 store_barrier();
497 tip->fifo.tail = next;
498 return 0;
499 }
500
501 fprintf(stderr, "fifo too small!\n");
502 return 1;
a3e4d330
JA
503}
504
b7106311
JA
505/*
506 * For file output, truncate and mmap the file appropriately
507 */
8e86c98a 508static int mmap_subbuf(struct thread_information *tip, unsigned int maxlen)
b7106311
JA
509{
510 int ofd = fileno(tip->ofile);
511 int ret;
512
513 /*
514 * extend file, if we have to. use chunks of 16 subbuffers.
515 */
516 if (tip->fs_off + buf_size > tip->fs_buf_len) {
517 if (tip->fs_buf) {
5975d309 518 munlock(tip->fs_buf, tip->fs_buf_len);
b7106311
JA
519 munmap(tip->fs_buf, tip->fs_buf_len);
520 tip->fs_buf = NULL;
521 }
522
523 tip->fs_off = tip->fs_size & (page_size - 1);
524 tip->fs_buf_len = (16 * buf_size) - tip->fs_off;
525 tip->fs_max_size += tip->fs_buf_len;
526
527 if (ftruncate(ofd, tip->fs_max_size) < 0) {
528 perror("ftruncate");
529 return -1;
530 }
531
532 tip->fs_buf = mmap(NULL, tip->fs_buf_len, PROT_WRITE,
533 MAP_SHARED, ofd, tip->fs_size - tip->fs_off);
534 if (tip->fs_buf == MAP_FAILED) {
535 perror("mmap");
536 return -1;
537 }
5975d309 538 mlock(tip->fs_buf, tip->fs_buf_len);
b7106311
JA
539 }
540
8e86c98a 541 ret = read_data(tip, tip->fs_buf + tip->fs_off, maxlen);
b7106311 542 if (ret >= 0) {
dbfbd6db 543 tip->data_read += ret;
b7106311
JA
544 tip->fs_size += ret;
545 tip->fs_off += ret;
546 return 0;
547 }
548
549 return -1;
550}
551
18eed2a7
JA
552/*
553 * Use the copy approach for pipes and network
554 */
555static int get_subbuf(struct thread_information *tip, unsigned int maxlen)
556{
557 struct tip_subbuf *ts = malloc(sizeof(*ts));
558 int ret;
559
560 ts->buf = malloc(buf_size);
561 ts->max_len = maxlen;
562
563 ret = read_data(tip, ts->buf, ts->max_len);
564 if (ret > 0) {
565 ts->len = ret;
dbfbd6db 566 tip->data_read += ret;
18eed2a7
JA
567 return subbuf_fifo_queue(tip, ts);
568 }
569
570 return ret;
571}
572
32f18c48
JA
573static int get_subbuf_sendfile(struct thread_information *tip,
574 unsigned int maxlen)
575{
11eedd9b 576 struct tip_subbuf *ts;
32f18c48 577 struct stat sb;
1be42f3d 578 unsigned int ready, this_size;
11eedd9b 579 int err;
32f18c48 580
18eed2a7
JA
581 wait_for_data(tip);
582
583 /*
584 * hack to get last data out, we can't use sendfile for that
585 */
586 if (is_done())
587 return get_subbuf(tip, maxlen);
588
32f18c48
JA
589 if (fstat(tip->fd, &sb) < 0) {
590 perror("trace stat");
591 return 1;
592 }
593
11eedd9b 594 ready = sb.st_size - tip->ofile_offset;
663962f7
JA
595 if (!ready) {
596 /*
597 * delay a little, since we poll() will return data available
598 * until sendfile() is run
599 */
600 usleep(100);
11eedd9b 601 return 0;
663962f7 602 }
11eedd9b 603
1be42f3d 604 this_size = buf_size;
11eedd9b 605 while (ready) {
1be42f3d
JA
606 if (this_size > ready)
607 this_size = ready;
608
11eedd9b
JA
609 ts = malloc(sizeof(*ts));
610
611 ts->max_len = maxlen;
612 ts->buf = NULL;
613
1be42f3d 614 ts->len = this_size;
11eedd9b
JA
615 ts->max_len = ts->len;
616 ts->offset = tip->ofile_offset;
617 tip->ofile_offset += ts->len;
618
619 err = subbuf_fifo_queue(tip, ts);
620 if (err)
621 return err;
622
1be42f3d 623 ready -= this_size;
11eedd9b
JA
624 }
625
626 return 0;
32f18c48
JA
627}
628
9db17354 629static void close_thread(struct thread_information *tip)
a3e4d330 630{
9db17354
JA
631 if (tip->fd != -1)
632 close(tip->fd);
11eedd9b
JA
633 if (tip->pfd != -1)
634 close(tip->pfd);
9db17354
JA
635 if (tip->ofile)
636 fclose(tip->ofile);
637 if (tip->ofile_buffer)
638 free(tip->ofile_buffer);
639 if (tip->fd_buf)
640 free(tip->fd_buf);
11eedd9b
JA
641 if (tip->pfd_buf)
642 free(tip->pfd_buf);
1c99bc21 643
9db17354 644 tip->fd = -1;
11eedd9b 645 tip->pfd = -1;
9db17354
JA
646 tip->ofile = NULL;
647 tip->ofile_buffer = NULL;
648 tip->fd_buf = NULL;
a3e4d330
JA
649}
650
8e86c98a
JA
651static void tip_ftrunc_final(struct thread_information *tip)
652{
653 /*
654 * truncate to right size and cleanup mmap
655 */
656 if (tip->ofile_mmap) {
657 int ofd = fileno(tip->ofile);
658
659 if (tip->fs_buf)
660 munmap(tip->fs_buf, tip->fs_buf_len);
661
662 ftruncate(ofd, tip->fs_size);
663 }
664}
665
9db17354 666static void *thread_main(void *arg)
a3e4d330 667{
9db17354
JA
668 struct thread_information *tip = arg;
669 pid_t pid = getpid();
670 cpu_set_t cpu_mask;
a3e4d330 671
9db17354
JA
672 CPU_ZERO(&cpu_mask);
673 CPU_SET((tip->cpu), &cpu_mask);
a3e4d330 674
9db17354
JA
675 if (sched_setaffinity(pid, sizeof(cpu_mask), &cpu_mask) == -1) {
676 perror("sched_setaffinity");
677 exit_trace(1);
678 }
a3e4d330 679
9db17354
JA
680 snprintf(tip->fn, sizeof(tip->fn), "%s/block/%s/trace%d",
681 relay_path, tip->device->buts_name, tip->cpu);
682 tip->fd = open(tip->fn, O_RDONLY);
683 if (tip->fd < 0) {
684 perror(tip->fn);
685 fprintf(stderr,"Thread %d failed open of %s\n", tip->cpu,
686 tip->fn);
687 exit_trace(1);
a3e4d330
JA
688 }
689
11eedd9b
JA
690 if (net_mode == Net_client && net_sendfile) {
691 char tmp[MAXPATHLEN + 64];
692
693 snprintf(tmp, sizeof(tmp), "%s/block/%s/trace%d.padding",
694 relay_path, tip->device->buts_name, tip->cpu);
695
696 tip->pfd = open(tmp, O_RDONLY);
697 if (tip->pfd < 0) {
698 fprintf(stderr, "Couldn't open padding file %s\n", tmp);
699 exit_trace(1);
700 }
701
702 tip->pfd_buf = malloc(buf_nr * sizeof(size_t));
703 }
704
b7106311 705 while (!is_done()) {
0cc7d25e
JA
706 if (tip->get_subbuf(tip, buf_size))
707 break;
b7106311
JA
708 }
709
8e86c98a
JA
710 tip_ftrunc_final(tip);
711 tip->exited = 1;
712 return NULL;
713}
b7106311 714
8e86c98a
JA
/*
 * Send all buf_len bytes of buf on socket fd, calling send() again after
 * a partial send.
 *
 * Returns 0 once everything is sent, 1 if send() fails.
 */
static int write_data_net(int fd, void *buf, unsigned int buf_len)
{
	unsigned int remaining = buf_len;
	char *pos = buf;

	while (remaining) {
		int sent = send(fd, pos, remaining, 0);

		if (sent < 0) {
			perror("send");
			return 1;
		}

		pos += sent;
		remaining -= sent;
	}

	return 0;
}
733
32f18c48 734static int net_send_header(struct thread_information *tip, unsigned int len)
8e86c98a
JA
735{
736 struct blktrace_net_hdr hdr;
8e86c98a
JA
737
738 hdr.magic = BLK_IO_TRACE_MAGIC;
22cd0c02 739 strcpy(hdr.buts_name, tip->device->buts_name);
8e86c98a 740 hdr.cpu = tip->cpu;
22cd0c02 741 hdr.max_cpus = ncpus;
32f18c48 742 hdr.len = len;
8e86c98a 743
32f18c48
JA
744 return write_data_net(net_out_fd, &hdr, sizeof(hdr));
745}
8e86c98a 746
6a752c90
JA
747/*
748 * send header with 0 length to signal end-of-run
749 */
750static void net_client_send_close(void)
751{
752 struct blktrace_net_hdr hdr;
753
754 hdr.magic = BLK_IO_TRACE_MAGIC;
755 hdr.cpu = 0;
756 hdr.max_cpus = ncpus;
757 hdr.len = 0;
758
759 write_data_net(net_out_fd, &hdr, sizeof(hdr));
760}
761
32f18c48
JA
762static int flush_subbuf_net(struct thread_information *tip,
763 struct tip_subbuf *ts)
764{
765 if (net_send_header(tip, ts->len))
766 return 1;
22cd0c02
JA
767 if (write_data_net(net_out_fd, ts->buf, ts->len))
768 return 1;
8e86c98a 769
18eed2a7 770 tip->data_read += ts->len;
f0597a7e 771 free(ts->buf);
8e86c98a
JA
772 free(ts);
773 return 0;
774}
775
32f18c48
JA
776static int flush_subbuf_sendfile(struct thread_information *tip,
777 struct tip_subbuf *ts)
778{
11eedd9b
JA
779 size_t padding;
780 unsigned subbuf;
781 unsigned len;
18eed2a7
JA
782
783 /*
784 * currently we cannot use sendfile() on the last bytes read, as they
785 * may not be a full subbuffer. get_subbuf_sendfile() falls back to
786 * the read approach for those, so use send() to ship them out
787 */
788 if (ts->buf)
789 return flush_subbuf_net(tip, ts);
11eedd9b
JA
790
791 subbuf = (ts->offset / buf_size) % buf_nr;
792 padding = get_subbuf_padding(tip, subbuf);
793 len = ts->len - padding;
794
795 if (net_send_header(tip, len))
32f18c48 796 return 1;
11eedd9b 797 if (sendfile(net_out_fd, tip->fd, &ts->offset, len) < 0) {
32f18c48
JA
798 perror("sendfile");
799 return 1;
800 }
801
18eed2a7 802 tip->data_read += ts->len;
32f18c48
JA
803 free(ts);
804 return 0;
805}
806
8e86c98a
JA
807static int write_data(struct thread_information *tip, void *buf,
808 unsigned int buf_len)
8a43bac5 809{
7126171a 810 int ret;
8a43bac5 811
6480258a
JA
812 if (!buf_len)
813 return 0;
814
7126171a
JA
815 while (1) {
816 ret = fwrite(buf, buf_len, 1, tip->ofile);
007c233c 817 if (ret == 1)
8a43bac5
JA
818 break;
819
db6fe5bc
JA
820 if (ret < 0) {
821 perror("write");
822 return 1;
8a43bac5 823 }
d0ca268b
JA
824 }
825
9db17354 826 if (tip->ofile_stdout)
7126171a
JA
827 fflush(tip->ofile);
828
8a43bac5
JA
829 return 0;
830}
831
8e86c98a
JA
832static int flush_subbuf_file(struct thread_information *tip,
833 struct tip_subbuf *ts)
8a43bac5 834{
9db17354
JA
835 unsigned int offset = 0;
836 struct blk_io_trace *t;
837 int pdu_len, events = 0;
8a43bac5 838
9db17354 839 /*
7de86b12 840 * surplus from last run
9db17354 841 */
7de86b12
AB
842 if (tip->leftover_ts) {
843 struct tip_subbuf *prev_ts = tip->leftover_ts;
844
9e8b753c 845 if (prev_ts->len + ts->len > prev_ts->max_len) {
7de86b12
AB
846 prev_ts->max_len += ts->len;
847 prev_ts->buf = realloc(prev_ts->buf, prev_ts->max_len);
848 }
849
9e8b753c 850 memcpy(prev_ts->buf + prev_ts->len, ts->buf, ts->len);
7de86b12
AB
851 prev_ts->len += ts->len;
852
853 free(ts->buf);
854 free(ts);
855
856 ts = prev_ts;
857 tip->leftover_ts = NULL;
9db17354 858 }
d0ca268b 859
9db17354
JA
860 while (offset + sizeof(*t) <= ts->len) {
861 t = ts->buf + offset;
3a9d6c13 862
9cfa6c2b
AB
863 if (verify_trace(t)) {
864 write_data(tip, ts->buf, offset);
9db17354 865 return -1;
9cfa6c2b 866 }
3a9d6c13 867
9db17354 868 pdu_len = t->pdu_len;
3a9d6c13 869
9db17354 870 if (offset + sizeof(*t) + pdu_len > ts->len)
3a9d6c13 871 break;
4b5db44a 872
9db17354
JA
873 offset += sizeof(*t) + pdu_len;
874 tip->events_processed++;
b7106311 875 tip->data_read += sizeof(*t) + pdu_len;
9db17354 876 events++;
3a9d6c13
JA
877 }
878
9cfa6c2b
AB
879 if (write_data(tip, ts->buf, offset))
880 return -1;
881
3a9d6c13 882 /*
9db17354 883 * leftover bytes, save them for next time
3a9d6c13 884 */
9db17354 885 if (offset != ts->len) {
7de86b12 886 tip->leftover_ts = ts;
9e8b753c
JA
887 ts->len -= offset;
888 memmove(ts->buf, ts->buf + offset, ts->len);
7de86b12
AB
889 } else {
890 free(ts->buf);
891 free(ts);
9db17354 892 }
4b5db44a 893
9db17354 894 return events;
4b5db44a
JA
895}
896
9db17354 897static int write_tip_events(struct thread_information *tip)
d5396421 898{
21f55651 899 struct tip_subbuf *ts = subbuf_fifo_dequeue(tip);
d5396421 900
0cc7d25e
JA
901 if (ts)
902 return tip->flush_subbuf(tip, ts);
91816d54 903
9db17354 904 return 0;
91816d54
JA
905}
906
9db17354
JA
907/*
908 * scans the tips we know and writes out the subbuffers we accumulate
909 */
910static void get_and_write_events(void)
d0ca268b 911{
9db17354
JA
912 struct device_information *dip;
913 struct thread_information *tip;
27223f19 914 int i, j, events, ret, tips_running;
d0ca268b 915
9db17354
JA
916 while (!is_done()) {
917 events = 0;
d0ca268b 918
9db17354
JA
919 for_each_dip(dip, i) {
920 for_each_tip(dip, tip, j) {
921 ret = write_tip_events(tip);
922 if (ret > 0)
923 events += ret;
924 }
925 }
d0ca268b 926
9db17354
JA
927 if (!events)
928 usleep(10);
d0ca268b
JA
929 }
930
a3e4d330 931 /*
9db17354 932 * reap stored events
a3e4d330 933 */
9db17354
JA
934 do {
935 events = 0;
27223f19 936 tips_running = 0;
9db17354
JA
937 for_each_dip(dip, i) {
938 for_each_tip(dip, tip, j) {
939 ret = write_tip_events(tip);
940 if (ret > 0)
941 events += ret;
27223f19 942 tips_running += !tip->exited;
9db17354 943 }
69e65a9e 944 }
9db17354 945 usleep(10);
27223f19 946 } while (events || tips_running);
d0ca268b
JA
947}
948
b7106311
JA
949static void wait_for_threads(void)
950{
951 /*
8e86c98a
JA
952 * for piped or network output, poll and fetch data for writeout.
953 * for files, we just wait around for trace threads to exit
b7106311 954 */
8e86c98a
JA
955 if ((output_name && !strcmp(output_name, "-")) ||
956 net_mode == Net_client)
b7106311
JA
957 get_and_write_events();
958 else {
959 struct device_information *dip;
960 struct thread_information *tip;
961 int i, j, tips_running;
962
963 do {
964 tips_running = 0;
965 usleep(1000);
966
967 for_each_dip(dip, i)
968 for_each_tip(dip, tip, j)
969 tips_running += !tip->exited;
970 } while (tips_running);
971 }
6a752c90
JA
972
973 if (net_mode == Net_client)
974 net_client_send_close();
b7106311
JA
975}
976
8e86c98a
JA
977static void fill_ofname(char *dst, char *buts_name, int cpu)
978{
979 int len = 0;
980
981 if (output_dir)
982 len = sprintf(dst, "%s/", output_dir);
983
984 if (output_name)
985 sprintf(dst + len, "%s.blktrace.%d", output_name, cpu);
986 else
987 sprintf(dst + len, "%s.blktrace.%d", buts_name, cpu);
988}
989
0cc7d25e
JA
990static void fill_ops(struct thread_information *tip)
991{
992 /*
993 * setup ops
994 */
32f18c48
JA
995 if (net_mode == Net_client) {
996 if (net_sendfile) {
997 tip->get_subbuf = get_subbuf_sendfile;
998 tip->flush_subbuf = flush_subbuf_sendfile;
999 } else {
1000 tip->get_subbuf = get_subbuf;
1001 tip->flush_subbuf = flush_subbuf_net;
1002 }
1003 } else {
1004 if (tip->ofile_mmap)
1005 tip->get_subbuf = mmap_subbuf;
1006 else
1007 tip->get_subbuf = get_subbuf;
0cc7d25e 1008
0cc7d25e 1009 tip->flush_subbuf = flush_subbuf_file;
32f18c48
JA
1010 }
1011
0cc7d25e
JA
1012 if (net_mode == Net_server)
1013 tip->read_data = read_data_net;
1014 else
1015 tip->read_data = read_data_file;
1016}
1017
ddf22842
JA
1018static int tip_open_output(struct device_information *dip,
1019 struct thread_information *tip)
d0ca268b 1020{
ddf22842 1021 int pipeline = output_name && !strcmp(output_name, "-");
8e86c98a 1022 int mode, vbuf_size;
22cd0c02 1023 char op[64];
d0ca268b 1024
ddf22842
JA
1025 if (net_mode == Net_client) {
1026 tip->ofile = NULL;
1027 tip->ofile_stdout = 0;
1028 tip->ofile_mmap = 0;
1029 vbuf_size = 0;
1be42f3d 1030 mode = 0; /* gcc 4.x issues a bogus warning */
ddf22842
JA
1031 } else if (pipeline) {
1032 tip->ofile = fdopen(STDOUT_FILENO, "w");
1033 tip->ofile_stdout = 1;
1034 tip->ofile_mmap = 0;
1035 mode = _IOLBF;
1036 vbuf_size = 512;
1037 } else {
1038 fill_ofname(op, dip->buts_name, tip->cpu);
1039 tip->ofile = fopen(op, "w+");
1040 tip->ofile_stdout = 0;
1041 tip->ofile_mmap = 1;
1042 mode = _IOFBF;
1043 vbuf_size = OFILE_BUF;
1044 }
d5396421 1045
ddf22842
JA
1046 if (net_mode != Net_client && tip->ofile == NULL) {
1047 perror(op);
1048 return 1;
1049 }
d5396421 1050
ddf22842 1051 if (vbuf_size) {
57e8a2ad
TZ
1052 tip->ofile_buffer = malloc(vbuf_size);
1053 if (setvbuf(tip->ofile, tip->ofile_buffer, mode, vbuf_size)) {
007c233c
JA
1054 perror("setvbuf");
1055 close_thread(tip);
1056 return 1;
1057 }
ddf22842
JA
1058 }
1059
1060 fill_ops(tip);
1061 return 0;
1062}
007c233c 1063
ddf22842
JA
1064static int start_threads(struct device_information *dip)
1065{
1066 struct thread_information *tip;
1067 int j;
1068
1069 for_each_tip(dip, tip, j) {
1070 tip->cpu = j;
1071 tip->device = dip;
1072 tip->events_processed = 0;
11eedd9b
JA
1073 tip->fd = -1;
1074 tip->pfd = -1;
ddf22842
JA
1075 memset(&tip->fifo, 0, sizeof(tip->fifo));
1076 tip->leftover_ts = NULL;
1077
1078 if (tip_open_output(dip, tip))
1079 return 1;
0cc7d25e 1080
9db17354 1081 if (pthread_create(&tip->thread, NULL, thread_main, tip)) {
e7c9f3ff 1082 perror("pthread_create");
007c233c 1083 close_thread(tip);
e7c9f3ff 1084 return 1;
d0ca268b
JA
1085 }
1086 }
1087
e7c9f3ff 1088 return 0;
d0ca268b
JA
1089}
1090
e7c9f3ff 1091static void stop_threads(struct device_information *dip)
3aabcd89 1092{
e7c9f3ff 1093 struct thread_information *tip;
91816d54 1094 unsigned long ret;
007c233c
JA
1095 int i;
1096
9db17354 1097 for_each_tip(dip, tip, i) {
91816d54 1098 (void) pthread_join(tip->thread, (void *) &ret);
9db17354
JA
1099 close_thread(tip);
1100 }
3aabcd89
JA
1101}
1102
e7c9f3ff 1103static void stop_all_threads(void)
72ca8801 1104{
e7c9f3ff 1105 struct device_information *dip;
72ca8801
NS
1106 int i;
1107
99c1f5ab 1108 for_each_dip(dip, i)
e7c9f3ff
NS
1109 stop_threads(dip);
1110}
1111
1112static void stop_all_tracing(void)
1113{
1114 struct device_information *dip;
91816d54 1115 int i;
007c233c 1116
91816d54 1117 for_each_dip(dip, i)
e7c9f3ff 1118 stop_trace(dip);
72ca8801
NS
1119}
1120
1121static void exit_trace(int status)
1122{
eb3c8108
JA
1123 if (!is_trace_stopped()) {
1124 trace_stopped = 1;
1125 stop_all_threads();
1126 stop_all_tracing();
1127 }
1128
72ca8801
NS
1129 exit(status);
1130}
1131
e7c9f3ff
NS
1132static int resize_devices(char *path)
1133{
1134 int size = (ndevs + 1) * sizeof(struct device_information);
1135
1136 device_information = realloc(device_information, size);
1137 if (!device_information) {
1138 fprintf(stderr, "Out of memory, device %s (%d)\n", path, size);
1139 return 1;
1140 }
1141 device_information[ndevs].path = path;
1142 ndevs++;
1143 return 0;
1144}
1145
1146static int open_devices(void)
d0ca268b 1147{
e7c9f3ff 1148 struct device_information *dip;
d0ca268b 1149 int i;
d0ca268b 1150
99c1f5ab 1151 for_each_dip(dip, i) {
cf9208ea 1152 dip->fd = open(dip->path, O_RDONLY | O_NONBLOCK);
e7c9f3ff
NS
1153 if (dip->fd < 0) {
1154 perror(dip->path);
1155 return 1;
1156 }
1157 }
99c1f5ab 1158
e7c9f3ff
NS
1159 return 0;
1160}
1161
1162static int start_devices(void)
1163{
1164 struct device_information *dip;
1165 int i, j, size;
1166
1167 size = ncpus * sizeof(struct thread_information);
1168 thread_information = malloc(size * ndevs);
1169 if (!thread_information) {
1170 fprintf(stderr, "Out of memory, threads (%d)\n", size * ndevs);
1171 return 1;
1172 }
d5396421 1173
99c1f5ab 1174 for_each_dip(dip, i) {
e7c9f3ff
NS
1175 if (start_trace(dip)) {
1176 close(dip->fd);
1177 fprintf(stderr, "Failed to start trace on %s\n",
1178 dip->path);
1179 break;
1180 }
1181 }
99c1f5ab 1182
e7c9f3ff 1183 if (i != ndevs) {
99c1f5ab 1184 __for_each_dip(dip, j, i)
e7c9f3ff 1185 stop_trace(dip);
99c1f5ab 1186
e7c9f3ff
NS
1187 return 1;
1188 }
1189
99c1f5ab 1190 for_each_dip(dip, i) {
e7c9f3ff
NS
1191 dip->threads = thread_information + (i * ncpus);
1192 if (start_threads(dip)) {
1193 fprintf(stderr, "Failed to start worker threads\n");
1194 break;
1195 }
1196 }
99c1f5ab 1197
e7c9f3ff 1198 if (i != ndevs) {
99c1f5ab 1199 __for_each_dip(dip, j, i)
e7c9f3ff 1200 stop_threads(dip);
99c1f5ab 1201 for_each_dip(dip, i)
e7c9f3ff 1202 stop_trace(dip);
99c1f5ab 1203
e7c9f3ff 1204 return 1;
d0ca268b
JA
1205 }
1206
e7c9f3ff 1207 return 0;
d0ca268b
JA
1208}
1209
e7c9f3ff
NS
1210static void show_stats(void)
1211{
e7c9f3ff
NS
1212 struct device_information *dip;
1213 struct thread_information *tip;
b7106311 1214 unsigned long long events_processed, data_read;
eb3c8108 1215 unsigned long total_drops;
2f903295 1216 int i, j, no_stdout = 0;
eb3c8108
JA
1217
1218 if (is_stat_shown())
1219 return;
1220
2f903295
JA
1221 if (output_name && !strcmp(output_name, "-"))
1222 no_stdout = 1;
1223
eb3c8108 1224 stat_shown = 1;
428683db 1225
56070ea4 1226 total_drops = 0;
99c1f5ab 1227 for_each_dip(dip, i) {
2f903295 1228 if (!no_stdout)
56070ea4 1229 printf("Device: %s\n", dip->path);
e7c9f3ff 1230 events_processed = 0;
b7106311 1231 data_read = 0;
99c1f5ab 1232 for_each_tip(dip, tip, j) {
2f903295 1233 if (!no_stdout)
b7106311
JA
1234 printf(" CPU%3d: %20lu events, %8llu KiB data\n",
1235 tip->cpu, tip->events_processed,
54824c20 1236 (tip->data_read + 1023) >> 10);
e7c9f3ff 1237 events_processed += tip->events_processed;
b7106311 1238 data_read += tip->data_read;
e7c9f3ff 1239 }
eb3c8108 1240 total_drops += dip->drop_count;
2f903295 1241 if (!no_stdout)
b7106311
JA
1242 printf(" Total: %20llu events (dropped %lu), %8llu KiB data\n",
1243 events_processed, dip->drop_count,
18d8437d 1244 (data_read + 1023) >> 10);
e7c9f3ff 1245 }
56070ea4
JA
1246
1247 if (total_drops)
1248 fprintf(stderr, "You have dropped events, consider using a larger buffer size (-b)\n");
e7c9f3ff 1249}
52724a0e 1250
22cd0c02 1251static struct device_information *net_get_dip(char *buts_name)
8e86c98a 1252{
22cd0c02 1253 struct device_information *dip;
8e86c98a
JA
1254 int i;
1255
22cd0c02
JA
1256 for (i = 0; i < ndevs; i++) {
1257 dip = &device_information[i];
8e86c98a 1258
22cd0c02
JA
1259 if (!strcmp(dip->buts_name, buts_name))
1260 return dip;
8e86c98a
JA
1261 }
1262
22cd0c02
JA
1263 device_information = realloc(device_information, (ndevs + 1) * sizeof(*dip));
1264 dip = &device_information[ndevs];
1265 strcpy(dip->buts_name, buts_name);
410d7c62 1266 strcpy(dip->path, buts_name);
22cd0c02
JA
1267 ndevs++;
1268 dip->threads = malloc(ncpus * sizeof(struct thread_information));
1269 memset(dip->threads, 0, ncpus * sizeof(struct thread_information));
1270
1271 /*
1272 * open all files
1273 */
1274 for (i = 0; i < ncpus; i++) {
1275 struct thread_information *tip = &dip->threads[i];
8e86c98a 1276
22cd0c02 1277 tip->cpu = i;
22cd0c02 1278 tip->device = dip;
8e86c98a 1279
ddf22842 1280 if (tip_open_output(dip, tip))
22cd0c02 1281 return NULL;
8e86c98a
JA
1282 }
1283
22cd0c02
JA
1284 return dip;
1285}
1286
1287static struct thread_information *net_get_tip(struct blktrace_net_hdr *bnh)
1288{
1289 struct device_information *dip;
1290
1291 ncpus = bnh->max_cpus;
1292 dip = net_get_dip(bnh->buts_name);
1293 return &dip->threads[bnh->cpu];
8e86c98a
JA
1294}
1295
1296static int net_get_header(struct blktrace_net_hdr *bnh)
1297{
1298 int fl = fcntl(net_in_fd, F_GETFL);
1299 int bytes_left, ret;
1300 void *p = bnh;
1301
1302 fcntl(net_in_fd, F_SETFL, fl | O_NONBLOCK);
1303 bytes_left = sizeof(*bnh);
1304 while (bytes_left && !is_done()) {
1305 ret = recv(net_in_fd, p, bytes_left, MSG_WAITALL);
1306 if (ret < 0) {
1307 if (errno != EAGAIN) {
1308 perror("recv header");
1309 return 1;
1310 }
1311 usleep(100);
1312 continue;
1313 } else if (!ret) {
1314 usleep(100);
1315 continue;
1316 } else {
1317 p += ret;
1318 bytes_left -= ret;
1319 }
1320 }
1321 fcntl(net_in_fd, F_SETFL, fl & ~O_NONBLOCK);
1322 return 0;
1323}
1324
1325static int net_server_loop(void)
1326{
1327 struct thread_information *tip;
1328 struct blktrace_net_hdr bnh;
1329
1330 if (net_get_header(&bnh))
1331 return 1;
1332
1333 if (data_is_native == -1 && check_data_endianness(bnh.magic)) {
1334 fprintf(stderr, "server: received data is bad\n");
1335 return 1;
1336 }
1337
1338 if (!data_is_native) {
1339 bnh.cpu = be32_to_cpu(bnh.cpu);
1340 bnh.len = be32_to_cpu(bnh.len);
1341 }
1342
6a752c90
JA
1343 /*
1344 * len == 0 means that the other end signalled end-of-run
1345 */
1346 if (!bnh.len) {
1347 fprintf(stderr, "server: end of run\n");
1348 return 1;
1349 }
1350
8e86c98a
JA
1351 tip = net_get_tip(&bnh);
1352 if (!tip)
1353 return 1;
1354
1355 if (mmap_subbuf(tip, bnh.len))
1356 return 1;
1357
1358 return 0;
1359}
1360
1361/*
1362 * Start here when we are in server mode - just fetch data from the network
1363 * and dump to files
1364 */
1365static int net_server(void)
1366{
898bbd3b
JA
1367 struct device_information *dip;
1368 struct thread_information *tip;
8e86c98a
JA
1369 struct sockaddr_in addr;
1370 socklen_t socklen;
22cd0c02 1371 int fd, opt, i, j;
8e86c98a
JA
1372
1373 fd = socket(AF_INET, SOCK_STREAM, 0);
1374 if (fd < 0) {
1375 perror("server: socket");
1376 return 1;
1377 }
1378
1379 opt = 1;
1380 if (setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)) < 0) {
1381 perror("setsockopt");
1382 return 1;
1383 }
1384
1385 memset(&addr, 0, sizeof(addr));
1386 addr.sin_family = AF_INET;
1387 addr.sin_addr.s_addr = htonl(INADDR_ANY);
1388 addr.sin_port = htons(net_port);
1389
1390 if (bind(fd, (struct sockaddr *) &addr, sizeof(addr)) < 0) {
1391 perror("bind");
1392 return 1;
1393 }
1394
1395 if (listen(fd, 1) < 0) {
1396 perror("listen");
1397 return 1;
1398 }
1399
6a752c90 1400repeat:
bbb1c18a
JA
1401 signal(SIGINT, NULL);
1402 signal(SIGHUP, NULL);
1403 signal(SIGTERM, NULL);
1404 signal(SIGALRM, NULL);
1405
8e86c98a
JA
1406 printf("blktrace: waiting for incoming connection...\n");
1407
1408 socklen = sizeof(addr);
1409 net_in_fd = accept(fd, (struct sockaddr *) &addr, &socklen);
1410 if (net_in_fd < 0) {
1411 perror("accept");
1412 return 1;
1413 }
1414
1415 signal(SIGINT, handle_sigint);
1416 signal(SIGHUP, handle_sigint);
1417 signal(SIGTERM, handle_sigint);
1418 signal(SIGALRM, handle_sigint);
1419
e85ee0f2 1420 printf("blktrace: connection from %s\n", inet_ntoa(addr.sin_addr));
8e86c98a
JA
1421
1422 while (!is_done()) {
1423 if (net_server_loop())
1424 break;
1425 }
1426
898bbd3b
JA
1427 for_each_dip(dip, i)
1428 for_each_tip(dip, tip, j)
1429 tip_ftrunc_final(tip);
8e86c98a 1430
410d7c62 1431 show_stats();
6a752c90
JA
1432
1433 if (is_done())
1434 return 0;
1435
898bbd3b
JA
1436 /*
1437 * cleanup for next run
1438 */
1439 for_each_dip(dip, i) {
1440 for_each_tip(dip, tip, j)
1441 fclose(tip->ofile);
1442
1443 free(dip->threads);
1444 }
1445
1446 free(device_information);
1447 device_information = NULL;
1448 ncpus = ndevs = 0;
b46a0342
JA
1449
1450 close(net_in_fd);
1451 net_in_fd = -1;
dbfbd6db 1452 stat_shown = 0;
6a752c90 1453 goto repeat;
8e86c98a
JA
1454}
1455
1456/*
1457 * Setup outgoing network connection where we will transmit data
1458 */
1459static int net_setup_client(void)
1460{
1461 struct sockaddr_in addr;
1462 int fd;
1463
1464 fd = socket(AF_INET, SOCK_STREAM, 0);
1465 if (fd < 0) {
1466 perror("client: socket");
1467 return 1;
1468 }
1469
1470 memset(&addr, 0, sizeof(addr));
1471 addr.sin_family = AF_INET;
1472 addr.sin_port = htons(net_port);
1473
1474 if (inet_aton(hostname, &addr.sin_addr) != 1) {
1475 struct hostent *hent = gethostbyname(hostname);
1476 if (!hent) {
1477 perror("gethostbyname");
1478 return 1;
1479 }
1480
1481 memcpy(&addr.sin_addr, hent->h_addr, 4);
1482 strcpy(hostname, hent->h_name);
1483 }
1484
1485 printf("blktrace: connecting to %s\n", hostname);
1486
1487 if (connect(fd, (struct sockaddr *) &addr, sizeof(addr)) < 0) {
1488 perror("client: connect");
1489 return 1;
1490 }
1491
1492 printf("blktrace: connected!\n");
1493 net_out_fd = fd;
1494 return 0;
1495}
1496
52724a0e
JA
/*
 * Option summary appended to the usage line by show_usage(). Adjacent
 * string literals are concatenated by the compiler, one per output line.
 */
static char usage_str[] =
	"-d <dev> [ -r relay path ] [ -o <output> ] [-k ] [ -w time ]\n"
	"[ -a action ] [ -A action mask ] [ -v ]\n\n"
	"\t-d Use specified device. May also be given last after options\n"
	"\t-r Path to mounted relayfs, defaults to /relay\n"
	"\t-o File(s) to send output to\n"
	"\t-D Directory to prepend to output file names\n"
	"\t-k Kill a running trace\n"
	"\t-w Stop after defined time, in seconds\n"
	"\t-a Only trace specified actions. See documentation\n"
	"\t-A Give trace mask as a single value. See documentation\n"
	"\t-b Sub buffer size in KiB\n"
	"\t-n Number of sub buffers\n"
	"\t-l Run in network listen mode (blktrace server)\n"
	"\t-h Run in network client mode, connecting to the given host\n"
	"\t-p Network port to use (default 8462)\n"
	"\t-s Make the network client use sendfile() to transfer data\n"
	"\t-V Print program version info\n\n";
52724a0e 1515
ee1f4158
NS
1516static void show_usage(char *program)
1517{
52724a0e 1518 fprintf(stderr, "Usage: %s %s %s",program, blktrace_version, usage_str);
ee1f4158 1519}
d0ca268b
JA
1520
1521int main(int argc, char *argv[])
1522{
5270dddd 1523 static char default_relay_path[] = "/relay";
e3e74029 1524 struct statfs st;
d39c04ca 1525 int i, c;
ece238a6 1526 int stop_watch = 0;
d39c04ca
AB
1527 int act_mask_tmp = 0;
1528
1529 while ((c = getopt_long(argc, argv, S_OPTS, l_opts, NULL)) >= 0) {
1530 switch (c) {
1531 case 'a':
1532 i = find_mask_map(optarg);
1533 if (i < 0) {
ab197ca7 1534 fprintf(stderr,"Invalid action mask %s\n",
d39c04ca 1535 optarg);
7425d456 1536 return 1;
d39c04ca
AB
1537 }
1538 act_mask_tmp |= i;
1539 break;
1540
1541 case 'A':
98f8386b
AB
1542 if ((sscanf(optarg, "%x", &i) != 1) ||
1543 !valid_act_opt(i)) {
d39c04ca 1544 fprintf(stderr,
ab197ca7 1545 "Invalid set action mask %s/0x%x\n",
d39c04ca 1546 optarg, i);
7425d456 1547 return 1;
d39c04ca
AB
1548 }
1549 act_mask_tmp = i;
1550 break;
d0ca268b 1551
d39c04ca 1552 case 'd':
e7c9f3ff
NS
1553 if (resize_devices(optarg) != 0)
1554 return 1;
d39c04ca
AB
1555 break;
1556
5270dddd
JA
1557 case 'r':
1558 relay_path = optarg;
1559 break;
1560
d5396421 1561 case 'o':
66efebf8 1562 output_name = optarg;
d5396421 1563 break;
bc39777c
JA
1564 case 'k':
1565 kill_running_trace = 1;
1566 break;
ece238a6
NS
1567 case 'w':
1568 stop_watch = atoi(optarg);
1569 if (stop_watch <= 0) {
1570 fprintf(stderr,
1571 "Invalid stopwatch value (%d secs)\n",
1572 stop_watch);
1573 return 1;
1574 }
1575 break;
57ea8602 1576 case 'V':
52724a0e
JA
1577 printf("%s version %s\n", argv[0], blktrace_version);
1578 return 0;
129aa440 1579 case 'b':
eb3c8108 1580 buf_size = strtoul(optarg, NULL, 10);
183a0855 1581 if (buf_size <= 0 || buf_size > 16*1024) {
129aa440 1582 fprintf(stderr,
eb3c8108 1583 "Invalid buffer size (%lu)\n",buf_size);
129aa440
JA
1584 return 1;
1585 }
1586 buf_size <<= 10;
1587 break;
1588 case 'n':
eb3c8108 1589 buf_nr = strtoul(optarg, NULL, 10);
129aa440
JA
1590 if (buf_nr <= 0) {
1591 fprintf(stderr,
eb3c8108 1592 "Invalid buffer nr (%lu)\n", buf_nr);
129aa440
JA
1593 return 1;
1594 }
1595 break;
d1d7f15f
JA
1596 case 'D':
1597 output_dir = optarg;
1598 break;
8e86c98a
JA
1599 case 'h':
1600 net_mode = Net_client;
1601 strcpy(hostname, optarg);
1602 break;
1603 case 'l':
1604 net_mode = Net_server;
1605 break;
1606 case 'p':
1607 net_port = atoi(optarg);
1608 break;
32f18c48
JA
1609 case 's':
1610 net_sendfile = 1;
1611 break;
d39c04ca 1612 default:
ee1f4158 1613 show_usage(argv[0]);
7425d456 1614 return 1;
d39c04ca
AB
1615 }
1616 }
1617
8e86c98a
JA
1618 setlocale(LC_NUMERIC, "en_US");
1619
1620 page_size = getpagesize();
1621
1622 if (net_mode == Net_server)
1623 return net_server();
1624
22cd0c02
JA
1625 while (optind < argc) {
1626 if (resize_devices(argv[optind++]) != 0)
1627 return 1;
1628 }
1629
e7c9f3ff 1630 if (ndevs == 0) {
ee1f4158 1631 show_usage(argv[0]);
7425d456 1632 return 1;
d39c04ca
AB
1633 }
1634
5270dddd
JA
1635 if (!relay_path)
1636 relay_path = default_relay_path;
1637
d5396421 1638 if (act_mask_tmp != 0)
d39c04ca 1639 act_mask = act_mask_tmp;
d0ca268b 1640
e3e74029
NS
1641 if (statfs(relay_path, &st) < 0) {
1642 perror("statfs");
1643 fprintf(stderr,"%s does not appear to be a valid path\n",
1644 relay_path);
1645 return 1;
64acacae 1646 } else if (st.f_type != (long) RELAYFS_TYPE) {
e3e74029 1647 fprintf(stderr,"%s does not appear to be a relay filesystem\n",
d0ca268b 1648 relay_path);
7425d456 1649 return 1;
d0ca268b
JA
1650 }
1651
e7c9f3ff 1652 if (open_devices() != 0)
7425d456 1653 return 1;
bc39777c
JA
1654
1655 if (kill_running_trace) {
e7c9f3ff 1656 stop_all_traces();
7425d456 1657 return 0;
bc39777c
JA
1658 }
1659
e7c9f3ff
NS
1660 ncpus = sysconf(_SC_NPROCESSORS_ONLN);
1661 if (ncpus < 0) {
1662 fprintf(stderr, "sysconf(_SC_NPROCESSORS_ONLN) failed\n");
7425d456 1663 return 1;
d0ca268b
JA
1664 }
1665
d0ca268b
JA
1666 signal(SIGINT, handle_sigint);
1667 signal(SIGHUP, handle_sigint);
1668 signal(SIGTERM, handle_sigint);
ece238a6 1669 signal(SIGALRM, handle_sigint);
d0ca268b 1670
8e86c98a
JA
1671 if (net_mode == Net_client && net_setup_client())
1672 return 1;
1673
1674 if (start_devices() != 0)
1675 return 1;
1676
e7c9f3ff 1677 atexit(stop_all_tracing);
830fd65c 1678
ece238a6
NS
1679 if (stop_watch)
1680 alarm(stop_watch);
1681
b7106311 1682 wait_for_threads();
d0ca268b 1683
eb3c8108
JA
1684 if (!is_trace_stopped()) {
1685 trace_stopped = 1;
91816d54
JA
1686 stop_all_threads();
1687 stop_all_traces();
91816d54 1688 }
d0ca268b 1689
eb3c8108
JA
1690 show_stats();
1691
d0ca268b
JA
1692 return 0;
1693}
1694