client: handle connection failure
[fio.git] / client.c
CommitLineData
132159a5
JA
1#include <stdio.h>
2#include <stdlib.h>
3#include <unistd.h>
4#include <limits.h>
5#include <errno.h>
6#include <fcntl.h>
7#include <sys/poll.h>
8#include <sys/types.h>
9#include <sys/stat.h>
10#include <sys/wait.h>
11#include <sys/mman.h>
12#include <netinet/in.h>
13#include <arpa/inet.h>
14#include <netdb.h>
15
16#include "fio.h"
17#include "server.h"
18#include "crc/crc32.h"
b66570dc 19#include "flist.h"
132159a5 20
b66570dc
JA
21struct fio_client {
22 struct flist_head list;
23 struct sockaddr_in addr;
24 char *hostname;
25 int fd;
26};
27
28static FLIST_HEAD(client_list);
b66570dc
JA
29
30static struct fio_client *find_client_by_fd(int fd)
31{
32 struct fio_client *client;
33 struct flist_head *entry;
34
35 flist_for_each(entry, &client_list) {
36 client = flist_entry(entry, struct fio_client, list);
37
38 if (client->fd == fd)
39 return client;
40 }
41
42 return NULL;
43}
44
#if 0
/*
 * Walk client_list and return the client whose hostname compares equal to
 * 'name', or NULL when there is no such client. Currently compiled out.
 */
static struct fio_client *find_client_by_name(const char *name)
{
	struct flist_head *pos;

	flist_for_each(pos, &client_list) {
		struct fio_client *c = flist_entry(pos, struct fio_client, list);

		if (strcmp(name, c->hostname) == 0)
			return c;
	}

	return NULL;
}
#endif
b66570dc
JA
61
62static void remove_client(struct fio_client *client)
63{
46c48f1f 64 dprint(FD_NET, "removed client <%s>\n", client->hostname);
b66570dc
JA
65 flist_del(&client->list);
66 nr_clients--;
67 free(client->hostname);
68 free(client);
69}
132159a5 70
a37f69b7 71void fio_client_add(const char *hostname)
132159a5 72{
b66570dc 73 struct fio_client *client;
132159a5 74
46c48f1f 75 dprint(FD_NET, "added client <%s>\n", hostname);
b66570dc 76 client = malloc(sizeof(*client));
a37f69b7
JA
77 memset(client, 0, sizeof(*client));
78 client->hostname = strdup(hostname);
79 client->fd = -1;
80 flist_add(&client->list, &client_list);
81 nr_clients++;
82}
83
84static int fio_client_connect(struct fio_client *client)
85{
86 int fd;
132159a5 87
46c48f1f
JA
88 dprint(FD_NET, "connect to host %s\n", client->hostname);
89
b66570dc
JA
90 memset(&client->addr, 0, sizeof(client->addr));
91 client->addr.sin_family = AF_INET;
92 client->addr.sin_port = htons(fio_net_port);
93
a37f69b7 94 if (inet_aton(client->hostname, &client->addr.sin_addr) != 1) {
132159a5
JA
95 struct hostent *hent;
96
a37f69b7 97 hent = gethostbyname(client->hostname);
132159a5
JA
98 if (!hent) {
99 log_err("fio: gethostbyname: %s\n", strerror(errno));
100 return 1;
101 }
102
b66570dc 103 memcpy(&client->addr.sin_addr, hent->h_addr, 4);
132159a5
JA
104 }
105
106 fd = socket(AF_INET, SOCK_STREAM, 0);
107 if (fd < 0) {
108 log_err("fio: socket: %s\n", strerror(errno));
109 return 1;
110 }
111
b66570dc 112 if (connect(fd, (struct sockaddr *) &client->addr, sizeof(client->addr)) < 0) {
132159a5 113 log_err("fio: connect: %s\n", strerror(errno));
cdf54d85 114 log_err("fio: failed to connect to %s\n", client->hostname);
132159a5
JA
115 return 1;
116 }
117
b66570dc 118 client->fd = fd;
132159a5
JA
119 return 0;
120}
121
cc0df00a
JA
122void fio_clients_terminate(void)
123{
124 struct flist_head *entry;
125 struct fio_client *client;
126
127 flist_for_each(entry, &client_list) {
128 client = flist_entry(entry, struct fio_client, list);
129
130 fio_net_send_simple_cmd(client->fd, FIO_NET_CMD_QUIT, 0);
131 }
132}
133
/*
 * Signal handler installed by client_signal_handler(): asks all clients
 * to quit. The signal number itself is not looked at.
 */
static void sig_int(int sig)
{
	(void) sig;

	fio_clients_terminate();
}
138
139static void client_signal_handler(void)
140{
141 struct sigaction act;
142
143 memset(&act, 0, sizeof(act));
144 act.sa_handler = sig_int;
145 act.sa_flags = SA_RESTART;
146 sigaction(SIGINT, &act, NULL);
147
148 memset(&act, 0, sizeof(act));
149 act.sa_handler = sig_int;
150 act.sa_flags = SA_RESTART;
151 sigaction(SIGTERM, &act, NULL);
152}
153
a37f69b7
JA
154int fio_clients_connect(void)
155{
156 struct fio_client *client;
157 struct flist_head *entry, *tmp;
158 int ret;
159
cc0df00a
JA
160 client_signal_handler();
161
a37f69b7
JA
162 flist_for_each_safe(entry, tmp, &client_list) {
163 client = flist_entry(entry, struct fio_client, list);
164
165 ret = fio_client_connect(client);
166 if (ret)
167 remove_client(client);
168 }
169
170 return !nr_clients;
171}
172
b66570dc 173static int send_file_buf(struct fio_client *client, char *buf, off_t size)
132159a5 174{
b66570dc 175 return fio_net_send_cmd(client->fd, FIO_NET_CMD_JOB, buf, size);
132159a5
JA
176}
177
178/*
179 * Send file contents to server backend. We could use sendfile(), but to remain
180 * more portable lets just read/write the darn thing.
181 */
a37f69b7 182static int fio_client_send_ini(struct fio_client *client, const char *filename)
132159a5
JA
183{
184 struct stat sb;
185 char *p, *buf;
186 off_t len;
187 int fd, ret;
188
46c48f1f
JA
189 dprint(FD_NET, "send ini %s to %s\n", filename, client->hostname);
190
132159a5
JA
191 fd = open(filename, O_RDONLY);
192 if (fd < 0) {
193 log_err("fio: job file open: %s\n", strerror(errno));
194 return 1;
195 }
196
197 if (fstat(fd, &sb) < 0) {
198 log_err("fio: job file stat: %s\n", strerror(errno));
199 return 1;
200 }
201
202 buf = malloc(sb.st_size);
203
204 len = sb.st_size;
205 p = buf;
206 do {
207 ret = read(fd, p, len);
208 if (ret > 0) {
209 len -= ret;
210 if (!len)
211 break;
212 p += ret;
213 continue;
214 } else if (!ret)
215 break;
216 else if (errno == EAGAIN || errno == EINTR)
217 continue;
218 } while (1);
219
b66570dc 220 ret = send_file_buf(client, buf, sb.st_size);
132159a5
JA
221 free(buf);
222 return ret;
223}
37db14fe 224
a37f69b7
JA
225int fio_clients_send_ini(const char *filename)
226{
227 struct fio_client *client;
228 struct flist_head *entry, *tmp;
229
230 flist_for_each_safe(entry, tmp, &client_list) {
231 client = flist_entry(entry, struct fio_client, list);
232
233 if (fio_client_send_ini(client, filename))
234 remove_client(client);
235 }
236
237 return !nr_clients;
238}
239
a64e88da
JA
240static void convert_io_stat(struct io_stat *dst, struct io_stat *src)
241{
242 dst->max_val = le64_to_cpu(src->max_val);
243 dst->min_val = le64_to_cpu(src->min_val);
244 dst->samples = le64_to_cpu(src->samples);
245 /* FIXME */
ddcc0b69
JA
246 dst->mean = __le64_to_cpu(src->mean);
247 dst->S = __le64_to_cpu(src->S);
a64e88da
JA
248}
249
250static void convert_ts(struct thread_stat *dst, struct thread_stat *src)
251{
252 int i, j;
253
254 dst->error = le32_to_cpu(src->error);
255 dst->groupid = le32_to_cpu(src->groupid);
256 dst->pid = le32_to_cpu(src->pid);
257 dst->members = le32_to_cpu(src->members);
258
259 for (i = 0; i < 2; i++) {
260 convert_io_stat(&dst->clat_stat[i], &src->clat_stat[i]);
261 convert_io_stat(&dst->slat_stat[i], &src->slat_stat[i]);
262 convert_io_stat(&dst->lat_stat[i], &src->lat_stat[i]);
263 convert_io_stat(&dst->bw_stat[i], &src->bw_stat[i]);
264 }
265
266 dst->usr_time = le64_to_cpu(src->usr_time);
267 dst->sys_time = le64_to_cpu(src->sys_time);
268 dst->ctx = le64_to_cpu(src->ctx);
269 dst->minf = le64_to_cpu(src->minf);
270 dst->majf = le64_to_cpu(src->majf);
271 dst->clat_percentiles = le64_to_cpu(src->clat_percentiles);
272 dst->percentile_list = NULL;
273
274 for (i = 0; i < FIO_IO_U_MAP_NR; i++) {
275 dst->io_u_map[i] = le32_to_cpu(src->io_u_map[i]);
276 dst->io_u_submit[i] = le32_to_cpu(src->io_u_submit[i]);
277 dst->io_u_complete[i] = le32_to_cpu(src->io_u_complete[i]);
278 }
279
280 for (i = 0; i < FIO_IO_U_LAT_U_NR; i++) {
281 dst->io_u_lat_u[i] = le32_to_cpu(src->io_u_lat_u[i]);
282 dst->io_u_lat_m[i] = le32_to_cpu(src->io_u_lat_m[i]);
283 }
284
285 for (i = 0; i < 2; i++)
286 for (j = 0; j < FIO_IO_U_PLAT_NR; j++)
287 dst->io_u_plat[i][j] = le32_to_cpu(src->io_u_plat[i][j]);
288
289 for (i = 0; i < 3; i++) {
290 dst->total_io_u[i] = le64_to_cpu(src->total_io_u[i]);
93eee04a 291 dst->short_io_u[i] = le64_to_cpu(src->short_io_u[i]);
a64e88da
JA
292 }
293
294 dst->total_submit = le64_to_cpu(src->total_submit);
295 dst->total_complete = le64_to_cpu(src->total_complete);
296
297 for (i = 0; i < 2; i++) {
298 dst->io_bytes[i] = le64_to_cpu(src->io_bytes[i]);
299 dst->runtime[i] = le64_to_cpu(src->runtime[i]);
300 }
301
302 dst->total_run_time = le64_to_cpu(src->total_run_time);
303 dst->continue_on_error = le16_to_cpu(src->continue_on_error);
304 dst->total_err_count = le64_to_cpu(src->total_err_count);
ddcc0b69
JA
305 dst->first_error = le32_to_cpu(src->first_error);
306 dst->kb_base = le32_to_cpu(src->kb_base);
a64e88da
JA
307}
308
309static void convert_gs(struct group_run_stats *dst, struct group_run_stats *src)
310{
311 int i;
312
313 for (i = 0; i < 2; i++) {
314 dst->max_run[i] = le64_to_cpu(src->max_run[i]);
315 dst->min_run[i] = le64_to_cpu(src->min_run[i]);
316 dst->max_bw[i] = le64_to_cpu(src->max_bw[i]);
317 dst->min_bw[i] = le64_to_cpu(src->min_bw[i]);
318 dst->io_kb[i] = le64_to_cpu(src->io_kb[i]);
319 dst->agg[i] = le64_to_cpu(src->agg[i]);
320 }
321
322 dst->kb_base = le32_to_cpu(src->kb_base);
323 dst->groupid = le32_to_cpu(src->groupid);
324}
325
326static void handle_ts(struct fio_net_cmd *cmd)
327{
328 struct cmd_ts_pdu *p = (struct cmd_ts_pdu *) cmd->payload;
329
330 convert_ts(&p->ts, &p->ts);
331 convert_gs(&p->rs, &p->rs);
332
333 show_thread_status(&p->ts, &p->rs);
334}
335
336static void handle_gs(struct fio_net_cmd *cmd)
337{
338 struct group_run_stats *gs = (struct group_run_stats *) cmd->payload;
339
340 convert_gs(gs, gs);
341 show_group_stats(gs);
342}
343
cf451d1e
JA
344static void handle_eta(struct fio_net_cmd *cmd)
345{
346 struct jobs_eta *je = (struct jobs_eta *) cmd->payload;
347 int i;
348
349 je->nr_running = le32_to_cpu(je->nr_running);
350 je->nr_ramp = le32_to_cpu(je->nr_ramp);
351 je->nr_pending = le32_to_cpu(je->nr_pending);
352 je->files_open = le32_to_cpu(je->files_open);
353 je->m_rate = le32_to_cpu(je->m_rate);
354 je->t_rate = le32_to_cpu(je->t_rate);
355 je->m_iops = le32_to_cpu(je->m_iops);
356 je->t_iops = le32_to_cpu(je->t_iops);
357
358 for (i = 0; i < 2; i++) {
359 je->rate[i] = le32_to_cpu(je->rate[i]);
360 je->iops[i] = le32_to_cpu(je->iops[i]);
361 }
362
363 je->elapsed_sec = le32_to_cpu(je->nr_running);
364 je->eta_sec = le64_to_cpu(je->eta_sec);
365
366 display_thread_status(je);
367}
368
b66570dc 369static int handle_client(struct fio_client *client)
37db14fe
JA
370{
371 struct fio_net_cmd *cmd;
a450e492 372 int done = 0;
37db14fe 373
a64e88da 374 while ((cmd = fio_net_recv_cmd(client->fd)) != NULL) {
46c48f1f
JA
375 dprint(FD_NET, "%s: got cmd op %d\n", client->hostname,
376 cmd->opcode);
377
a64e88da
JA
378 switch (cmd->opcode) {
379 case FIO_NET_CMD_ACK:
37db14fe 380 free(cmd);
a64e88da
JA
381 break;
382 case FIO_NET_CMD_QUIT:
b66570dc 383 remove_client(client);
437377e1 384 free(cmd);
a450e492 385 done = 1;
437377e1 386 break;
a64e88da
JA
387 case FIO_NET_CMD_TEXT:
388 fwrite(cmd->payload, cmd->pdu_len, 1, stdout);
389 fflush(stdout);
37db14fe 390 free(cmd);
a64e88da
JA
391 break;
392 case FIO_NET_CMD_TS:
393 handle_ts(cmd);
394 free(cmd);
395 break;
396 case FIO_NET_CMD_GS:
397 handle_gs(cmd);
398 free(cmd);
399 break;
cf451d1e
JA
400 case FIO_NET_CMD_ETA:
401 handle_eta(cmd);
402 free(cmd);
403 break;
a64e88da
JA
404 default:
405 log_err("fio: unknown client op: %d\n", cmd->opcode);
406 free(cmd);
407 break;
37db14fe 408 }
a450e492
JA
409
410 if (done)
411 break;
37db14fe
JA
412 }
413
414 return 0;
415}
b66570dc
JA
416
417int fio_handle_clients(void)
418{
419 struct fio_client *client;
420 struct flist_head *entry;
421 struct pollfd *pfds;
82a4be1b 422 int i, ret = 0;
b66570dc
JA
423
424 pfds = malloc(nr_clients * sizeof(struct pollfd));
425
82a4be1b
JA
426 while (!exit_backend && nr_clients) {
427 i = 0;
428 flist_for_each(entry, &client_list) {
429 client = flist_entry(entry, struct fio_client, list);
b66570dc 430
82a4be1b
JA
431 pfds[i].fd = client->fd;
432 pfds[i].events = POLLIN;
433 i++;
434 }
435
436 assert(i == nr_clients);
b66570dc 437
b66570dc
JA
438 ret = poll(pfds, nr_clients, 100);
439 if (ret < 0) {
440 if (errno == EINTR)
441 continue;
442 log_err("fio: poll clients: %s\n", strerror(errno));
443 break;
444 } else if (!ret)
445 continue;
446
447 for (i = 0; i < nr_clients; i++) {
448 if (!(pfds[i].revents & POLLIN))
449 continue;
450
451 client = find_client_by_fd(pfds[i].fd);
452 if (!client) {
453 log_err("fio: unknown client\n");
454 continue;
455 }
456 handle_client(client);
457 }
458 }
459
460 free(pfds);
b66570dc
JA
461 return 0;
462}