Commit | Line | Data |
---|---|---|
8a4c41dd | 1 | #include <inttypes.h> |
9f8f2064 JA |
2 | #include <stdio.h> |
3 | #include <string.h> | |
9f8f2064 JA |
4 | #include <sys/types.h> |
5 | #include <sys/stat.h> | |
036a1599 | 6 | #include <sys/sysmacros.h> |
9f8f2064 JA |
7 | #include <dirent.h> |
8 | #include <libgen.h> | |
4f37732a BVA |
9 | #ifdef CONFIG_VALGRIND_DEV |
10 | #include <valgrind/drd.h> | |
11 | #else | |
12 | #define DRD_IGNORE_VAR(x) do { } while (0) | |
13 | #endif | |
9f8f2064 JA |
14 | |
15 | #include "fio.h" | |
c97bd0fa | 16 | #include "smalloc.h" |
7c9b1bce | 17 | #include "diskutil.h" |
a39fb9ea | 18 | #include "helper_thread.h" |
9f8f2064 JA |
19 | |
/*
 * Device numbers of the most recent sysfs lookup attempted by
 * init_per_file_disk_util(); compared against before walking sysfs again.
 */
static int last_majdev;
static int last_mindev;

/* disk_util entry returned when the cached device numbers match */
static struct disk_util *last_du;

/* Held around the disk_list walks and updates done in this file */
static struct fio_sem *disk_util_sem;

static struct disk_util *__init_per_file_disk_util(struct thread_data *td,
						   int majdev, int mindev,
						   char *path);
27 | ||
c97bd0fa JA |
28 | static void disk_util_free(struct disk_util *du) |
29 | { | |
30 | if (du == last_du) | |
31 | last_du = NULL; | |
32 | ||
b8d541d5 JA |
33 | while (!flist_empty(&du->slaves)) { |
34 | struct disk_util *slave; | |
35 | ||
9342d5f8 | 36 | slave = flist_first_entry(&du->slaves, struct disk_util, slavelist); |
b8d541d5 JA |
37 | flist_del(&slave->slavelist); |
38 | slave->users--; | |
39 | } | |
93bcfd20 | 40 | |
971caeb1 | 41 | fio_sem_remove(du->lock); |
2a20eebc | 42 | free(du->sysfs_root); |
c97bd0fa JA |
43 | sfree(du); |
44 | } | |
45 | ||
9f8f2064 JA |
46 | static int get_io_ticks(struct disk_util *du, struct disk_util_stat *dus) |
47 | { | |
48 | unsigned in_flight; | |
d09a64a0 | 49 | unsigned long long sectors[2]; |
9f8f2064 JA |
50 | char line[256]; |
51 | FILE *f; | |
52 | char *p; | |
5ec10eaa | 53 | int ret; |
9f8f2064 | 54 | |
cd991b9e JA |
55 | dprint(FD_DISKUTIL, "open stat file: %s\n", du->path); |
56 | ||
9f8f2064 JA |
57 | f = fopen(du->path, "r"); |
58 | if (!f) | |
59 | return 1; | |
60 | ||
61 | p = fgets(line, sizeof(line), f); | |
62 | if (!p) { | |
63 | fclose(f); | |
64 | return 1; | |
65 | } | |
66 | ||
cd991b9e JA |
67 | dprint(FD_DISKUTIL, "%s: %s", du->path, p); |
68 | ||
8a4c41dd BVA |
69 | ret = sscanf(p, "%"SCNu64" %"SCNu64" %llu %"SCNu64" " |
70 | "%"SCNu64" %"SCNu64" %llu %"SCNu64" " | |
71 | "%u %"SCNu64" %"SCNu64"\n", | |
72 | &dus->s.ios[0], &dus->s.merges[0], §ors[0], | |
73 | &dus->s.ticks[0], | |
74 | &dus->s.ios[1], &dus->s.merges[1], §ors[1], | |
75 | &dus->s.ticks[1], | |
76 | &in_flight, &dus->s.io_ticks, &dus->s.time_in_queue); | |
9f8f2064 | 77 | fclose(f); |
cd991b9e | 78 | dprint(FD_DISKUTIL, "%s: stat read ok? %d\n", du->path, ret == 1); |
a3b4cf7d JA |
79 | dus->s.sectors[0] = sectors[0]; |
80 | dus->s.sectors[1] = sectors[1]; | |
cd991b9e | 81 | return ret != 11; |
9f8f2064 JA |
82 | } |
83 | ||
84 | static void update_io_tick_disk(struct disk_util *du) | |
85 | { | |
86 | struct disk_util_stat __dus, *dus, *ldus; | |
8b6a404c | 87 | struct timespec t; |
9f8f2064 | 88 | |
c97bd0fa JA |
89 | if (!du->users) |
90 | return; | |
90b97ac3 JA |
91 | if (get_io_ticks(du, &__dus)) |
92 | return; | |
9f8f2064 JA |
93 | |
94 | dus = &du->dus; | |
95 | ldus = &du->last_dus; | |
96 | ||
a3b4cf7d JA |
97 | dus->s.sectors[0] += (__dus.s.sectors[0] - ldus->s.sectors[0]); |
98 | dus->s.sectors[1] += (__dus.s.sectors[1] - ldus->s.sectors[1]); | |
99 | dus->s.ios[0] += (__dus.s.ios[0] - ldus->s.ios[0]); | |
100 | dus->s.ios[1] += (__dus.s.ios[1] - ldus->s.ios[1]); | |
101 | dus->s.merges[0] += (__dus.s.merges[0] - ldus->s.merges[0]); | |
102 | dus->s.merges[1] += (__dus.s.merges[1] - ldus->s.merges[1]); | |
103 | dus->s.ticks[0] += (__dus.s.ticks[0] - ldus->s.ticks[0]); | |
104 | dus->s.ticks[1] += (__dus.s.ticks[1] - ldus->s.ticks[1]); | |
105 | dus->s.io_ticks += (__dus.s.io_ticks - ldus->s.io_ticks); | |
106 | dus->s.time_in_queue += (__dus.s.time_in_queue - ldus->s.time_in_queue); | |
9f8f2064 JA |
107 | |
108 | fio_gettime(&t, NULL); | |
a3b4cf7d | 109 | dus->s.msec += mtime_since(&du->time, &t); |
9f8f2064 | 110 | memcpy(&du->time, &t, sizeof(t)); |
a3b4cf7d | 111 | memcpy(&ldus->s, &__dus.s, sizeof(__dus.s)); |
9f8f2064 JA |
112 | } |
113 | ||
9ec7779f | 114 | int update_io_ticks(void) |
9f8f2064 | 115 | { |
01743ee1 | 116 | struct flist_head *entry; |
9f8f2064 | 117 | struct disk_util *du; |
9ec7779f | 118 | int ret = 0; |
9f8f2064 | 119 | |
cd991b9e JA |
120 | dprint(FD_DISKUTIL, "update io ticks\n"); |
121 | ||
971caeb1 | 122 | fio_sem_down(disk_util_sem); |
9ec7779f | 123 | |
a47591e4 | 124 | if (!helper_should_exit()) { |
9ec7779f JA |
125 | flist_for_each(entry, &disk_list) { |
126 | du = flist_entry(entry, struct disk_util, list); | |
127 | update_io_tick_disk(du); | |
128 | } | |
129 | } else | |
130 | ret = 1; | |
131 | ||
971caeb1 | 132 | fio_sem_up(disk_util_sem); |
9ec7779f | 133 | return ret; |
9f8f2064 JA |
134 | } |
135 | ||
e11c410c | 136 | static struct disk_util *disk_util_exists(int major, int minor) |
9f8f2064 | 137 | { |
01743ee1 | 138 | struct flist_head *entry; |
9f8f2064 JA |
139 | struct disk_util *du; |
140 | ||
971caeb1 | 141 | fio_sem_down(disk_util_sem); |
9ec7779f | 142 | |
01743ee1 JA |
143 | flist_for_each(entry, &disk_list) { |
144 | du = flist_entry(entry, struct disk_util, list); | |
9f8f2064 | 145 | |
9ec7779f | 146 | if (major == du->major && minor == du->minor) { |
971caeb1 | 147 | fio_sem_up(disk_util_sem); |
e11c410c | 148 | return du; |
9ec7779f | 149 | } |
9f8f2064 JA |
150 | } |
151 | ||
971caeb1 | 152 | fio_sem_up(disk_util_sem); |
e11c410c | 153 | return NULL; |
9f8f2064 JA |
154 | } |
155 | ||
67423013 ST |
156 | static int get_device_numbers(char *file_name, int *maj, int *min) |
157 | { | |
158 | struct stat st; | |
159 | int majdev, mindev; | |
160 | char tempname[PATH_MAX], *p; | |
161 | ||
162 | if (!lstat(file_name, &st)) { | |
163 | if (S_ISBLK(st.st_mode)) { | |
164 | majdev = major(st.st_rdev); | |
165 | mindev = minor(st.st_rdev); | |
38297555 ES |
166 | } else if (S_ISCHR(st.st_mode) || |
167 | S_ISFIFO(st.st_mode)) { | |
67423013 | 168 | return -1; |
38297555 | 169 | } else { |
67423013 ST |
170 | majdev = major(st.st_dev); |
171 | mindev = minor(st.st_dev); | |
172 | } | |
173 | } else { | |
174 | /* | |
175 | * must be a file, open "." in that path | |
176 | */ | |
59f94d26 | 177 | snprintf(tempname, FIO_ARRAY_SIZE(tempname), "%s", file_name); |
67423013 ST |
178 | p = dirname(tempname); |
179 | if (stat(p, &st)) { | |
180 | perror("disk util stat"); | |
181 | return -1; | |
182 | } | |
183 | ||
184 | majdev = major(st.st_dev); | |
185 | mindev = minor(st.st_dev); | |
186 | } | |
187 | ||
188 | *min = mindev; | |
189 | *maj = majdev; | |
190 | ||
191 | return 0; | |
192 | } | |
193 | ||
/*
 * Parse a "major:minor" pair from the first line of the file at path.
 *
 * Returns 0 and stores the two numbers in *maj and *min on success.
 * Returns 1 when the file cannot be opened (perror() is called), is
 * empty, or its first line does not start with two ':'-separated
 * integers; in that case *maj and *min are left unmodified.
 */
static int read_block_dev_entry(char *path, int *maj, int *min)
{
	char line[256], *p;
	int parsed_maj, parsed_min;
	FILE *f;

	f = fopen(path, "r");
	if (!f) {
		perror("open path");
		return 1;
	}

	p = fgets(line, sizeof(line), f);
	fclose(f);

	if (!p)
		return 1;

	/* %d matches the int destinations; only publish a complete pair */
	if (sscanf(p, "%d:%d", &parsed_maj, &parsed_min) != 2)
		return 1;

	*maj = parsed_maj;
	*min = parsed_min;
	return 0;
}
216 | ||
67423013 | 217 | static void find_add_disk_slaves(struct thread_data *td, char *path, |
2db4ecca | 218 | struct disk_util *masterdu) |
67423013 ST |
219 | { |
220 | DIR *dirhandle = NULL; | |
221 | struct dirent *dirent = NULL; | |
222 | char slavesdir[PATH_MAX], temppath[PATH_MAX], slavepath[PATH_MAX]; | |
223 | struct disk_util *slavedu = NULL; | |
224 | int majdev, mindev; | |
225 | ssize_t linklen; | |
226 | ||
2db4ecca | 227 | sprintf(slavesdir, "%s/%s", path, "slaves"); |
67423013 ST |
228 | dirhandle = opendir(slavesdir); |
229 | if (!dirhandle) | |
230 | return; | |
231 | ||
232 | while ((dirent = readdir(dirhandle)) != NULL) { | |
2db4ecca JA |
233 | if (!strcmp(dirent->d_name, ".") || |
234 | !strcmp(dirent->d_name, "..")) | |
67423013 ST |
235 | continue; |
236 | ||
b4d2bc70 BVA |
237 | nowarn_snprintf(temppath, sizeof(temppath), "%s/%s", slavesdir, |
238 | dirent->d_name); | |
67423013 ST |
239 | /* Can we always assume that the slaves device entries |
240 | * are links to the real directories for the slave | |
241 | * devices? | |
242 | */ | |
976406b8 | 243 | linklen = readlink(temppath, slavepath, PATH_MAX - 1); |
81286ecd | 244 | if (linklen < 0) { |
67423013 | 245 | perror("readlink() for slave device."); |
f0cc675f | 246 | closedir(dirhandle); |
67423013 ST |
247 | return; |
248 | } | |
2db4ecca | 249 | slavepath[linklen] = '\0'; |
67423013 | 250 | |
b4d2bc70 BVA |
251 | nowarn_snprintf(temppath, sizeof(temppath), "%s/%s/dev", |
252 | slavesdir, slavepath); | |
75d5519d | 253 | if (access(temppath, F_OK) != 0) |
b4d2bc70 BVA |
254 | nowarn_snprintf(temppath, sizeof(temppath), |
255 | "%s/%s/device/dev", slavesdir, | |
256 | slavepath); | |
67423013 | 257 | if (read_block_dev_entry(temppath, &majdev, &mindev)) { |
81286ecd | 258 | perror("Error getting slave device numbers"); |
f0cc675f | 259 | closedir(dirhandle); |
67423013 ST |
260 | return; |
261 | } | |
262 | ||
b06de82e AB |
263 | /* |
264 | * See if this maj,min already exists | |
265 | */ | |
266 | slavedu = disk_util_exists(majdev, mindev); | |
267 | if (slavedu) | |
268 | continue; | |
269 | ||
b4d2bc70 BVA |
270 | nowarn_snprintf(temppath, sizeof(temppath), "%s/%s", slavesdir, |
271 | slavepath); | |
67423013 ST |
272 | __init_per_file_disk_util(td, majdev, mindev, temppath); |
273 | slavedu = disk_util_exists(majdev, mindev); | |
274 | ||
275 | /* Should probably use an assert here. slavedu should | |
276 | * always be present at this point. */ | |
b8d541d5 JA |
277 | if (slavedu) { |
278 | slavedu->users++; | |
67423013 | 279 | flist_add_tail(&slavedu->slavelist, &masterdu->slaves); |
b8d541d5 | 280 | } |
67423013 ST |
281 | } |
282 | ||
283 | closedir(dirhandle); | |
67423013 ST |
284 | } |
285 | ||
b8fefc2b | 286 | static struct disk_util *disk_util_add(struct thread_data *td, int majdev, |
c97bd0fa | 287 | int mindev, char *path) |
9f8f2064 JA |
288 | { |
289 | struct disk_util *du, *__du; | |
01743ee1 | 290 | struct flist_head *entry; |
4b919f77 | 291 | int l; |
9f8f2064 | 292 | |
cd991b9e JA |
293 | dprint(FD_DISKUTIL, "add maj/min %d/%d: %s\n", majdev, mindev, path); |
294 | ||
c97bd0fa | 295 | du = smalloc(sizeof(*du)); |
81b3c86f | 296 | if (!du) |
fba5c5ff | 297 | return NULL; |
fba5c5ff | 298 | |
4f37732a | 299 | DRD_IGNORE_VAR(du->users); |
9f8f2064 | 300 | memset(du, 0, sizeof(*du)); |
01743ee1 | 301 | INIT_FLIST_HEAD(&du->list); |
4b919f77 KR |
302 | l = snprintf(du->path, sizeof(du->path), "%s/stat", path); |
303 | if (l < 0 || l >= sizeof(du->path)) { | |
304 | log_err("constructed path \"%.100s[...]/stat\" larger than buffer (%zu bytes)\n", | |
305 | path, sizeof(du->path) - 1); | |
306 | sfree(du); | |
307 | return NULL; | |
308 | } | |
59f94d26 | 309 | snprintf((char *) du->dus.name, FIO_ARRAY_SIZE(du->dus.name), "%s", |
36833fb0 | 310 | basename(path)); |
2a20eebc | 311 | du->sysfs_root = strdup(path); |
9f8f2064 JA |
312 | du->major = majdev; |
313 | du->minor = mindev; | |
67423013 ST |
314 | INIT_FLIST_HEAD(&du->slavelist); |
315 | INIT_FLIST_HEAD(&du->slaves); | |
971caeb1 | 316 | du->lock = fio_sem_init(FIO_SEM_UNLOCKED); |
c97bd0fa | 317 | du->users = 0; |
9f8f2064 | 318 | |
971caeb1 | 319 | fio_sem_down(disk_util_sem); |
9ec7779f | 320 | |
01743ee1 JA |
321 | flist_for_each(entry, &disk_list) { |
322 | __du = flist_entry(entry, struct disk_util, list); | |
9f8f2064 | 323 | |
d09a64a0 | 324 | dprint(FD_DISKUTIL, "found %s in list\n", __du->dus.name); |
cd991b9e | 325 | |
d09a64a0 | 326 | if (!strcmp((char *) du->dus.name, (char *) __du->dus.name)) { |
c97bd0fa | 327 | disk_util_free(du); |
971caeb1 | 328 | fio_sem_up(disk_util_sem); |
c97bd0fa | 329 | return __du; |
9f8f2064 JA |
330 | } |
331 | } | |
332 | ||
d09a64a0 | 333 | dprint(FD_DISKUTIL, "add %s to list\n", du->dus.name); |
cd991b9e | 334 | |
9f8f2064 JA |
335 | fio_gettime(&du->time, NULL); |
336 | get_io_ticks(du, &du->last_dus); | |
337 | ||
01743ee1 | 338 | flist_add_tail(&du->list, &disk_list); |
971caeb1 | 339 | fio_sem_up(disk_util_sem); |
9ec7779f | 340 | |
67423013 | 341 | find_add_disk_slaves(td, path, du); |
c97bd0fa | 342 | return du; |
9f8f2064 JA |
343 | } |
344 | ||
/*
 * Compare the "major:minor" pair stored in the file at path against
 * majdev/mindev.
 *
 * Returns 0 when the file could be read and both numbers match, and 1
 * in every other case.
 */
static int check_dev_match(int majdev, int mindev, char *path)
{
	int file_maj, file_min;

	if (read_block_dev_entry(path, &file_maj, &file_min))
		return 1;

	return !(file_maj == majdev && file_min == mindev);
}
357 | ||
ac0be2ac | 358 | static int find_block_dir(int majdev, int mindev, char *path, int link_ok) |
9f8f2064 JA |
359 | { |
360 | struct dirent *dir; | |
361 | struct stat st; | |
362 | int found = 0; | |
363 | DIR *D; | |
364 | ||
365 | D = opendir(path); | |
366 | if (!D) | |
367 | return 0; | |
368 | ||
369 | while ((dir = readdir(D)) != NULL) { | |
5ccdfd74 | 370 | char full_path[257]; |
9f8f2064 JA |
371 | |
372 | if (!strcmp(dir->d_name, ".") || !strcmp(dir->d_name, "..")) | |
373 | continue; | |
374 | ||
22497370 | 375 | sprintf(full_path, "%s/%s", path, dir->d_name); |
9f8f2064 JA |
376 | |
377 | if (!strcmp(dir->d_name, "dev")) { | |
378 | if (!check_dev_match(majdev, mindev, full_path)) { | |
379 | found = 1; | |
380 | break; | |
381 | } | |
382 | } | |
383 | ||
ac0be2ac JA |
384 | if (link_ok) { |
385 | if (stat(full_path, &st) == -1) { | |
386 | perror("stat"); | |
387 | break; | |
388 | } | |
389 | } else { | |
390 | if (lstat(full_path, &st) == -1) { | |
391 | perror("stat"); | |
392 | break; | |
393 | } | |
9f8f2064 JA |
394 | } |
395 | ||
396 | if (!S_ISDIR(st.st_mode) || S_ISLNK(st.st_mode)) | |
397 | continue; | |
398 | ||
ac0be2ac | 399 | found = find_block_dir(majdev, mindev, full_path, 0); |
9f8f2064 JA |
400 | if (found) { |
401 | strcpy(path, full_path); | |
402 | break; | |
403 | } | |
404 | } | |
405 | ||
406 | closedir(D); | |
407 | return found; | |
408 | } | |
409 | ||
c97bd0fa JA |
410 | static struct disk_util *__init_per_file_disk_util(struct thread_data *td, |
411 | int majdev, int mindev, | |
412 | char *path) | |
9f8f2064 JA |
413 | { |
414 | struct stat st; | |
67423013 | 415 | char tmp[PATH_MAX]; |
9f8f2064 JA |
416 | char *p; |
417 | ||
67423013 ST |
418 | /* |
419 | * If there's a ../queue/ directory there, we are inside a partition. | |
420 | * Check if that is the case and jump back. For loop/md/dm etc we | |
421 | * are already in the right spot. | |
422 | */ | |
423 | sprintf(tmp, "%s/../queue", path); | |
424 | if (!stat(tmp, &st)) { | |
425 | p = dirname(path); | |
426 | sprintf(tmp, "%s/queue", p); | |
427 | if (stat(tmp, &st)) { | |
428 | log_err("unknown sysfs layout\n"); | |
c97bd0fa | 429 | return NULL; |
9f8f2064 | 430 | } |
59f94d26 | 431 | snprintf(tmp, FIO_ARRAY_SIZE(tmp), "%s", p); |
67423013 | 432 | sprintf(path, "%s", tmp); |
9f8f2064 JA |
433 | } |
434 | ||
c97bd0fa | 435 | return disk_util_add(td, majdev, mindev, path); |
67423013 ST |
436 | } |
437 | ||
c97bd0fa JA |
438 | static struct disk_util *init_per_file_disk_util(struct thread_data *td, |
439 | char *filename) | |
67423013 ST |
440 | { |
441 | ||
442 | char foo[PATH_MAX]; | |
443 | struct disk_util *du; | |
444 | int mindev, majdev; | |
445 | ||
c97bd0fa JA |
446 | if (get_device_numbers(filename, &majdev, &mindev)) |
447 | return NULL; | |
67423013 ST |
448 | |
449 | dprint(FD_DISKUTIL, "%s belongs to maj/min %d/%d\n", filename, majdev, | |
450 | mindev); | |
cd991b9e | 451 | |
e11c410c | 452 | du = disk_util_exists(majdev, mindev); |
bd4d9bdc | 453 | if (du) |
c97bd0fa | 454 | return du; |
9f8f2064 JA |
455 | |
456 | /* | |
457 | * for an fs without a device, we will repeatedly stat through | |
458 | * sysfs which can take oodles of time for thousands of files. so | |
459 | * cache the last lookup and compare with that before going through | |
460 | * everything again. | |
461 | */ | |
462 | if (mindev == last_mindev && majdev == last_majdev) | |
c97bd0fa | 463 | return last_du; |
9f8f2064 JA |
464 | |
465 | last_mindev = mindev; | |
466 | last_majdev = majdev; | |
5ec10eaa | 467 | |
9f8f2064 | 468 | sprintf(foo, "/sys/block"); |
ac0be2ac | 469 | if (!find_block_dir(majdev, mindev, foo, 1)) |
c97bd0fa | 470 | return NULL; |
9f8f2064 | 471 | |
c97bd0fa | 472 | return __init_per_file_disk_util(td, majdev, mindev, foo); |
67423013 | 473 | } |
9f8f2064 | 474 | |
c97bd0fa JA |
475 | static struct disk_util *__init_disk_util(struct thread_data *td, |
476 | struct fio_file *f) | |
67423013 ST |
477 | { |
478 | return init_per_file_disk_util(td, f->file_name); | |
9f8f2064 JA |
479 | } |
480 | ||
481 | void init_disk_util(struct thread_data *td) | |
482 | { | |
483 | struct fio_file *f; | |
484 | unsigned int i; | |
485 | ||
486 | if (!td->o.do_disk_util || | |
9b87f09b | 487 | td_ioengine_flagged(td, FIO_DISKLESSIO | FIO_NODISKUTIL)) |
9f8f2064 JA |
488 | return; |
489 | ||
490 | for_each_file(td, f, i) | |
c97bd0fa | 491 | f->du = __init_disk_util(td, f); |
9f8f2064 JA |
492 | } |
493 | ||
27357187 | 494 | void disk_util_prune_entries(void) |
d09a64a0 | 495 | { |
971caeb1 | 496 | fio_sem_down(disk_util_sem); |
9ec7779f | 497 | |
d09a64a0 | 498 | while (!flist_empty(&disk_list)) { |
27357187 JA |
499 | struct disk_util *du; |
500 | ||
9342d5f8 | 501 | du = flist_first_entry(&disk_list, struct disk_util, list); |
d09a64a0 JA |
502 | flist_del(&du->list); |
503 | disk_util_free(du); | |
504 | } | |
043b74b9 | 505 | |
d09a64a0 | 506 | last_majdev = last_mindev = -1; |
971caeb1 BVA |
507 | fio_sem_up(disk_util_sem); |
508 | fio_sem_remove(disk_util_sem); | |
d09a64a0 JA |
509 | } |
510 | ||
9ec7779f JA |
511 | void setup_disk_util(void) |
512 | { | |
971caeb1 | 513 | disk_util_sem = fio_sem_init(FIO_SEM_UNLOCKED); |
9f8f2064 | 514 | } |