Make I/O priority option generic for non-Linux environment [1/2]
[fio.git] / os / os-linux.h
... / ...
CommitLineData
1#ifndef FIO_OS_LINUX_H
2#define FIO_OS_LINUX_H
3
4#define FIO_OS os_linux
5
6#include <sys/ioctl.h>
7#include <sys/uio.h>
8#include <sys/syscall.h>
9#include <sys/sysmacros.h>
10#include <sys/vfs.h>
11#include <sys/mman.h>
12#include <unistd.h>
13#include <fcntl.h>
14#include <errno.h>
15#include <sched.h>
16#include <linux/unistd.h>
17#include <linux/raw.h>
18#include <linux/major.h>
19#include <byteswap.h>
20
21#include "binject.h"
22#include "../file.h"
23
24#define FIO_HAVE_CPU_AFFINITY
25#define FIO_HAVE_DISK_UTIL
26#define FIO_HAVE_SGIO
27#define FIO_HAVE_IOPRIO
28#define FIO_HAVE_IOSCHED_SWITCH
29#define FIO_HAVE_ODIRECT
30#define FIO_HAVE_HUGETLB
31#define FIO_HAVE_RAWBIND
32#define FIO_HAVE_BLKTRACE
33#define FIO_HAVE_PSHARED_MUTEX
34#define FIO_HAVE_CL_SIZE
35#define FIO_HAVE_CGROUPS
36#define FIO_HAVE_FS_STAT
37#define FIO_HAVE_TRIM
38#define FIO_HAVE_BINJECT
39#define FIO_HAVE_GETTID
40#define FIO_USE_GENERIC_INIT_RANDOM_STATE
41#define FIO_HAVE_PWRITEV2
42
43#ifdef MAP_HUGETLB
44#define FIO_HAVE_MMAP_HUGE
45#endif
46
47#define OS_MAP_ANON MAP_ANONYMOUS
48
49typedef cpu_set_t os_cpu_mask_t;
50
51typedef struct drand48_data os_random_state_t;
52
53#ifdef CONFIG_3ARG_AFFINITY
54#define fio_setaffinity(pid, cpumask) \
55 sched_setaffinity((pid), sizeof(cpumask), &(cpumask))
56#define fio_getaffinity(pid, ptr) \
57 sched_getaffinity((pid), sizeof(cpu_set_t), (ptr))
58#elif defined(CONFIG_2ARG_AFFINITY)
59#define fio_setaffinity(pid, cpumask) \
60 sched_setaffinity((pid), &(cpumask))
61#define fio_getaffinity(pid, ptr) \
62 sched_getaffinity((pid), (ptr))
63#endif
64
65#define fio_cpu_clear(mask, cpu) (void) CPU_CLR((cpu), (mask))
66#define fio_cpu_set(mask, cpu) (void) CPU_SET((cpu), (mask))
67#define fio_cpu_isset(mask, cpu) CPU_ISSET((cpu), (mask))
68#define fio_cpu_count(mask) CPU_COUNT((mask))
69
70static inline int fio_cpuset_init(os_cpu_mask_t *mask)
71{
72 CPU_ZERO(mask);
73 return 0;
74}
75
76static inline int fio_cpuset_exit(os_cpu_mask_t *mask)
77{
78 return 0;
79}
80
81#define FIO_MAX_CPUS CPU_SETSIZE
82
/*
 * I/O priority classes. The numeric values are spelled out because they
 * are shifted into the priority word handed to the ioprio_set syscall.
 */
enum {
	IOPRIO_CLASS_NONE	= 0,
	IOPRIO_CLASS_RT		= 1,
	IOPRIO_CLASS_BE		= 2,
	IOPRIO_CLASS_IDLE	= 3,
};
89
/*
 * Selectors for the "which" argument of ioprio_set(). Numbering starts
 * at 1; the values are written out explicitly.
 */
enum {
	IOPRIO_WHO_PROCESS	= 1,
	IOPRIO_WHO_PGRP		= 2,
	IOPRIO_WHO_USER		= 3,
};
95
96#define IOPRIO_BITS 16
97#define IOPRIO_CLASS_SHIFT 13
98
99#define IOPRIO_MIN_PRIO 0 /* highest priority */
100#define IOPRIO_MAX_PRIO 7 /* lowest priority */
101
102#define IOPRIO_MIN_PRIO_CLASS 0
103#define IOPRIO_MAX_PRIO_CLASS 3
104
105static inline int ioprio_set(int which, int who, int ioprio_class, int ioprio)
106{
107 /*
108 * If no class is set, assume BE
109 */
110 if (!ioprio_class)
111 ioprio_class = IOPRIO_CLASS_BE;
112
113 ioprio |= ioprio_class << IOPRIO_CLASS_SHIFT;
114 return syscall(__NR_ioprio_set, which, who, ioprio);
115}
116
/*
 * Return the id of the calling thread via the raw gettid syscall.
 *
 * NOTE(review): glibc 2.30 and later declare their own gettid() when
 * _GNU_SOURCE is defined, which would clash with this static
 * definition - confirm how the build guards against that.
 */
static inline int gettid(void)
{
	const long tid = syscall(__NR_gettid);

	return (int) tid;
}
121
122#define SPLICE_DEF_SIZE (64*1024)
123
124#ifndef BLKGETSIZE64
125#define BLKGETSIZE64 _IOR(0x12,114,size_t)
126#endif
127
128#ifndef BLKFLSBUF
129#define BLKFLSBUF _IO(0x12,97)
130#endif
131
132#ifndef BLKDISCARD
133#define BLKDISCARD _IO(0x12,119)
134#endif
135
136static inline int blockdev_invalidate_cache(struct fio_file *f)
137{
138 return ioctl(f->fd, BLKFLSBUF);
139}
140
141static inline int blockdev_size(struct fio_file *f, unsigned long long *bytes)
142{
143 if (!ioctl(f->fd, BLKGETSIZE64, bytes))
144 return 0;
145
146 return errno;
147}
148
/*
 * Physical memory in bytes: page size times the number of physical
 * pages, both taken from sysconf(). Returns 0 if either query fails.
 */
static inline unsigned long long os_phys_mem(void)
{
	const long page_bytes = sysconf(_SC_PAGESIZE);
	const long page_count = sysconf(_SC_PHYS_PAGES);

	if (page_bytes == -1 || page_count == -1)
		return 0;

	/* Widen both factors first so the product is computed in 64 bits. */
	return (unsigned long long) page_count *
		(unsigned long long) page_bytes;
}
160
161static inline void os_random_seed(unsigned long seed, os_random_state_t *rs)
162{
163 srand48_r(seed, rs);
164}
165
166static inline long os_random_long(os_random_state_t *rs)
167{
168 long val;
169
170 lrand48_r(rs, &val);
171 return val;
172}
173
174static inline int fio_lookup_raw(dev_t dev, int *majdev, int *mindev)
175{
176 struct raw_config_request rq;
177 int fd;
178
179 if (major(dev) != RAW_MAJOR)
180 return 1;
181
182 /*
183 * we should be able to find /dev/rawctl or /dev/raw/rawctl
184 */
185 fd = open("/dev/rawctl", O_RDONLY);
186 if (fd < 0) {
187 fd = open("/dev/raw/rawctl", O_RDONLY);
188 if (fd < 0)
189 return 1;
190 }
191
192 rq.raw_minor = minor(dev);
193 if (ioctl(fd, RAW_GETBIND, &rq) < 0) {
194 close(fd);
195 return 1;
196 }
197
198 close(fd);
199 *majdev = rq.block_major;
200 *mindev = rq.block_minor;
201 return 0;
202}
203
204#ifdef O_NOATIME
205#define FIO_O_NOATIME O_NOATIME
206#else
207#define FIO_O_NOATIME 0
208#endif
209
210#ifdef O_ATOMIC
211#define OS_O_ATOMIC O_ATOMIC
212#else
213#define OS_O_ATOMIC 040000000
214#endif
215
216#ifdef MADV_REMOVE
217#define FIO_MADV_FREE MADV_REMOVE
218#endif
219
/*
 * Byte-swap helpers.
 *
 * Compiler builtins are not preprocessor macros, so testing them with
 * defined() is always false. Probe for them with __has_builtin where
 * the compiler offers it, and fall back to the <byteswap.h> macros
 * for anything that was not picked up that way.
 */
#ifdef __has_builtin
#if __has_builtin(__builtin_bswap16)
#define fio_swap16(x)	__builtin_bswap16(x)
#endif
#if __has_builtin(__builtin_bswap32)
#define fio_swap32(x)	__builtin_bswap32(x)
#endif
#if __has_builtin(__builtin_bswap64)
#define fio_swap64(x)	__builtin_bswap64(x)
#endif
#endif

#ifndef fio_swap16
#define fio_swap16(x)	__bswap_16(x)
#endif
#ifndef fio_swap32
#define fio_swap32(x)	__bswap_32(x)
#endif
#ifndef fio_swap64
#define fio_swap64(x)	__bswap_64(x)
#endif
235
#define CACHE_LINE_FILE	\
	"/sys/devices/system/cpu/cpu0/cache/index0/coherency_line_size"

/*
 * Read the cache line size from CACHE_LINE_FILE.
 *
 * Returns the number parsed from the file, or -1 if the file cannot be
 * opened or nothing could be read from it.
 */
static inline int arch_cache_line_size(void)
{
	char size[32];
	int fd, ret;

	fd = open(CACHE_LINE_FILE, O_RDONLY);
	if (fd < 0)
		return -1;

	/*
	 * read() does not NUL-terminate, so keep one byte in reserve for
	 * the terminator that atoi() needs.
	 */
	ret = read(fd, size, sizeof(size) - 1);

	close(fd);

	if (ret <= 0)
		return -1;

	size[ret] = '\0';
	return atoi(size);
}
257
/*
 * Free space, in bytes, of the filesystem holding @path: the block
 * size multiplied by the free block count reported by statfs().
 * Returns -1ULL if statfs() fails.
 */
static inline unsigned long long get_fs_free_size(const char *path)
{
	struct statfs fs;

	if (statfs(path, &fs) < 0)
		return -1ULL;

	return (unsigned long long) fs.f_bsize *
		(unsigned long long) fs.f_bfree;
}
270
/*
 * Discard @len bytes starting at @start on @fd with the BLKDISCARD
 * ioctl. Returns 0 on success, otherwise the errno left by ioctl().
 */
static inline int os_trim(int fd, unsigned long long start,
			  unsigned long long len)
{
	/* BLKDISCARD takes a { start, length } pair of 64-bit values. */
	uint64_t range[2] = { start, len };

	if (ioctl(fd, BLKDISCARD, range) != 0)
		return errno;

	return 0;
}
284
#ifdef CONFIG_SCHED_IDLE
/*
 * Move the calling thread to the SCHED_IDLE policy with priority 0.
 * Returns the sched_setscheduler() result.
 */
static inline int fio_set_sched_idle(void)
{
	struct sched_param idle_param = { .sched_priority = 0, };
	const int self = gettid();

	return sched_setscheduler(self, SCHED_IDLE, &idle_param);
}
#endif
292
293#ifndef POSIX_FADV_STREAMID
294#define POSIX_FADV_STREAMID 8
295#endif
296
297#define FIO_HAVE_STREAMID
298
299#ifndef RWF_HIPRI
300#define RWF_HIPRI 0x00000001
301#endif
302#ifndef RWF_DSYNC
303#define RWF_DSYNC 0x00000002
304#endif
305#ifndef RWF_SYNC
306#define RWF_SYNC 0x00000004
307#endif
308
309#ifndef CONFIG_PWRITEV2
310#ifdef __NR_preadv2
/*
 * Split a file offset into the low/high "unsigned long" pair that the
 * preadv2/pwritev2 syscalls take.
 *
 * The kernel rebuilds the offset as (pos_h << bits-per-long) | pos_l.
 * With a 64-bit long, pos_l must therefore carry the whole offset:
 * masking it to 32 bits would truncate offsets of 4 GiB and above,
 * because the bits in pos_h are shifted out entirely. With a 32-bit
 * long the offset is split into its two 32-bit halves.
 */
static inline void make_pos_h_l(unsigned long *pos_h, unsigned long *pos_l,
				off_t offset)
{
	const uint64_t pos = (uint64_t) offset;
	/* Half the width of a long, assuming 8-bit bytes. */
	const unsigned int half_long_bits = sizeof(unsigned long) * 4;

	*pos_l = (unsigned long) pos;
	/* Two half-width shifts avoid an undefined full-width shift. */
	*pos_h = (unsigned long) ((pos >> half_long_bits) >> half_long_bits);
}
/*
 * preadv2() wrapper for C libraries that do not provide one: split the
 * offset with make_pos_h_l() and invoke the raw syscall.
 */
static inline ssize_t preadv2(int fd, const struct iovec *iov, int iovcnt,
			      off_t offset, unsigned int flags)
{
	unsigned long lo, hi;

	make_pos_h_l(&hi, &lo, offset);

	return syscall(__NR_preadv2, fd, iov, iovcnt, lo, hi, flags);
}
/*
 * pwritev2() wrapper for C libraries that do not provide one: split
 * the offset with make_pos_h_l() and invoke the raw syscall.
 */
static inline ssize_t pwritev2(int fd, const struct iovec *iov, int iovcnt,
			       off_t offset, unsigned int flags)
{
	unsigned long lo, hi;

	make_pos_h_l(&hi, &lo, offset);

	return syscall(__NR_pwritev2, fd, iov, iovcnt, lo, hi, flags);
}
334#else
/*
 * Stub used when no preadv2 syscall number is available: every call
 * fails with errno set to ENOSYS.
 */
static inline ssize_t preadv2(int fd, const struct iovec *iov, int iovcnt,
			      off_t offset, unsigned int flags)
{
	(void) fd;
	(void) iov;
	(void) iovcnt;
	(void) offset;
	(void) flags;

	errno = ENOSYS;
	return -1;
}
/*
 * Stub used when no pwritev2 syscall number is available: every call
 * fails with errno set to ENOSYS.
 */
static inline ssize_t pwritev2(int fd, const struct iovec *iov, int iovcnt,
			       off_t offset, unsigned int flags)
{
	(void) fd;
	(void) iov;
	(void) iovcnt;
	(void) offset;
	(void) flags;

	errno = ENOSYS;
	return -1;
}
347#endif /* __NR_preadv2 */
348#endif /* CONFIG_PWRITEV2 */
349
350#endif