1 /* This file contains functions which implement those POSIX and Linux functions
2 * that MinGW and Microsoft don't provide. The implementations contain just enough
3 * functionality to support fio.
7 #include <netinet/in.h>
15 #include <semaphore.h>
19 #include <sys/resource.h>
22 #include "../os-windows.h"
23 #include "../../lib/hweight.h"
25 extern unsigned long mtime_since_now(struct timeval *);
26 extern void fio_gettime(struct timeval *, void *);
28 /* These aren't defined in the MinGW headers */
29 HRESULT WINAPI StringCchCopyA(
34 HRESULT WINAPI StringCchPrintfA(
37 const char *pszFormat,
42 size_t numberOfElements,
46 int win_to_posix_error(DWORD winerr)
50 case ERROR_FILE_NOT_FOUND: return ENOENT;
51 case ERROR_PATH_NOT_FOUND: return ENOENT;
52 case ERROR_ACCESS_DENIED: return EACCES;
53 case ERROR_INVALID_HANDLE: return EBADF;
54 case ERROR_NOT_ENOUGH_MEMORY: return ENOMEM;
55 case ERROR_INVALID_DATA: return EINVAL;
56 case ERROR_OUTOFMEMORY: return ENOMEM;
57 case ERROR_INVALID_DRIVE: return ENODEV;
58 case ERROR_NOT_SAME_DEVICE: return EXDEV;
59 case ERROR_WRITE_PROTECT: return EROFS;
60 case ERROR_BAD_UNIT: return ENODEV;
61 case ERROR_SHARING_VIOLATION: return EACCES;
62 case ERROR_LOCK_VIOLATION: return EACCES;
63 case ERROR_SHARING_BUFFER_EXCEEDED: return ENOLCK;
64 case ERROR_HANDLE_DISK_FULL: return ENOSPC;
65 case ERROR_NOT_SUPPORTED: return ENOSYS;
66 case ERROR_FILE_EXISTS: return EEXIST;
67 case ERROR_CANNOT_MAKE: return EPERM;
68 case ERROR_INVALID_PARAMETER: return EINVAL;
69 case ERROR_NO_PROC_SLOTS: return EAGAIN;
70 case ERROR_BROKEN_PIPE: return EPIPE;
71 case ERROR_OPEN_FAILED: return EIO;
72 case ERROR_NO_MORE_SEARCH_HANDLES: return ENFILE;
73 case ERROR_CALL_NOT_IMPLEMENTED: return ENOSYS;
74 case ERROR_INVALID_NAME: return ENOENT;
75 case ERROR_WAIT_NO_CHILDREN: return ECHILD;
76 case ERROR_CHILD_NOT_COMPLETE: return EBUSY;
77 case ERROR_DIR_NOT_EMPTY: return ENOTEMPTY;
78 case ERROR_SIGNAL_REFUSED: return EIO;
79 case ERROR_BAD_PATHNAME: return ENOENT;
80 case ERROR_SIGNAL_PENDING: return EBUSY;
81 case ERROR_MAX_THRDS_REACHED: return EAGAIN;
82 case ERROR_BUSY: return EBUSY;
83 case ERROR_ALREADY_EXISTS: return EEXIST;
84 case ERROR_NO_SIGNAL_SENT: return EIO;
85 case ERROR_FILENAME_EXCED_RANGE: return EINVAL;
86 case ERROR_META_EXPANSION_TOO_LONG: return EINVAL;
87 case ERROR_INVALID_SIGNAL_NUMBER: return EINVAL;
88 case ERROR_THREAD_1_INACTIVE: return EINVAL;
89 case ERROR_BAD_PIPE: return EINVAL;
90 case ERROR_PIPE_BUSY: return EBUSY;
91 case ERROR_NO_DATA: return EPIPE;
92 case ERROR_MORE_DATA: return EAGAIN;
93 case ERROR_DIRECTORY: return ENOTDIR;
94 case ERROR_PIPE_CONNECTED: return EBUSY;
95 case ERROR_NO_TOKEN: return EINVAL;
96 case ERROR_PROCESS_ABORTED: return EFAULT;
97 case ERROR_BAD_DEVICE: return ENODEV;
98 case ERROR_BAD_USERNAME: return EINVAL;
99 case ERROR_OPEN_FILES: return EAGAIN;
100 case ERROR_ACTIVE_CONNECTIONS: return EAGAIN;
101 case ERROR_DEVICE_IN_USE: return EAGAIN;
102 case ERROR_INVALID_AT_INTERRUPT_TIME: return EINTR;
103 case ERROR_IO_DEVICE: return EIO;
104 case ERROR_NOT_OWNER: return EPERM;
105 case ERROR_END_OF_MEDIA: return ENOSPC;
106 case ERROR_EOM_OVERFLOW: return ENOSPC;
107 case ERROR_BEGINNING_OF_MEDIA: return ESPIPE;
108 case ERROR_SETMARK_DETECTED: return ESPIPE;
109 case ERROR_NO_DATA_DETECTED: return ENOSPC;
110 case ERROR_POSSIBLE_DEADLOCK: return EDEADLOCK;
111 case ERROR_CRC: return EIO;
112 case ERROR_NEGATIVE_SEEK: return EINVAL;
113 case ERROR_DISK_FULL: return ENOSPC;
114 case ERROR_NOACCESS: return EFAULT;
115 case ERROR_FILE_INVALID: return ENXIO;
121 int GetNumLogicalProcessors(void)
123 SYSTEM_LOGICAL_PROCESSOR_INFORMATION *processor_info = NULL;
125 DWORD num_processors = 0;
129 while (!GetLogicalProcessorInformation(processor_info, &len)) {
130 error = GetLastError();
131 if (error == ERROR_INSUFFICIENT_BUFFER)
132 processor_info = malloc(len);
134 log_err("Error: GetLogicalProcessorInformation failed: %d\n", error);
138 if (processor_info == NULL) {
139 log_err("Error: failed to allocate memory for GetLogicalProcessorInformation");
144 for (i = 0; i < len / sizeof(SYSTEM_LOGICAL_PROCESSOR_INFORMATION); i++)
146 if (processor_info[i].Relationship == RelationProcessorCore)
147 num_processors += hweight64(processor_info[i].ProcessorMask);
150 free(processor_info);
151 return num_processors;
154 long sysconf(int name)
159 MEMORYSTATUSEX status;
163 case _SC_NPROCESSORS_ONLN:
164 val = GetNumLogicalProcessors();
166 log_err("sysconf(_SC_NPROCESSORS_ONLN) failed\n");
171 GetSystemInfo(&sysInfo);
172 val = sysInfo.dwPageSize;
176 status.dwLength = sizeof(status);
177 val2 = sysconf(_SC_PAGESIZE);
178 if (GlobalMemoryStatusEx(&status) && val2 != -1)
179 val = status.ullTotalPhys / val2;
181 log_err("sysconf(_SC_PHYS_PAGES) failed\n");
184 log_err("sysconf(%d) is not implemented\n", name);
191 char *dl_error = NULL;
193 int dlclose(void *handle)
195 return !FreeLibrary((HMODULE)handle);
198 void *dlopen(const char *file, int mode)
202 hMod = LoadLibrary(file);
203 if (hMod == INVALID_HANDLE_VALUE)
204 dl_error = (char*)"LoadLibrary failed";
211 void *dlsym(void *handle, const char *name)
215 fnPtr = GetProcAddress((HMODULE)handle, name);
217 dl_error = (char*)"GetProcAddress failed";
229 int gettimeofday(struct timeval *restrict tp, void *restrict tzp)
232 uint64_t unix_time, windows_time;
233 const uint64_t MILLISECONDS_BETWEEN_1601_AND_1970 = 11644473600000;
235 /* Ignore the timezone parameter */
239 * Windows time is stored as the number 100 ns intervals since January 1 1601.
240 * Conversion details from http://www.informit.com/articles/article.aspx?p=102236&seqNum=3
241 * Its precision is 100 ns but accuracy is only one clock tick, or normally around 15 ms.
243 GetSystemTimeAsFileTime(&fileTime);
244 windows_time = ((uint64_t)fileTime.dwHighDateTime << 32) + fileTime.dwLowDateTime;
245 /* Divide by 10,000 to convert to ms and subtract the time between 1601 and 1970 */
246 unix_time = (((windows_time)/10000) - MILLISECONDS_BETWEEN_1601_AND_1970);
247 /* unix_time is now the number of milliseconds since 1970 (the Unix epoch) */
248 tp->tv_sec = unix_time / 1000;
249 tp->tv_usec = (unix_time % 1000) * 1000;
253 int sigaction(int sig, const struct sigaction *act,
254 struct sigaction *oact)
257 void (*prev_handler)(int);
259 prev_handler = signal(sig, act->sa_handler);
261 oact->sa_handler = prev_handler;
263 if (prev_handler == SIG_ERR)
269 int lstat(const char * path, struct stat * buf)
271 return stat(path, buf);
274 void *mmap(void *addr, size_t len, int prot, int flags,
275 int fildes, off_t off)
278 void* allocAddr = NULL;
280 if (prot & PROT_NONE)
281 vaProt |= PAGE_NOACCESS;
283 if ((prot & PROT_READ) && !(prot & PROT_WRITE))
284 vaProt |= PAGE_READONLY;
286 if (prot & PROT_WRITE)
287 vaProt |= PAGE_READWRITE;
289 if ((flags & MAP_ANON) | (flags & MAP_ANONYMOUS))
291 allocAddr = VirtualAlloc(addr, len, MEM_COMMIT, vaProt);
292 if (allocAddr == NULL)
293 errno = win_to_posix_error(GetLastError());
299 int munmap(void *addr, size_t len)
301 if (!VirtualFree(addr, 0, MEM_RELEASE)) {
302 errno = win_to_posix_error(GetLastError());
311 log_err("%s is not implemented\n", __func__);
318 log_err("%s is not implemented\n", __func__);
323 static HANDLE log_file = INVALID_HANDLE_VALUE;
325 void openlog(const char *ident, int logopt, int facility)
327 if (log_file == INVALID_HANDLE_VALUE)
328 log_file = CreateFileA("syslog.txt", GENERIC_WRITE, FILE_SHARE_READ | FILE_SHARE_WRITE, NULL, OPEN_ALWAYS, 0, NULL);
333 CloseHandle(log_file);
334 log_file = INVALID_HANDLE_VALUE;
337 void syslog(int priority, const char *message, ... /* argument */)
344 if (log_file == INVALID_HANDLE_VALUE) {
345 log_file = CreateFileA("syslog.txt", GENERIC_WRITE, FILE_SHARE_READ | FILE_SHARE_WRITE, NULL, OPEN_ALWAYS, 0, NULL);
348 if (log_file == INVALID_HANDLE_VALUE) {
349 log_err("syslog: failed to open log file\n");
353 va_start(v, message);
354 len = _vscprintf(message, v);
355 output = malloc(len + sizeof(char));
356 vsprintf(output, message, v);
357 WriteFile(log_file, output, len, &bytes_written, NULL);
362 int kill(pid_t pid, int sig)
369 * This is assumed to be used only by the network code,
370 * and so doesn't try and handle any of the other cases
372 int fcntl(int fildes, int cmd, ...)
375 * non-blocking mode doesn't work the same as in BSD sockets,
380 int val, opt, status;
384 else if (cmd != F_SETFL) {
391 opt = va_arg(ap, int);
392 if (opt & O_NONBLOCK)
397 status = ioctlsocket((SOCKET)fildes, opt, &val);
399 if (status == SOCKET_ERROR) {
412 * Get the value of a local clock source.
413 * This implementation supports 2 clocks: CLOCK_MONOTONIC provides high-accuracy
414 * relative time, while CLOCK_REALTIME provides a low-accuracy wall time.
416 int clock_gettime(clockid_t clock_id, struct timespec *tp)
420 if (clock_id == CLOCK_MONOTONIC)
422 static LARGE_INTEGER freq = {{0,0}};
423 LARGE_INTEGER counts;
425 QueryPerformanceCounter(&counts);
426 if (freq.QuadPart == 0)
427 QueryPerformanceFrequency(&freq);
429 tp->tv_sec = counts.QuadPart / freq.QuadPart;
430 /* Get the difference between the number of ns stored
431 * in 'tv_sec' and that stored in 'counts' */
432 uint64_t t = tp->tv_sec * freq.QuadPart;
433 t = counts.QuadPart - t;
434 /* 't' now contains the number of cycles since the last second.
435 * We want the number of nanoseconds, so multiply out by 1,000,000,000
436 * and then divide by the frequency. */
438 tp->tv_nsec = t / freq.QuadPart;
440 else if (clock_id == CLOCK_REALTIME)
442 /* clock_gettime(CLOCK_REALTIME,...) is just an alias for gettimeofday with a
443 * higher-precision field. */
445 gettimeofday(&tv, NULL);
446 tp->tv_sec = tv.tv_sec;
447 tp->tv_nsec = tv.tv_usec * 1000;
456 int mlock(const void * addr, size_t len)
460 HANDLE process = GetCurrentProcess();
462 success = GetProcessWorkingSetSize(process, &min, &max);
464 errno = win_to_posix_error(GetLastError());
470 success = SetProcessWorkingSetSize(process, min, max);
472 errno = win_to_posix_error(GetLastError());
476 success = VirtualLock((LPVOID)addr, len);
478 errno = win_to_posix_error(GetLastError());
485 int munlock(const void * addr, size_t len)
487 BOOL success = VirtualUnlock((LPVOID)addr, len);
489 errno = win_to_posix_error(GetLastError());
496 pid_t waitpid(pid_t pid, int *stat_loc, int options)
498 log_err("%s is not implemented\n", __func__);
503 int usleep(useconds_t useconds)
505 Sleep(useconds / 1000);
509 char *basename(char *path)
511 static char name[MAX_PATH];
514 if (path == NULL || strlen(path) == 0)
517 i = strlen(path) - 1;
519 while (path[i] != '\\' && path[i] != '/' && i >= 0)
522 strncpy(name, path + i + 1, MAX_PATH);
527 int fsync(int fildes)
529 HANDLE hFile = (HANDLE)_get_osfhandle(fildes);
530 if (!FlushFileBuffers(hFile)) {
531 errno = win_to_posix_error(GetLastError());
538 int nFileMappings = 0;
539 HANDLE fileMappings[1024];
541 int shmget(key_t key, size_t size, int shmflg)
544 uint32_t size_low = size & 0xFFFFFFFF;
545 uint32_t size_high = ((uint64_t)size) >> 32;
546 HANDLE hMapping = CreateFileMapping(INVALID_HANDLE_VALUE, NULL, (PAGE_EXECUTE_READWRITE | SEC_RESERVE), size_high, size_low, NULL);
547 if (hMapping != NULL) {
548 fileMappings[nFileMappings] = hMapping;
549 mapid = nFileMappings;
558 void *shmat(int shmid, const void *shmaddr, int shmflg)
561 MEMORY_BASIC_INFORMATION memInfo;
562 mapAddr = MapViewOfFile(fileMappings[shmid], FILE_MAP_ALL_ACCESS, 0, 0, 0);
563 if (mapAddr == NULL) {
564 errno = win_to_posix_error(GetLastError());
568 if (VirtualQuery(mapAddr, &memInfo, sizeof(memInfo)) == 0) {
569 errno = win_to_posix_error(GetLastError());
573 mapAddr = VirtualAlloc(mapAddr, memInfo.RegionSize, MEM_COMMIT, PAGE_READWRITE);
574 if (mapAddr == NULL) {
575 errno = win_to_posix_error(GetLastError());
582 int shmdt(const void *shmaddr)
584 if (!UnmapViewOfFile(shmaddr)) {
585 errno = win_to_posix_error(GetLastError());
592 int shmctl(int shmid, int cmd, struct shmid_ds *buf)
594 if (cmd == IPC_RMID) {
595 fileMappings[shmid] = INVALID_HANDLE_VALUE;
598 log_err("%s is not implemented\n", __func__);
604 int setuid(uid_t uid)
606 log_err("%s is not implemented\n", __func__);
611 int setgid(gid_t gid)
613 log_err("%s is not implemented\n", __func__);
628 int getrusage(int who, struct rusage *r_usage)
630 const uint64_t SECONDS_BETWEEN_1601_AND_1970 = 11644473600;
631 FILETIME cTime, eTime, kTime, uTime;
635 memset(r_usage, 0, sizeof(*r_usage));
637 if (who == RUSAGE_SELF) {
638 h = GetCurrentProcess();
639 GetProcessTimes(h, &cTime, &eTime, &kTime, &uTime);
640 } else if (who == RUSAGE_THREAD) {
641 h = GetCurrentThread();
642 GetThreadTimes(h, &cTime, &eTime, &kTime, &uTime);
644 log_err("fio: getrusage %d is not implemented\n", who);
648 time = ((uint64_t)uTime.dwHighDateTime << 32) + uTime.dwLowDateTime;
649 /* Divide by 10,000,000 to get the number of seconds and move the epoch from
651 time = (time_t)(((time)/10000000) - SECONDS_BETWEEN_1601_AND_1970);
652 r_usage->ru_utime.tv_sec = time;
653 /* getrusage() doesn't care about anything other than seconds, so set tv_usec to 0 */
654 r_usage->ru_utime.tv_usec = 0;
655 time = ((uint64_t)kTime.dwHighDateTime << 32) + kTime.dwLowDateTime;
656 /* Divide by 10,000,000 to get the number of seconds and move the epoch from
658 time = (time_t)(((time)/10000000) - SECONDS_BETWEEN_1601_AND_1970);
659 r_usage->ru_stime.tv_sec = time;
660 r_usage->ru_stime.tv_usec = 0;
664 int posix_fadvise(int fd, off_t offset, off_t len, int advice)
669 int posix_madvise(void *addr, size_t len, int advice)
671 log_err("%s is not implemented\n", __func__);
675 /* Windows doesn't support advice for memory pages. Just ignore it. */
676 int msync(void *addr, size_t len, int flags)
682 int fdatasync(int fildes)
684 return fsync(fildes);
687 ssize_t pwrite(int fildes, const void *buf, size_t nbyte,
690 int64_t pos = _telli64(fildes);
691 ssize_t len = _write(fildes, buf, nbyte);
692 _lseeki64(fildes, pos, SEEK_SET);
696 ssize_t pread(int fildes, void *buf, size_t nbyte, off_t offset)
698 int64_t pos = _telli64(fildes);
699 ssize_t len = read(fildes, buf, nbyte);
700 _lseeki64(fildes, pos, SEEK_SET);
704 ssize_t readv(int fildes, const struct iovec *iov, int iovcnt)
706 log_err("%s is not implemented\n", __func__);
711 ssize_t writev(int fildes, const struct iovec *iov, int iovcnt)
713 log_err("%s is not implemented\n", __func__);
718 long long strtoll(const char *restrict str, char **restrict endptr,
721 return _strtoi64(str, endptr, base);
724 int poll(struct pollfd fds[], nfds_t nfds, int timeout)
727 struct timeval *to = NULL;
728 fd_set readfds, writefds, exceptfds;
734 to->tv_sec = timeout / 1000;
735 to->tv_usec = (timeout % 1000) * 1000;
742 for (i = 0; i < nfds; i++)
749 if (fds[i].events & POLLIN)
750 FD_SET(fds[i].fd, &readfds);
752 if (fds[i].events & POLLOUT)
753 FD_SET(fds[i].fd, &writefds);
755 FD_SET(fds[i].fd, &exceptfds);
758 rc = select(nfds, &readfds, &writefds, &exceptfds, to);
760 if (rc != SOCKET_ERROR) {
761 for (i = 0; i < nfds; i++)
767 if ((fds[i].events & POLLIN) && FD_ISSET(fds[i].fd, &readfds))
768 fds[i].revents |= POLLIN;
770 if ((fds[i].events & POLLOUT) && FD_ISSET(fds[i].fd, &writefds))
771 fds[i].revents |= POLLOUT;
773 if (FD_ISSET(fds[i].fd, &exceptfds))
774 fds[i].revents |= POLLHUP;
781 int nanosleep(const struct timespec *rqtp, struct timespec *rmtp)
785 DWORD ms_total = (rqtp->tv_sec * 1000) + (rqtp->tv_nsec / 1000000.0);
790 ms_remaining = ms_total;
792 /* Since Sleep() can sleep for less than the requested time, add a loop to
793 ensure we only return after the requested length of time has elapsed */
795 fio_gettime(&tv, NULL);
797 ms_remaining = ms_total - mtime_since_now(&tv);
798 } while (ms_remaining > 0 && ms_remaining < ms_total);
800 /* this implementation will never sleep for less than the requested time */
809 DIR *opendir(const char *dirname)
811 struct dirent_ctx *dc = NULL;
813 /* See if we can open it. If not, we'll return an error here */
814 HANDLE file = CreateFileA(dirname, 0, FILE_SHARE_READ | FILE_SHARE_WRITE, NULL, OPEN_EXISTING, FILE_FLAG_BACKUP_SEMANTICS, NULL);
815 if (file != INVALID_HANDLE_VALUE) {
817 dc = (struct dirent_ctx*)malloc(sizeof(struct dirent_ctx));
818 StringCchCopyA(dc->dirname, MAX_PATH, dirname);
819 dc->find_handle = INVALID_HANDLE_VALUE;
821 DWORD error = GetLastError();
822 if (error == ERROR_FILE_NOT_FOUND)
825 else if (error == ERROR_PATH_NOT_FOUND)
827 else if (error == ERROR_TOO_MANY_OPEN_FILES)
829 else if (error == ERROR_ACCESS_DENIED)
838 int closedir(DIR *dirp)
840 if (dirp != NULL && dirp->find_handle != INVALID_HANDLE_VALUE)
841 FindClose(dirp->find_handle);
847 struct dirent *readdir(DIR *dirp)
849 static struct dirent de;
850 WIN32_FIND_DATA find_data;
855 if (dirp->find_handle == INVALID_HANDLE_VALUE) {
856 char search_pattern[MAX_PATH];
857 StringCchPrintfA(search_pattern, MAX_PATH, "%s\\*", dirp->dirname);
858 dirp->find_handle = FindFirstFileA(search_pattern, &find_data);
859 if (dirp->find_handle == INVALID_HANDLE_VALUE)
862 if (!FindNextFile(dirp->find_handle, &find_data))
866 StringCchCopyA(de.d_name, MAX_PATH, find_data.cFileName);
874 log_err("%s is not implemented\n", __func__);
879 const char* inet_ntop(int af, const void *restrict src,
880 char *restrict dst, socklen_t size)
882 INT status = SOCKET_ERROR;
886 if (af != AF_INET && af != AF_INET6) {
887 errno = EAFNOSUPPORT;
891 WSAStartup(MAKEWORD(2,2), &wsd);
894 struct sockaddr_in si;
896 memset(&si, 0, sizeof(si));
898 memcpy(&si.sin_addr, src, sizeof(si.sin_addr));
899 status = WSAAddressToString((struct sockaddr*)&si, sizeof(si), NULL, dst, &len);
900 } else if (af == AF_INET6) {
901 struct sockaddr_in6 si6;
903 memset(&si6, 0, sizeof(si6));
904 si6.sin6_family = af;
905 memcpy(&si6.sin6_addr, src, sizeof(si6.sin6_addr));
906 status = WSAAddressToString((struct sockaddr*)&si6, sizeof(si6), NULL, dst, &len);
909 if (status != SOCKET_ERROR)
919 int inet_pton(int af, const char *restrict src, void *restrict dst)
921 INT status = SOCKET_ERROR;
925 if (af != AF_INET && af != AF_INET6) {
926 errno = EAFNOSUPPORT;
930 WSAStartup(MAKEWORD(2,2), &wsd);
933 struct sockaddr_in si;
934 INT len = sizeof(si);
935 memset(&si, 0, sizeof(si));
937 status = WSAStringToAddressA((char*)src, af, NULL, (struct sockaddr*)&si, &len);
938 if (status != SOCKET_ERROR)
939 memcpy(dst, &si.sin_addr, sizeof(si.sin_addr));
940 } else if (af == AF_INET6) {
941 struct sockaddr_in6 si6;
942 INT len = sizeof(si6);
943 memset(&si6, 0, sizeof(si6));
944 si6.sin6_family = af;
945 status = WSAStringToAddressA((char*)src, af, NULL, (struct sockaddr*)&si6, &len);
946 if (status != SOCKET_ERROR)
947 memcpy(dst, &si6.sin6_addr, sizeof(si6.sin6_addr));
950 if (status == SOCKET_ERROR) {