fs: introduce f_op->mmap_capabilities for nommu mmap support
[linux-block.git] / drivers / char / mem.c
CommitLineData
1da177e4
LT
1/*
2 * linux/drivers/char/mem.c
3 *
4 * Copyright (C) 1991, 1992 Linus Torvalds
5 *
d7d4d849 6 * Added devfs support.
1da177e4 7 * Jan-11-1998, C. Scott Ananian <cananian@alumni.princeton.edu>
af901ca1 8 * Shared /dev/zero mmapping support, Feb 2000, Kanoj Sarcar <kanoj@sgi.com>
1da177e4
LT
9 */
10
1da177e4
LT
11#include <linux/mm.h>
12#include <linux/miscdevice.h>
13#include <linux/slab.h>
14#include <linux/vmalloc.h>
15#include <linux/mman.h>
16#include <linux/random.h>
17#include <linux/init.h>
18#include <linux/raw.h>
19#include <linux/tty.h>
20#include <linux/capability.h>
1da177e4
LT
21#include <linux/ptrace.h>
22#include <linux/device.h>
50b1fdbd 23#include <linux/highmem.h>
1da177e4 24#include <linux/backing-dev.h>
d6b29d7c 25#include <linux/splice.h>
b8a3ad5b 26#include <linux/pfn.h>
66300e66 27#include <linux/export.h>
e1612de9 28#include <linux/io.h>
a27bb332 29#include <linux/aio.h>
1da177e4
LT
30
31#include <asm/uaccess.h>
1da177e4
LT
32
33#ifdef CONFIG_IA64
34# include <linux/efi.h>
35#endif
36
e1612de9
HM
/* Minor number of the "port" entry in devlist[]; chr_dev_init() tests it before creating that node. */
37#define DEVPORT_MINOR 4
38
f222318e
WF
39static inline unsigned long size_inside_page(unsigned long start,
40 unsigned long size)
41{
42 unsigned long sz;
43
7fabaddd 44 sz = PAGE_SIZE - (start & (PAGE_SIZE - 1));
f222318e 45
7fabaddd 46 return min(sz, size);
f222318e
WF
47}
48
1da177e4 49#ifndef ARCH_HAS_VALID_PHYS_ADDR_RANGE
7e6735c3 50static inline int valid_phys_addr_range(phys_addr_t addr, size_t count)
1da177e4 51{
cfaf346c 52 return addr + count <= __pa(high_memory);
1da177e4 53}
80851ef2 54
06c67bef 55static inline int valid_mmap_phys_addr_range(unsigned long pfn, size_t size)
80851ef2
BH
56{
57 return 1;
58}
1da177e4
LT
59#endif
60
d092633b 61#ifdef CONFIG_STRICT_DEVMEM
e2beb3ea 62static inline int range_is_allowed(unsigned long pfn, unsigned long size)
ae531c26 63{
e2beb3ea
VP
64 u64 from = ((u64)pfn) << PAGE_SHIFT;
65 u64 to = from + size;
66 u64 cursor = from;
67
68 while (cursor < to) {
69 if (!devmem_is_allowed(pfn)) {
70 printk(KERN_INFO
71 "Program %s tried to access /dev/mem between %Lx->%Lx.\n",
ae531c26
AV
72 current->comm, from, to);
73 return 0;
74 }
e2beb3ea
VP
75 cursor += PAGE_SIZE;
76 pfn++;
ae531c26
AV
77 }
78 return 1;
79}
80#else
/*
 * Variant used when CONFIG_STRICT_DEVMEM is not set: no restriction is
 * applied, every range is reported as allowed.
 */
static inline int range_is_allowed(unsigned long pfn, unsigned long size)
{
	return 1;
}
85#endif
86
4707a341
TR
87#ifndef unxlate_dev_mem_ptr
88#define unxlate_dev_mem_ptr unxlate_dev_mem_ptr
89void __weak unxlate_dev_mem_ptr(phys_addr_t phys, void *addr)
e045fb2a 90{
91}
4707a341 92#endif
e045fb2a 93
1da177e4 94/*
d7d4d849
AM
95 * This function reads the *physical* memory. The f_pos points directly to the
96 * memory location.
1da177e4 97 */
d7d4d849 98static ssize_t read_mem(struct file *file, char __user *buf,
1da177e4
LT
99 size_t count, loff_t *ppos)
100{
7e6735c3 101 phys_addr_t p = *ppos;
1da177e4 102 ssize_t read, sz;
4707a341 103 void *ptr;
1da177e4 104
08d2d00b
PT
105 if (p != *ppos)
106 return 0;
107
136939a2 108 if (!valid_phys_addr_range(p, count))
1da177e4
LT
109 return -EFAULT;
110 read = 0;
111#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
112 /* we don't have page 0 mapped on sparc and m68k.. */
113 if (p < PAGE_SIZE) {
7fabaddd 114 sz = size_inside_page(p, count);
1da177e4
LT
115 if (sz > 0) {
116 if (clear_user(buf, sz))
117 return -EFAULT;
d7d4d849
AM
118 buf += sz;
119 p += sz;
120 count -= sz;
121 read += sz;
1da177e4
LT
122 }
123 }
124#endif
125
126 while (count > 0) {
fa29e97b
WF
127 unsigned long remaining;
128
f222318e 129 sz = size_inside_page(p, count);
1da177e4 130
e045fb2a 131 if (!range_is_allowed(p >> PAGE_SHIFT, count))
132 return -EPERM;
133
1da177e4 134 /*
d7d4d849
AM
135 * On ia64 if a page has been mapped somewhere as uncached, then
136 * it must also be accessed uncached by the kernel or data
137 * corruption may occur.
1da177e4
LT
138 */
139 ptr = xlate_dev_mem_ptr(p);
e045fb2a 140 if (!ptr)
141 return -EFAULT;
1da177e4 142
fa29e97b 143 remaining = copy_to_user(buf, ptr, sz);
e045fb2a 144 unxlate_dev_mem_ptr(p, ptr);
fa29e97b
WF
145 if (remaining)
146 return -EFAULT;
e045fb2a 147
1da177e4
LT
148 buf += sz;
149 p += sz;
150 count -= sz;
151 read += sz;
152 }
153
154 *ppos += read;
155 return read;
156}
157
d7d4d849 158static ssize_t write_mem(struct file *file, const char __user *buf,
1da177e4
LT
159 size_t count, loff_t *ppos)
160{
7e6735c3 161 phys_addr_t p = *ppos;
1da177e4
LT
162 ssize_t written, sz;
163 unsigned long copied;
164 void *ptr;
165
08d2d00b
PT
166 if (p != *ppos)
167 return -EFBIG;
168
136939a2 169 if (!valid_phys_addr_range(p, count))
1da177e4
LT
170 return -EFAULT;
171
172 written = 0;
173
174#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
175 /* we don't have page 0 mapped on sparc and m68k.. */
176 if (p < PAGE_SIZE) {
7fabaddd 177 sz = size_inside_page(p, count);
1da177e4
LT
178 /* Hmm. Do something? */
179 buf += sz;
180 p += sz;
181 count -= sz;
182 written += sz;
183 }
184#endif
185
186 while (count > 0) {
f222318e 187 sz = size_inside_page(p, count);
1da177e4 188
e045fb2a 189 if (!range_is_allowed(p >> PAGE_SHIFT, sz))
190 return -EPERM;
191
1da177e4 192 /*
d7d4d849
AM
193 * On ia64 if a page has been mapped somewhere as uncached, then
194 * it must also be accessed uncached by the kernel or data
195 * corruption may occur.
1da177e4
LT
196 */
197 ptr = xlate_dev_mem_ptr(p);
e045fb2a 198 if (!ptr) {
199 if (written)
200 break;
201 return -EFAULT;
202 }
1da177e4
LT
203
204 copied = copy_from_user(ptr, buf, sz);
fa29e97b 205 unxlate_dev_mem_ptr(p, ptr);
1da177e4 206 if (copied) {
c654d60e
JB
207 written += sz - copied;
208 if (written)
209 break;
1da177e4
LT
210 return -EFAULT;
211 }
e045fb2a 212
1da177e4
LT
213 buf += sz;
214 p += sz;
215 count -= sz;
216 written += sz;
217 }
218
219 *ppos += written;
220 return written;
221}
222
d7d4d849 223int __weak phys_mem_access_prot_allowed(struct file *file,
f0970c13 224 unsigned long pfn, unsigned long size, pgprot_t *vma_prot)
225{
226 return 1;
227}
228
44ac8413 229#ifndef __HAVE_PHYS_MEM_ACCESS_PROT
d7d4d849
AM
230
231/*
232 * Architectures vary in how they handle caching for addresses
233 * outside of main memory.
234 *
235 */
ea56f411 236#ifdef pgprot_noncached
7e6735c3 237static int uncached_access(struct file *file, phys_addr_t addr)
d7d4d849
AM
238{
239#if defined(CONFIG_IA64)
240 /*
241 * On ia64, we ignore O_DSYNC because we cannot tolerate memory
242 * attribute aliases.
243 */
244 return !(efi_mem_attributes(addr) & EFI_MEMORY_WB);
245#elif defined(CONFIG_MIPS)
246 {
247 extern int __uncached_access(struct file *file,
248 unsigned long addr);
249
250 return __uncached_access(file, addr);
251 }
252#else
253 /*
254 * Accessing memory above the top the kernel knows about or through a
255 * file pointer
256 * that was marked O_DSYNC will be done non-cached.
257 */
258 if (file->f_flags & O_DSYNC)
259 return 1;
260 return addr >= __pa(high_memory);
261#endif
262}
ea56f411 263#endif
d7d4d849 264
44ac8413
BH
265static pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
266 unsigned long size, pgprot_t vma_prot)
267{
268#ifdef pgprot_noncached
7e6735c3 269 phys_addr_t offset = pfn << PAGE_SHIFT;
44ac8413
BH
270
271 if (uncached_access(file, offset))
272 return pgprot_noncached(vma_prot);
273#endif
274 return vma_prot;
275}
276#endif
277
5da6185b
DH
278#ifndef CONFIG_MMU
279static unsigned long get_unmapped_area_mem(struct file *file,
280 unsigned long addr,
281 unsigned long len,
282 unsigned long pgoff,
283 unsigned long flags)
284{
285 if (!valid_mmap_phys_addr_range(pgoff, len))
286 return (unsigned long) -EINVAL;
8a93258c 287 return pgoff << PAGE_SHIFT;
5da6185b
DH
288}
289
b4caecd4
CH
290/* permit direct mmap, for read, write or exec */
291static unsigned memory_mmap_capabilities(struct file *file)
292{
293 return NOMMU_MAP_DIRECT |
294 NOMMU_MAP_READ | NOMMU_MAP_WRITE | NOMMU_MAP_EXEC;
295}
296
297static unsigned zero_mmap_capabilities(struct file *file)
298{
299 return NOMMU_MAP_COPY;
300}
301
5da6185b
DH
302/* can't do an in-place private mapping if there's no MMU */
303static inline int private_mapping_ok(struct vm_area_struct *vma)
304{
305 return vma->vm_flags & VM_MAYSHARE;
306}
307#else
5da6185b
DH
308
/* CONFIG_MMU variant: every mapping, private or shared, is acceptable. */
static inline int private_mapping_ok(struct vm_area_struct *vma)
{
	return 1;
}
313#endif
314
f0f37e2f 315static const struct vm_operations_struct mmap_mem_ops = {
7ae8ed50
RR
316#ifdef CONFIG_HAVE_IOREMAP_PROT
317 .access = generic_access_phys
318#endif
e7f260a2 319};
320
d7d4d849 321static int mmap_mem(struct file *file, struct vm_area_struct *vma)
1da177e4 322{
80851ef2
BH
323 size_t size = vma->vm_end - vma->vm_start;
324
06c67bef 325 if (!valid_mmap_phys_addr_range(vma->vm_pgoff, size))
80851ef2
BH
326 return -EINVAL;
327
5da6185b
DH
328 if (!private_mapping_ok(vma))
329 return -ENOSYS;
330
e2beb3ea
VP
331 if (!range_is_allowed(vma->vm_pgoff, size))
332 return -EPERM;
333
f0970c13 334 if (!phys_mem_access_prot_allowed(file, vma->vm_pgoff, size,
335 &vma->vm_page_prot))
336 return -EINVAL;
337
8b150478 338 vma->vm_page_prot = phys_mem_access_prot(file, vma->vm_pgoff,
80851ef2 339 size,
1da177e4 340 vma->vm_page_prot);
1da177e4 341
e7f260a2 342 vma->vm_ops = &mmap_mem_ops;
343
314e51b9 344 /* Remap-pfn-range will mark the range VM_IO */
1da177e4
LT
345 if (remap_pfn_range(vma,
346 vma->vm_start,
347 vma->vm_pgoff,
80851ef2 348 size,
e7f260a2 349 vma->vm_page_prot)) {
1da177e4 350 return -EAGAIN;
e7f260a2 351 }
1da177e4
LT
352 return 0;
353}
354
b781ecb6 355#ifdef CONFIG_DEVKMEM
d7d4d849 356static int mmap_kmem(struct file *file, struct vm_area_struct *vma)
1da177e4 357{
4bb82551
LT
358 unsigned long pfn;
359
6d3154cc
LT
360 /* Turn a kernel-virtual address into a physical page frame */
361 pfn = __pa((u64)vma->vm_pgoff << PAGE_SHIFT) >> PAGE_SHIFT;
4bb82551 362
1da177e4 363 /*
d7d4d849
AM
364 * RED-PEN: on some architectures there is more mapped memory than
365 * available in mem_map which pfn_valid checks for. Perhaps should add a
366 * new macro here.
1da177e4
LT
367 *
368 * RED-PEN: vmalloc is not supported right now.
369 */
4bb82551 370 if (!pfn_valid(pfn))
1da177e4 371 return -EIO;
4bb82551
LT
372
373 vma->vm_pgoff = pfn;
1da177e4
LT
374 return mmap_mem(file, vma);
375}
b781ecb6 376#endif
1da177e4 377
b781ecb6 378#ifdef CONFIG_DEVKMEM
1da177e4
LT
379/*
380 * This function reads the *virtual* memory as seen by the kernel.
381 */
d7d4d849 382static ssize_t read_kmem(struct file *file, char __user *buf,
1da177e4
LT
383 size_t count, loff_t *ppos)
384{
385 unsigned long p = *ppos;
386 ssize_t low_count, read, sz;
890537b3 387 char *kbuf; /* k-addr because vread() takes vmlist_lock rwlock */
325fda71 388 int err = 0;
1da177e4
LT
389
390 read = 0;
391 if (p < (unsigned long) high_memory) {
392 low_count = count;
d7d4d849
AM
393 if (count > (unsigned long)high_memory - p)
394 low_count = (unsigned long)high_memory - p;
1da177e4
LT
395
396#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
397 /* we don't have page 0 mapped on sparc and m68k.. */
398 if (p < PAGE_SIZE && low_count > 0) {
7fabaddd
WF
399 sz = size_inside_page(p, low_count);
400 if (clear_user(buf, sz))
1da177e4 401 return -EFAULT;
7fabaddd
WF
402 buf += sz;
403 p += sz;
404 read += sz;
405 low_count -= sz;
406 count -= sz;
1da177e4
LT
407 }
408#endif
409 while (low_count > 0) {
f222318e 410 sz = size_inside_page(p, low_count);
1da177e4
LT
411
412 /*
413 * On ia64 if a page has been mapped somewhere as
414 * uncached, then it must also be accessed uncached
415 * by the kernel or data corruption may occur
416 */
4707a341 417 kbuf = xlate_dev_kmem_ptr((void *)p);
1da177e4
LT
418
419 if (copy_to_user(buf, kbuf, sz))
420 return -EFAULT;
421 buf += sz;
422 p += sz;
423 read += sz;
424 low_count -= sz;
425 count -= sz;
426 }
427 }
428
429 if (count > 0) {
430 kbuf = (char *)__get_free_page(GFP_KERNEL);
431 if (!kbuf)
432 return -ENOMEM;
433 while (count > 0) {
80ad89a0 434 sz = size_inside_page(p, count);
325fda71
KH
435 if (!is_vmalloc_or_module_addr((void *)p)) {
436 err = -ENXIO;
437 break;
438 }
80ad89a0
WF
439 sz = vread(kbuf, (char *)p, sz);
440 if (!sz)
1da177e4 441 break;
80ad89a0 442 if (copy_to_user(buf, kbuf, sz)) {
325fda71
KH
443 err = -EFAULT;
444 break;
1da177e4 445 }
80ad89a0
WF
446 count -= sz;
447 buf += sz;
448 read += sz;
449 p += sz;
1da177e4
LT
450 }
451 free_page((unsigned long)kbuf);
452 }
325fda71
KH
453 *ppos = p;
454 return read ? read : err;
1da177e4
LT
455}
456
457
d7d4d849
AM
458static ssize_t do_write_kmem(unsigned long p, const char __user *buf,
459 size_t count, loff_t *ppos)
1da177e4
LT
460{
461 ssize_t written, sz;
462 unsigned long copied;
463
464 written = 0;
465#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
466 /* we don't have page 0 mapped on sparc and m68k.. */
ee32398f
WF
467 if (p < PAGE_SIZE) {
468 sz = size_inside_page(p, count);
1da177e4
LT
469 /* Hmm. Do something? */
470 buf += sz;
471 p += sz;
1da177e4
LT
472 count -= sz;
473 written += sz;
474 }
475#endif
476
477 while (count > 0) {
4707a341 478 void *ptr;
1da177e4 479
ee32398f 480 sz = size_inside_page(p, count);
1da177e4
LT
481
482 /*
d7d4d849
AM
483 * On ia64 if a page has been mapped somewhere as uncached, then
484 * it must also be accessed uncached by the kernel or data
485 * corruption may occur.
1da177e4 486 */
4707a341 487 ptr = xlate_dev_kmem_ptr((void *)p);
1da177e4
LT
488
489 copied = copy_from_user(ptr, buf, sz);
490 if (copied) {
c654d60e
JB
491 written += sz - copied;
492 if (written)
493 break;
1da177e4
LT
494 return -EFAULT;
495 }
496 buf += sz;
497 p += sz;
1da177e4
LT
498 count -= sz;
499 written += sz;
500 }
501
502 *ppos += written;
503 return written;
504}
505
1da177e4
LT
506/*
507 * This function writes to the *virtual* memory as seen by the kernel.
508 */
d7d4d849 509static ssize_t write_kmem(struct file *file, const char __user *buf,
1da177e4
LT
510 size_t count, loff_t *ppos)
511{
512 unsigned long p = *ppos;
513 ssize_t wrote = 0;
514 ssize_t virtr = 0;
890537b3 515 char *kbuf; /* k-addr because vwrite() takes vmlist_lock rwlock */
325fda71 516 int err = 0;
1da177e4
LT
517
518 if (p < (unsigned long) high_memory) {
80ad89a0
WF
519 unsigned long to_write = min_t(unsigned long, count,
520 (unsigned long)high_memory - p);
ee32398f 521 wrote = do_write_kmem(p, buf, to_write, ppos);
80ad89a0
WF
522 if (wrote != to_write)
523 return wrote;
1da177e4
LT
524 p += wrote;
525 buf += wrote;
526 count -= wrote;
527 }
528
529 if (count > 0) {
530 kbuf = (char *)__get_free_page(GFP_KERNEL);
531 if (!kbuf)
532 return wrote ? wrote : -ENOMEM;
533 while (count > 0) {
80ad89a0
WF
534 unsigned long sz = size_inside_page(p, count);
535 unsigned long n;
1da177e4 536
325fda71
KH
537 if (!is_vmalloc_or_module_addr((void *)p)) {
538 err = -ENXIO;
539 break;
540 }
80ad89a0
WF
541 n = copy_from_user(kbuf, buf, sz);
542 if (n) {
325fda71
KH
543 err = -EFAULT;
544 break;
1da177e4 545 }
c85e9a97 546 vwrite(kbuf, (char *)p, sz);
80ad89a0
WF
547 count -= sz;
548 buf += sz;
549 virtr += sz;
550 p += sz;
1da177e4
LT
551 }
552 free_page((unsigned long)kbuf);
553 }
554
325fda71
KH
555 *ppos = p;
556 return virtr + wrote ? : err;
1da177e4 557}
b781ecb6 558#endif
1da177e4 559
4f911d64 560#ifdef CONFIG_DEVPORT
d7d4d849 561static ssize_t read_port(struct file *file, char __user *buf,
1da177e4
LT
562 size_t count, loff_t *ppos)
563{
564 unsigned long i = *ppos;
565 char __user *tmp = buf;
566
567 if (!access_ok(VERIFY_WRITE, buf, count))
d7d4d849 568 return -EFAULT;
1da177e4 569 while (count-- > 0 && i < 65536) {
d7d4d849
AM
570 if (__put_user(inb(i), tmp) < 0)
571 return -EFAULT;
1da177e4
LT
572 i++;
573 tmp++;
574 }
575 *ppos = i;
576 return tmp-buf;
577}
578
d7d4d849 579static ssize_t write_port(struct file *file, const char __user *buf,
1da177e4
LT
580 size_t count, loff_t *ppos)
581{
582 unsigned long i = *ppos;
890537b3 583 const char __user *tmp = buf;
1da177e4 584
d7d4d849 585 if (!access_ok(VERIFY_READ, buf, count))
1da177e4
LT
586 return -EFAULT;
587 while (count-- > 0 && i < 65536) {
588 char c;
c654d60e
JB
589 if (__get_user(c, tmp)) {
590 if (tmp > buf)
591 break;
d7d4d849 592 return -EFAULT;
c654d60e 593 }
d7d4d849 594 outb(c, i);
1da177e4
LT
595 i++;
596 tmp++;
597 }
598 *ppos = i;
599 return tmp-buf;
600}
601#endif
602
d7d4d849 603static ssize_t read_null(struct file *file, char __user *buf,
1da177e4
LT
604 size_t count, loff_t *ppos)
605{
606 return 0;
607}
608
d7d4d849 609static ssize_t write_null(struct file *file, const char __user *buf,
1da177e4
LT
610 size_t count, loff_t *ppos)
611{
612 return count;
613}
614
162934de
ZB
615static ssize_t aio_read_null(struct kiocb *iocb, const struct iovec *iov,
616 unsigned long nr_segs, loff_t pos)
617{
618 return 0;
619}
620
621static ssize_t aio_write_null(struct kiocb *iocb, const struct iovec *iov,
622 unsigned long nr_segs, loff_t pos)
623{
624 return iov_length(iov, nr_segs);
625}
626
1ebd32fc
JA
627static int pipe_to_null(struct pipe_inode_info *info, struct pipe_buffer *buf,
628 struct splice_desc *sd)
629{
630 return sd->len;
631}
632
d7d4d849 633static ssize_t splice_write_null(struct pipe_inode_info *pipe, struct file *out,
1ebd32fc
JA
634 loff_t *ppos, size_t len, unsigned int flags)
635{
636 return splice_from_pipe(pipe, out, ppos, len, flags, pipe_to_null);
637}
638
13ba33e8 639static ssize_t read_iter_zero(struct kiocb *iocb, struct iov_iter *iter)
1da177e4 640{
13ba33e8 641 size_t written = 0;
1da177e4 642
13ba33e8
AV
643 while (iov_iter_count(iter)) {
644 size_t chunk = iov_iter_count(iter), n;
557ed1fa
NP
645 if (chunk > PAGE_SIZE)
646 chunk = PAGE_SIZE; /* Just for latency reasons */
13ba33e8
AV
647 n = iov_iter_zero(chunk, iter);
648 if (!n && iov_iter_count(iter))
649 return written ? written : -EFAULT;
650 written += n;
2b838687
LT
651 if (signal_pending(current))
652 return written ? written : -ERESTARTSYS;
1da177e4
LT
653 cond_resched();
654 }
13ba33e8 655 return written;
162934de
ZB
656}
657
d7d4d849 658static int mmap_zero(struct file *file, struct vm_area_struct *vma)
1da177e4 659{
557ed1fa 660#ifndef CONFIG_MMU
1da177e4 661 return -ENOSYS;
557ed1fa
NP
662#endif
663 if (vma->vm_flags & VM_SHARED)
664 return shmem_zero_setup(vma);
665 return 0;
1da177e4 666}
1da177e4 667
d7d4d849 668static ssize_t write_full(struct file *file, const char __user *buf,
1da177e4
LT
669 size_t count, loff_t *ppos)
670{
671 return -ENOSPC;
672}
673
674/*
675 * Special lseek() function for /dev/null and /dev/zero. Most notably, you
676 * can fopen() both devices with "a" now. This was previously impossible.
677 * -- SRB.
678 */
d7d4d849 679static loff_t null_lseek(struct file *file, loff_t offset, int orig)
1da177e4
LT
680{
681 return file->f_pos = 0;
682}
683
684/*
685 * The memory devices use the full 32/64 bits of the offset, and so we cannot
686 * check against negative addresses: they are ok. The return value is weird,
687 * though, in that case (0).
688 *
689 * also note that seeking relative to the "end of file" isn't supported:
690 * it has no meaning, so it returns -EINVAL.
691 */
d7d4d849 692static loff_t memory_lseek(struct file *file, loff_t offset, int orig)
1da177e4
LT
693{
694 loff_t ret;
695
496ad9aa 696 mutex_lock(&file_inode(file)->i_mutex);
1da177e4 697 switch (orig) {
d7d4d849
AM
698 case SEEK_CUR:
699 offset += file->f_pos;
d7d4d849
AM
700 case SEEK_SET:
701 /* to avoid userland mistaking f_pos=-9 as -EBADF=-9 */
71811f32 702 if (IS_ERR_VALUE((unsigned long long)offset)) {
d7d4d849 703 ret = -EOVERFLOW;
1da177e4 704 break;
d7d4d849
AM
705 }
706 file->f_pos = offset;
707 ret = file->f_pos;
708 force_successful_syscall_return();
709 break;
710 default:
711 ret = -EINVAL;
1da177e4 712 }
496ad9aa 713 mutex_unlock(&file_inode(file)->i_mutex);
1da177e4
LT
714 return ret;
715}
716
890537b3 717static int open_port(struct inode *inode, struct file *filp)
1da177e4
LT
718{
719 return capable(CAP_SYS_RAWIO) ? 0 : -EPERM;
720}
721
/*
 * Aliases: the zero and full devices reuse the null device's handlers, and
 * mem/kmem reuse open_port().
 */
722#define zero_lseek null_lseek
723#define full_lseek null_lseek
724#define write_zero write_null
162934de 725#define aio_write_zero aio_write_null
1da177e4
LT
726#define open_mem open_port
727#define open_kmem open_mem
728
62322d25 729static const struct file_operations mem_fops = {
1da177e4
LT
730 .llseek = memory_lseek,
731 .read = read_mem,
732 .write = write_mem,
733 .mmap = mmap_mem,
734 .open = open_mem,
b4caecd4 735#ifndef CONFIG_MMU
5da6185b 736 .get_unmapped_area = get_unmapped_area_mem,
b4caecd4
CH
737 .mmap_capabilities = memory_mmap_capabilities,
738#endif
1da177e4
LT
739};
740
b781ecb6 741#ifdef CONFIG_DEVKMEM
62322d25 742static const struct file_operations kmem_fops = {
1da177e4
LT
743 .llseek = memory_lseek,
744 .read = read_kmem,
745 .write = write_kmem,
746 .mmap = mmap_kmem,
747 .open = open_kmem,
b4caecd4 748#ifndef CONFIG_MMU
5da6185b 749 .get_unmapped_area = get_unmapped_area_mem,
b4caecd4
CH
750 .mmap_capabilities = memory_mmap_capabilities,
751#endif
1da177e4 752};
b781ecb6 753#endif
1da177e4 754
62322d25 755static const struct file_operations null_fops = {
1da177e4
LT
756 .llseek = null_lseek,
757 .read = read_null,
758 .write = write_null,
162934de
ZB
759 .aio_read = aio_read_null,
760 .aio_write = aio_write_null,
1ebd32fc 761 .splice_write = splice_write_null,
1da177e4
LT
762};
763
4f911d64 764#ifdef CONFIG_DEVPORT
62322d25 765static const struct file_operations port_fops = {
1da177e4
LT
766 .llseek = memory_lseek,
767 .read = read_port,
768 .write = write_port,
769 .open = open_port,
770};
771#endif
772
62322d25 773static const struct file_operations zero_fops = {
1da177e4 774 .llseek = zero_lseek,
13ba33e8 775 .read = new_sync_read,
1da177e4 776 .write = write_zero,
13ba33e8 777 .read_iter = read_iter_zero,
162934de 778 .aio_write = aio_write_zero,
1da177e4 779 .mmap = mmap_zero,
b4caecd4
CH
780#ifndef CONFIG_MMU
781 .mmap_capabilities = zero_mmap_capabilities,
782#endif
1da177e4
LT
783};
784
62322d25 785static const struct file_operations full_fops = {
1da177e4 786 .llseek = full_lseek,
13ba33e8
AV
787 .read = new_sync_read,
788 .read_iter = read_iter_zero,
1da177e4
LT
789 .write = write_full,
790};
791
389e0cb9
KS
792static const struct memdev {
793 const char *name;
2c9ede55 794 umode_t mode;
389e0cb9 795 const struct file_operations *fops;
b4caecd4 796 fmode_t fmode;
389e0cb9 797} devlist[] = {
b4caecd4 798 [1] = { "mem", 0, &mem_fops, FMODE_UNSIGNED_OFFSET },
b781ecb6 799#ifdef CONFIG_DEVKMEM
b4caecd4 800 [2] = { "kmem", 0, &kmem_fops, FMODE_UNSIGNED_OFFSET },
b781ecb6 801#endif
b4caecd4 802 [3] = { "null", 0666, &null_fops, 0 },
4f911d64 803#ifdef CONFIG_DEVPORT
b4caecd4 804 [4] = { "port", 0, &port_fops, 0 },
1da177e4 805#endif
b4caecd4
CH
806 [5] = { "zero", 0666, &zero_fops, 0 },
807 [7] = { "full", 0666, &full_fops, 0 },
808 [8] = { "random", 0666, &random_fops, 0 },
809 [9] = { "urandom", 0666, &urandom_fops, 0 },
7f3a781d 810#ifdef CONFIG_PRINTK
b4caecd4 811 [11] = { "kmsg", 0644, &kmsg_fops, 0 },
7f3a781d 812#endif
d6f47bef
ASF
813};
814
815static int memory_open(struct inode *inode, struct file *filp)
816{
389e0cb9
KS
817 int minor;
818 const struct memdev *dev;
d6f47bef 819
389e0cb9
KS
820 minor = iminor(inode);
821 if (minor >= ARRAY_SIZE(devlist))
205153aa 822 return -ENXIO;
d6f47bef 823
389e0cb9
KS
824 dev = &devlist[minor];
825 if (!dev->fops)
205153aa 826 return -ENXIO;
d6f47bef 827
389e0cb9 828 filp->f_op = dev->fops;
b4caecd4 829 filp->f_mode |= dev->fmode;
4a3956c7 830
389e0cb9 831 if (dev->fops->open)
205153aa
FW
832 return dev->fops->open(inode, filp);
833
834 return 0;
1da177e4
LT
835}
836
62322d25 837static const struct file_operations memory_fops = {
d7d4d849 838 .open = memory_open,
6038f373 839 .llseek = noop_llseek,
1da177e4
LT
840};
841
2c9ede55 842static char *mem_devnode(struct device *dev, umode_t *mode)
e454cea2
KS
843{
844 if (mode && devlist[MINOR(dev->devt)].mode)
845 *mode = devlist[MINOR(dev->devt)].mode;
846 return NULL;
847}
848
/* Device class "mem", created in chr_dev_init() for the devlist[] nodes. */
static struct class *mem_class;
1da177e4
LT
850
851static int __init chr_dev_init(void)
852{
389e0cb9 853 int minor;
1da177e4 854
d7d4d849 855 if (register_chrdev(MEM_MAJOR, "mem", &memory_fops))
1da177e4
LT
856 printk("unable to get major %d for memory devs\n", MEM_MAJOR);
857
ca8eca68 858 mem_class = class_create(THIS_MODULE, "mem");
6e191f7b
AB
859 if (IS_ERR(mem_class))
860 return PTR_ERR(mem_class);
861
e454cea2 862 mem_class->devnode = mem_devnode;
389e0cb9
KS
863 for (minor = 1; minor < ARRAY_SIZE(devlist); minor++) {
864 if (!devlist[minor].name)
865 continue;
e1612de9
HM
866
867 /*
890537b3 868 * Create /dev/port?
e1612de9
HM
869 */
870 if ((minor == DEVPORT_MINOR) && !arch_has_dev_port())
871 continue;
872
389e0cb9
KS
873 device_create(mem_class, NULL, MKDEV(MEM_MAJOR, minor),
874 NULL, devlist[minor].name);
875 }
ebf644c4 876
31d1d48e 877 return tty_init();
1da177e4
LT
878}
879
880fs_initcall(chr_dev_init);