x86: introduce /dev/mem restrictions with a config option
[linux-block.git] / drivers / char / mem.c
CommitLineData
1da177e4
LT
1/*
2 * linux/drivers/char/mem.c
3 *
4 * Copyright (C) 1991, 1992 Linus Torvalds
5 *
6 * Added devfs support.
7 * Jan-11-1998, C. Scott Ananian <cananian@alumni.princeton.edu>
8 * Shared /dev/zero mmaping support, Feb 2000, Kanoj Sarcar <kanoj@sgi.com>
9 */
10
1da177e4
LT
11#include <linux/mm.h>
12#include <linux/miscdevice.h>
13#include <linux/slab.h>
14#include <linux/vmalloc.h>
15#include <linux/mman.h>
16#include <linux/random.h>
17#include <linux/init.h>
18#include <linux/raw.h>
19#include <linux/tty.h>
20#include <linux/capability.h>
1da177e4
LT
21#include <linux/ptrace.h>
22#include <linux/device.h>
50b1fdbd
VG
23#include <linux/highmem.h>
24#include <linux/crash_dump.h>
1da177e4 25#include <linux/backing-dev.h>
315c215c 26#include <linux/bootmem.h>
d6b29d7c 27#include <linux/splice.h>
b8a3ad5b 28#include <linux/pfn.h>
1da177e4
LT
29
30#include <asm/uaccess.h>
31#include <asm/io.h>
32
33#ifdef CONFIG_IA64
34# include <linux/efi.h>
35#endif
36
1da177e4
LT
37/*
38 * Architectures vary in how they handle caching for addresses
39 * outside of main memory.
40 *
41 */
42static inline int uncached_access(struct file *file, unsigned long addr)
43{
ca5cd877 44#if defined(__i386__) && !defined(__arch_um__)
1da177e4
LT
45 /*
46 * On the PPro and successors, the MTRRs are used to set
47 * memory types for physical addresses outside main memory,
48 * so blindly setting PCD or PWT on those pages is wrong.
49 * For Pentiums and earlier, the surround logic should disable
50 * caching for the high addresses through the KEN pin, but
51 * we maintain the tradition of paranoia in this code.
52 */
53 if (file->f_flags & O_SYNC)
54 return 1;
55 return !( test_bit(X86_FEATURE_MTRR, boot_cpu_data.x86_capability) ||
56 test_bit(X86_FEATURE_K6_MTRR, boot_cpu_data.x86_capability) ||
57 test_bit(X86_FEATURE_CYRIX_ARR, boot_cpu_data.x86_capability) ||
58 test_bit(X86_FEATURE_CENTAUR_MCR, boot_cpu_data.x86_capability) )
59 && addr >= __pa(high_memory);
ca5cd877 60#elif defined(__x86_64__) && !defined(__arch_um__)
1da177e4
LT
61 /*
62 * This is broken because it can generate memory type aliases,
63 * which can cause cache corruptions
64 * But it is only available for root and we have to be bug-to-bug
65 * compatible with i386.
66 */
67 if (file->f_flags & O_SYNC)
68 return 1;
69 /* same behaviour as i386. PAT always set to cached and MTRRs control the
70 caching behaviour.
71 Hopefully a full PAT implementation will fix that soon. */
72 return 0;
73#elif defined(CONFIG_IA64)
74 /*
75 * On ia64, we ignore O_SYNC because we cannot tolerate memory attribute aliases.
76 */
77 return !(efi_mem_attributes(addr) & EFI_MEMORY_WB);
24e9d0b9
RB
78#elif defined(CONFIG_MIPS)
79 {
80 extern int __uncached_access(struct file *file,
81 unsigned long addr);
82
83 return __uncached_access(file, addr);
84 }
1da177e4
LT
85#else
86 /*
87 * Accessing memory above the top the kernel knows about or through a file pointer
88 * that was marked O_SYNC will be done non-cached.
89 */
90 if (file->f_flags & O_SYNC)
91 return 1;
92 return addr >= __pa(high_memory);
93#endif
94}
95
96#ifndef ARCH_HAS_VALID_PHYS_ADDR_RANGE
136939a2 97static inline int valid_phys_addr_range(unsigned long addr, size_t count)
1da177e4 98{
136939a2 99 if (addr + count > __pa(high_memory))
1da177e4
LT
100 return 0;
101
1da177e4
LT
102 return 1;
103}
80851ef2 104
06c67bef 105static inline int valid_mmap_phys_addr_range(unsigned long pfn, size_t size)
80851ef2
BH
106{
107 return 1;
108}
1da177e4
LT
109#endif
110
ae531c26
AV
111#ifdef CONFIG_NONPROMISC_DEVMEM
112static inline int range_is_allowed(unsigned long from, unsigned long to)
113{
114 unsigned long cursor;
115
116 cursor = from >> PAGE_SHIFT;
117 while ((cursor << PAGE_SHIFT) < to) {
118 if (!devmem_is_allowed(cursor)) {
119 printk(KERN_INFO "Program %s tried to read /dev/mem "
120 "between %lx->%lx.\n",
121 current->comm, from, to);
122 return 0;
123 }
124 cursor++;
125 }
126 return 1;
127}
128#else
129static inline int range_is_allowed(unsigned long from, unsigned long to)
130{
131 return 1;
132}
133#endif
134
1da177e4
LT
135/*
136 * This funcion reads the *physical* memory. The f_pos points directly to the
137 * memory location.
138 */
139static ssize_t read_mem(struct file * file, char __user * buf,
140 size_t count, loff_t *ppos)
141{
142 unsigned long p = *ppos;
143 ssize_t read, sz;
144 char *ptr;
145
136939a2 146 if (!valid_phys_addr_range(p, count))
1da177e4
LT
147 return -EFAULT;
148 read = 0;
149#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
150 /* we don't have page 0 mapped on sparc and m68k.. */
151 if (p < PAGE_SIZE) {
152 sz = PAGE_SIZE - p;
153 if (sz > count)
154 sz = count;
155 if (sz > 0) {
156 if (clear_user(buf, sz))
157 return -EFAULT;
158 buf += sz;
159 p += sz;
160 count -= sz;
161 read += sz;
162 }
163 }
164#endif
165
166 while (count > 0) {
167 /*
168 * Handle first page in case it's not aligned
169 */
170 if (-p & (PAGE_SIZE - 1))
171 sz = -p & (PAGE_SIZE - 1);
172 else
173 sz = PAGE_SIZE;
174
175 sz = min_t(unsigned long, sz, count);
176
177 /*
178 * On ia64 if a page has been mapped somewhere as
179 * uncached, then it must also be accessed uncached
180 * by the kernel or data corruption may occur
181 */
182 ptr = xlate_dev_mem_ptr(p);
183
ae531c26
AV
184 if (!range_is_allowed(p, p+count))
185 return -EPERM;
1da177e4
LT
186 if (copy_to_user(buf, ptr, sz))
187 return -EFAULT;
188 buf += sz;
189 p += sz;
190 count -= sz;
191 read += sz;
192 }
193
194 *ppos += read;
195 return read;
196}
197
198static ssize_t write_mem(struct file * file, const char __user * buf,
199 size_t count, loff_t *ppos)
200{
201 unsigned long p = *ppos;
202 ssize_t written, sz;
203 unsigned long copied;
204 void *ptr;
205
136939a2 206 if (!valid_phys_addr_range(p, count))
1da177e4
LT
207 return -EFAULT;
208
209 written = 0;
210
211#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
212 /* we don't have page 0 mapped on sparc and m68k.. */
213 if (p < PAGE_SIZE) {
214 unsigned long sz = PAGE_SIZE - p;
215 if (sz > count)
216 sz = count;
217 /* Hmm. Do something? */
218 buf += sz;
219 p += sz;
220 count -= sz;
221 written += sz;
222 }
223#endif
224
225 while (count > 0) {
226 /*
227 * Handle first page in case it's not aligned
228 */
229 if (-p & (PAGE_SIZE - 1))
230 sz = -p & (PAGE_SIZE - 1);
231 else
232 sz = PAGE_SIZE;
233
234 sz = min_t(unsigned long, sz, count);
235
236 /*
237 * On ia64 if a page has been mapped somewhere as
238 * uncached, then it must also be accessed uncached
239 * by the kernel or data corruption may occur
240 */
241 ptr = xlate_dev_mem_ptr(p);
242
ae531c26
AV
243 if (!range_is_allowed(p, p+sz))
244 return -EPERM;
1da177e4
LT
245 copied = copy_from_user(ptr, buf, sz);
246 if (copied) {
c654d60e
JB
247 written += sz - copied;
248 if (written)
249 break;
1da177e4
LT
250 return -EFAULT;
251 }
252 buf += sz;
253 p += sz;
254 count -= sz;
255 written += sz;
256 }
257
258 *ppos += written;
259 return written;
260}
261
44ac8413
BH
262#ifndef __HAVE_PHYS_MEM_ACCESS_PROT
263static pgprot_t phys_mem_access_prot(struct file *file, unsigned long pfn,
264 unsigned long size, pgprot_t vma_prot)
265{
266#ifdef pgprot_noncached
267 unsigned long offset = pfn << PAGE_SHIFT;
268
269 if (uncached_access(file, offset))
270 return pgprot_noncached(vma_prot);
271#endif
272 return vma_prot;
273}
274#endif
275
5da6185b
DH
276#ifndef CONFIG_MMU
277static unsigned long get_unmapped_area_mem(struct file *file,
278 unsigned long addr,
279 unsigned long len,
280 unsigned long pgoff,
281 unsigned long flags)
282{
283 if (!valid_mmap_phys_addr_range(pgoff, len))
284 return (unsigned long) -EINVAL;
8a93258c 285 return pgoff << PAGE_SHIFT;
5da6185b
DH
286}
287
288/* can't do an in-place private mapping if there's no MMU */
289static inline int private_mapping_ok(struct vm_area_struct *vma)
290{
291 return vma->vm_flags & VM_MAYSHARE;
292}
293#else
294#define get_unmapped_area_mem NULL
295
296static inline int private_mapping_ok(struct vm_area_struct *vma)
297{
298 return 1;
299}
300#endif
301
1da177e4
LT
302static int mmap_mem(struct file * file, struct vm_area_struct * vma)
303{
80851ef2
BH
304 size_t size = vma->vm_end - vma->vm_start;
305
06c67bef 306 if (!valid_mmap_phys_addr_range(vma->vm_pgoff, size))
80851ef2
BH
307 return -EINVAL;
308
5da6185b
DH
309 if (!private_mapping_ok(vma))
310 return -ENOSYS;
311
8b150478 312 vma->vm_page_prot = phys_mem_access_prot(file, vma->vm_pgoff,
80851ef2 313 size,
1da177e4 314 vma->vm_page_prot);
1da177e4
LT
315
316 /* Remap-pfn-range will mark the range VM_IO and VM_RESERVED */
317 if (remap_pfn_range(vma,
318 vma->vm_start,
319 vma->vm_pgoff,
80851ef2 320 size,
1da177e4
LT
321 vma->vm_page_prot))
322 return -EAGAIN;
323 return 0;
324}
325
326static int mmap_kmem(struct file * file, struct vm_area_struct * vma)
327{
4bb82551
LT
328 unsigned long pfn;
329
6d3154cc
LT
330 /* Turn a kernel-virtual address into a physical page frame */
331 pfn = __pa((u64)vma->vm_pgoff << PAGE_SHIFT) >> PAGE_SHIFT;
4bb82551 332
1da177e4
LT
333 /*
334 * RED-PEN: on some architectures there is more mapped memory
335 * than available in mem_map which pfn_valid checks
336 * for. Perhaps should add a new macro here.
337 *
338 * RED-PEN: vmalloc is not supported right now.
339 */
4bb82551 340 if (!pfn_valid(pfn))
1da177e4 341 return -EIO;
4bb82551
LT
342
343 vma->vm_pgoff = pfn;
1da177e4
LT
344 return mmap_mem(file, vma);
345}
346
50b1fdbd
VG
347#ifdef CONFIG_CRASH_DUMP
348/*
349 * Read memory corresponding to the old kernel.
50b1fdbd 350 */
315c215c 351static ssize_t read_oldmem(struct file *file, char __user *buf,
50b1fdbd
VG
352 size_t count, loff_t *ppos)
353{
315c215c
VG
354 unsigned long pfn, offset;
355 size_t read = 0, csize;
356 int rc = 0;
50b1fdbd 357
72414d3f 358 while (count) {
50b1fdbd 359 pfn = *ppos / PAGE_SIZE;
315c215c
VG
360 if (pfn > saved_max_pfn)
361 return read;
50b1fdbd 362
315c215c
VG
363 offset = (unsigned long)(*ppos % PAGE_SIZE);
364 if (count > PAGE_SIZE - offset)
365 csize = PAGE_SIZE - offset;
366 else
367 csize = count;
50b1fdbd 368
315c215c
VG
369 rc = copy_oldmem_page(pfn, buf, csize, offset, 1);
370 if (rc < 0)
371 return rc;
50b1fdbd
VG
372 buf += csize;
373 *ppos += csize;
374 read += csize;
375 count -= csize;
376 }
50b1fdbd
VG
377 return read;
378}
379#endif
380
1da177e4
LT
381extern long vread(char *buf, char *addr, unsigned long count);
382extern long vwrite(char *buf, char *addr, unsigned long count);
383
384/*
385 * This function reads the *virtual* memory as seen by the kernel.
386 */
387static ssize_t read_kmem(struct file *file, char __user *buf,
388 size_t count, loff_t *ppos)
389{
390 unsigned long p = *ppos;
391 ssize_t low_count, read, sz;
392 char * kbuf; /* k-addr because vread() takes vmlist_lock rwlock */
393
394 read = 0;
395 if (p < (unsigned long) high_memory) {
396 low_count = count;
397 if (count > (unsigned long) high_memory - p)
398 low_count = (unsigned long) high_memory - p;
399
400#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
401 /* we don't have page 0 mapped on sparc and m68k.. */
402 if (p < PAGE_SIZE && low_count > 0) {
403 size_t tmp = PAGE_SIZE - p;
404 if (tmp > low_count) tmp = low_count;
405 if (clear_user(buf, tmp))
406 return -EFAULT;
407 buf += tmp;
408 p += tmp;
409 read += tmp;
410 low_count -= tmp;
411 count -= tmp;
412 }
413#endif
414 while (low_count > 0) {
415 /*
416 * Handle first page in case it's not aligned
417 */
418 if (-p & (PAGE_SIZE - 1))
419 sz = -p & (PAGE_SIZE - 1);
420 else
421 sz = PAGE_SIZE;
422
423 sz = min_t(unsigned long, sz, low_count);
424
425 /*
426 * On ia64 if a page has been mapped somewhere as
427 * uncached, then it must also be accessed uncached
428 * by the kernel or data corruption may occur
429 */
430 kbuf = xlate_dev_kmem_ptr((char *)p);
431
432 if (copy_to_user(buf, kbuf, sz))
433 return -EFAULT;
434 buf += sz;
435 p += sz;
436 read += sz;
437 low_count -= sz;
438 count -= sz;
439 }
440 }
441
442 if (count > 0) {
443 kbuf = (char *)__get_free_page(GFP_KERNEL);
444 if (!kbuf)
445 return -ENOMEM;
446 while (count > 0) {
447 int len = count;
448
449 if (len > PAGE_SIZE)
450 len = PAGE_SIZE;
451 len = vread(kbuf, (char *)p, len);
452 if (!len)
453 break;
454 if (copy_to_user(buf, kbuf, len)) {
455 free_page((unsigned long)kbuf);
456 return -EFAULT;
457 }
458 count -= len;
459 buf += len;
460 read += len;
461 p += len;
462 }
463 free_page((unsigned long)kbuf);
464 }
465 *ppos = p;
466 return read;
467}
468
469
470static inline ssize_t
471do_write_kmem(void *p, unsigned long realp, const char __user * buf,
472 size_t count, loff_t *ppos)
473{
474 ssize_t written, sz;
475 unsigned long copied;
476
477 written = 0;
478#ifdef __ARCH_HAS_NO_PAGE_ZERO_MAPPED
479 /* we don't have page 0 mapped on sparc and m68k.. */
480 if (realp < PAGE_SIZE) {
481 unsigned long sz = PAGE_SIZE - realp;
482 if (sz > count)
483 sz = count;
484 /* Hmm. Do something? */
485 buf += sz;
486 p += sz;
487 realp += sz;
488 count -= sz;
489 written += sz;
490 }
491#endif
492
493 while (count > 0) {
494 char *ptr;
495 /*
496 * Handle first page in case it's not aligned
497 */
498 if (-realp & (PAGE_SIZE - 1))
499 sz = -realp & (PAGE_SIZE - 1);
500 else
501 sz = PAGE_SIZE;
502
503 sz = min_t(unsigned long, sz, count);
504
505 /*
506 * On ia64 if a page has been mapped somewhere as
507 * uncached, then it must also be accessed uncached
508 * by the kernel or data corruption may occur
509 */
510 ptr = xlate_dev_kmem_ptr(p);
511
512 copied = copy_from_user(ptr, buf, sz);
513 if (copied) {
c654d60e
JB
514 written += sz - copied;
515 if (written)
516 break;
1da177e4
LT
517 return -EFAULT;
518 }
519 buf += sz;
520 p += sz;
521 realp += sz;
522 count -= sz;
523 written += sz;
524 }
525
526 *ppos += written;
527 return written;
528}
529
530
531/*
532 * This function writes to the *virtual* memory as seen by the kernel.
533 */
534static ssize_t write_kmem(struct file * file, const char __user * buf,
535 size_t count, loff_t *ppos)
536{
537 unsigned long p = *ppos;
538 ssize_t wrote = 0;
539 ssize_t virtr = 0;
540 ssize_t written;
541 char * kbuf; /* k-addr because vwrite() takes vmlist_lock rwlock */
542
543 if (p < (unsigned long) high_memory) {
544
545 wrote = count;
546 if (count > (unsigned long) high_memory - p)
547 wrote = (unsigned long) high_memory - p;
548
549 written = do_write_kmem((void*)p, p, buf, wrote, ppos);
550 if (written != wrote)
551 return written;
552 wrote = written;
553 p += wrote;
554 buf += wrote;
555 count -= wrote;
556 }
557
558 if (count > 0) {
559 kbuf = (char *)__get_free_page(GFP_KERNEL);
560 if (!kbuf)
561 return wrote ? wrote : -ENOMEM;
562 while (count > 0) {
563 int len = count;
564
565 if (len > PAGE_SIZE)
566 len = PAGE_SIZE;
567 if (len) {
568 written = copy_from_user(kbuf, buf, len);
569 if (written) {
c654d60e
JB
570 if (wrote + virtr)
571 break;
1da177e4 572 free_page((unsigned long)kbuf);
c654d60e 573 return -EFAULT;
1da177e4
LT
574 }
575 }
576 len = vwrite(kbuf, (char *)p, len);
577 count -= len;
578 buf += len;
579 virtr += len;
580 p += len;
581 }
582 free_page((unsigned long)kbuf);
583 }
584
585 *ppos = p;
586 return virtr + wrote;
587}
588
4f911d64 589#ifdef CONFIG_DEVPORT
1da177e4
LT
590static ssize_t read_port(struct file * file, char __user * buf,
591 size_t count, loff_t *ppos)
592{
593 unsigned long i = *ppos;
594 char __user *tmp = buf;
595
596 if (!access_ok(VERIFY_WRITE, buf, count))
597 return -EFAULT;
598 while (count-- > 0 && i < 65536) {
599 if (__put_user(inb(i),tmp) < 0)
600 return -EFAULT;
601 i++;
602 tmp++;
603 }
604 *ppos = i;
605 return tmp-buf;
606}
607
608static ssize_t write_port(struct file * file, const char __user * buf,
609 size_t count, loff_t *ppos)
610{
611 unsigned long i = *ppos;
612 const char __user * tmp = buf;
613
614 if (!access_ok(VERIFY_READ,buf,count))
615 return -EFAULT;
616 while (count-- > 0 && i < 65536) {
617 char c;
c654d60e
JB
618 if (__get_user(c, tmp)) {
619 if (tmp > buf)
620 break;
1da177e4 621 return -EFAULT;
c654d60e 622 }
1da177e4
LT
623 outb(c,i);
624 i++;
625 tmp++;
626 }
627 *ppos = i;
628 return tmp-buf;
629}
630#endif
631
632static ssize_t read_null(struct file * file, char __user * buf,
633 size_t count, loff_t *ppos)
634{
635 return 0;
636}
637
638static ssize_t write_null(struct file * file, const char __user * buf,
639 size_t count, loff_t *ppos)
640{
641 return count;
642}
643
1ebd32fc
JA
644static int pipe_to_null(struct pipe_inode_info *info, struct pipe_buffer *buf,
645 struct splice_desc *sd)
646{
647 return sd->len;
648}
649
650static ssize_t splice_write_null(struct pipe_inode_info *pipe,struct file *out,
651 loff_t *ppos, size_t len, unsigned int flags)
652{
653 return splice_from_pipe(pipe, out, ppos, len, flags, pipe_to_null);
654}
655
1da177e4
LT
656static ssize_t read_zero(struct file * file, char __user * buf,
657 size_t count, loff_t *ppos)
658{
557ed1fa 659 size_t written;
1da177e4
LT
660
661 if (!count)
662 return 0;
663
664 if (!access_ok(VERIFY_WRITE, buf, count))
665 return -EFAULT;
666
557ed1fa
NP
667 written = 0;
668 while (count) {
669 unsigned long unwritten;
670 size_t chunk = count;
1da177e4 671
557ed1fa
NP
672 if (chunk > PAGE_SIZE)
673 chunk = PAGE_SIZE; /* Just for latency reasons */
674 unwritten = clear_user(buf, chunk);
675 written += chunk - unwritten;
1da177e4 676 if (unwritten)
557ed1fa 677 break;
1da177e4 678 buf += chunk;
557ed1fa 679 count -= chunk;
1da177e4
LT
680 cond_resched();
681 }
557ed1fa 682 return written ? written : -EFAULT;
1da177e4
LT
683}
684
685static int mmap_zero(struct file * file, struct vm_area_struct * vma)
686{
557ed1fa 687#ifndef CONFIG_MMU
1da177e4 688 return -ENOSYS;
557ed1fa
NP
689#endif
690 if (vma->vm_flags & VM_SHARED)
691 return shmem_zero_setup(vma);
692 return 0;
1da177e4 693}
1da177e4
LT
694
695static ssize_t write_full(struct file * file, const char __user * buf,
696 size_t count, loff_t *ppos)
697{
698 return -ENOSPC;
699}
700
701/*
702 * Special lseek() function for /dev/null and /dev/zero. Most notably, you
703 * can fopen() both devices with "a" now. This was previously impossible.
704 * -- SRB.
705 */
706
707static loff_t null_lseek(struct file * file, loff_t offset, int orig)
708{
709 return file->f_pos = 0;
710}
711
712/*
713 * The memory devices use the full 32/64 bits of the offset, and so we cannot
714 * check against negative addresses: they are ok. The return value is weird,
715 * though, in that case (0).
716 *
717 * also note that seeking relative to the "end of file" isn't supported:
718 * it has no meaning, so it returns -EINVAL.
719 */
720static loff_t memory_lseek(struct file * file, loff_t offset, int orig)
721{
722 loff_t ret;
723
a7113a96 724 mutex_lock(&file->f_path.dentry->d_inode->i_mutex);
1da177e4
LT
725 switch (orig) {
726 case 0:
727 file->f_pos = offset;
728 ret = file->f_pos;
729 force_successful_syscall_return();
730 break;
731 case 1:
732 file->f_pos += offset;
733 ret = file->f_pos;
734 force_successful_syscall_return();
735 break;
736 default:
737 ret = -EINVAL;
738 }
a7113a96 739 mutex_unlock(&file->f_path.dentry->d_inode->i_mutex);
1da177e4
LT
740 return ret;
741}
742
743static int open_port(struct inode * inode, struct file * filp)
744{
745 return capable(CAP_SYS_RAWIO) ? 0 : -EPERM;
746}
747
748#define zero_lseek null_lseek
749#define full_lseek null_lseek
750#define write_zero write_null
751#define read_full read_zero
752#define open_mem open_port
753#define open_kmem open_mem
50b1fdbd 754#define open_oldmem open_mem
1da177e4 755
62322d25 756static const struct file_operations mem_fops = {
1da177e4
LT
757 .llseek = memory_lseek,
758 .read = read_mem,
759 .write = write_mem,
760 .mmap = mmap_mem,
761 .open = open_mem,
5da6185b 762 .get_unmapped_area = get_unmapped_area_mem,
1da177e4
LT
763};
764
62322d25 765static const struct file_operations kmem_fops = {
1da177e4
LT
766 .llseek = memory_lseek,
767 .read = read_kmem,
768 .write = write_kmem,
769 .mmap = mmap_kmem,
770 .open = open_kmem,
5da6185b 771 .get_unmapped_area = get_unmapped_area_mem,
1da177e4
LT
772};
773
62322d25 774static const struct file_operations null_fops = {
1da177e4
LT
775 .llseek = null_lseek,
776 .read = read_null,
777 .write = write_null,
1ebd32fc 778 .splice_write = splice_write_null,
1da177e4
LT
779};
780
4f911d64 781#ifdef CONFIG_DEVPORT
62322d25 782static const struct file_operations port_fops = {
1da177e4
LT
783 .llseek = memory_lseek,
784 .read = read_port,
785 .write = write_port,
786 .open = open_port,
787};
788#endif
789
62322d25 790static const struct file_operations zero_fops = {
1da177e4
LT
791 .llseek = zero_lseek,
792 .read = read_zero,
793 .write = write_zero,
794 .mmap = mmap_zero,
795};
796
5da6185b
DH
797/*
798 * capabilities for /dev/zero
799 * - permits private mappings, "copies" are taken of the source of zeros
800 */
1da177e4
LT
801static struct backing_dev_info zero_bdi = {
802 .capabilities = BDI_CAP_MAP_COPY,
803};
804
62322d25 805static const struct file_operations full_fops = {
1da177e4
LT
806 .llseek = full_lseek,
807 .read = read_full,
808 .write = write_full,
809};
810
50b1fdbd 811#ifdef CONFIG_CRASH_DUMP
62322d25 812static const struct file_operations oldmem_fops = {
50b1fdbd
VG
813 .read = read_oldmem,
814 .open = open_oldmem,
815};
816#endif
817
1da177e4
LT
818static ssize_t kmsg_write(struct file * file, const char __user * buf,
819 size_t count, loff_t *ppos)
820{
821 char *tmp;
cd140a5c 822 ssize_t ret;
1da177e4
LT
823
824 tmp = kmalloc(count + 1, GFP_KERNEL);
825 if (tmp == NULL)
826 return -ENOMEM;
827 ret = -EFAULT;
828 if (!copy_from_user(tmp, buf, count)) {
829 tmp[count] = 0;
830 ret = printk("%s", tmp);
cd140a5c
GC
831 if (ret > count)
832 /* printk can add a prefix */
833 ret = count;
1da177e4
LT
834 }
835 kfree(tmp);
836 return ret;
837}
838
62322d25 839static const struct file_operations kmsg_fops = {
1da177e4
LT
840 .write = kmsg_write,
841};
842
843static int memory_open(struct inode * inode, struct file * filp)
844{
845 switch (iminor(inode)) {
846 case 1:
847 filp->f_op = &mem_fops;
5da6185b
DH
848 filp->f_mapping->backing_dev_info =
849 &directly_mappable_cdev_bdi;
1da177e4
LT
850 break;
851 case 2:
852 filp->f_op = &kmem_fops;
5da6185b
DH
853 filp->f_mapping->backing_dev_info =
854 &directly_mappable_cdev_bdi;
1da177e4
LT
855 break;
856 case 3:
857 filp->f_op = &null_fops;
858 break;
4f911d64 859#ifdef CONFIG_DEVPORT
1da177e4
LT
860 case 4:
861 filp->f_op = &port_fops;
862 break;
863#endif
864 case 5:
865 filp->f_mapping->backing_dev_info = &zero_bdi;
866 filp->f_op = &zero_fops;
867 break;
868 case 7:
869 filp->f_op = &full_fops;
870 break;
871 case 8:
872 filp->f_op = &random_fops;
873 break;
874 case 9:
875 filp->f_op = &urandom_fops;
876 break;
877 case 11:
878 filp->f_op = &kmsg_fops;
879 break;
50b1fdbd
VG
880#ifdef CONFIG_CRASH_DUMP
881 case 12:
882 filp->f_op = &oldmem_fops;
883 break;
884#endif
1da177e4
LT
885 default:
886 return -ENXIO;
887 }
888 if (filp->f_op && filp->f_op->open)
889 return filp->f_op->open(inode,filp);
890 return 0;
891}
892
62322d25 893static const struct file_operations memory_fops = {
1da177e4
LT
894 .open = memory_open, /* just a selector for the real open */
895};
896
897static const struct {
898 unsigned int minor;
899 char *name;
900 umode_t mode;
99ac48f5 901 const struct file_operations *fops;
1da177e4
LT
902} devlist[] = { /* list of minor devices */
903 {1, "mem", S_IRUSR | S_IWUSR | S_IRGRP, &mem_fops},
904 {2, "kmem", S_IRUSR | S_IWUSR | S_IRGRP, &kmem_fops},
905 {3, "null", S_IRUGO | S_IWUGO, &null_fops},
4f911d64 906#ifdef CONFIG_DEVPORT
1da177e4
LT
907 {4, "port", S_IRUSR | S_IWUSR | S_IRGRP, &port_fops},
908#endif
909 {5, "zero", S_IRUGO | S_IWUGO, &zero_fops},
910 {7, "full", S_IRUGO | S_IWUGO, &full_fops},
911 {8, "random", S_IRUGO | S_IWUSR, &random_fops},
912 {9, "urandom", S_IRUGO | S_IWUSR, &urandom_fops},
913 {11,"kmsg", S_IRUGO | S_IWUSR, &kmsg_fops},
50b1fdbd
VG
914#ifdef CONFIG_CRASH_DUMP
915 {12,"oldmem", S_IRUSR | S_IWUSR | S_IRGRP, &oldmem_fops},
916#endif
1da177e4
LT
917};
918
ca8eca68 919static struct class *mem_class;
1da177e4
LT
920
921static int __init chr_dev_init(void)
922{
923 int i;
e0bf68dd
PZ
924 int err;
925
926 err = bdi_init(&zero_bdi);
927 if (err)
928 return err;
1da177e4
LT
929
930 if (register_chrdev(MEM_MAJOR,"mem",&memory_fops))
931 printk("unable to get major %d for memory devs\n", MEM_MAJOR);
932
ca8eca68 933 mem_class = class_create(THIS_MODULE, "mem");
7c69ef79 934 for (i = 0; i < ARRAY_SIZE(devlist); i++)
ebf644c4
GKH
935 device_create(mem_class, NULL,
936 MKDEV(MEM_MAJOR, devlist[i].minor),
937 devlist[i].name);
938
1da177e4
LT
939 return 0;
940}
941
942fs_initcall(chr_dev_init);