Commit | Line | Data |
---|---|---|
62b5f7d0 DH |
1 | /* |
2 | * Intel Memory Protection Keys management | |
3 | * Copyright (c) 2015, Intel Corporation. | |
4 | * | |
5 | * This program is free software; you can redistribute it and/or modify it | |
6 | * under the terms and conditions of the GNU General Public License, | |
7 | * version 2, as published by the Free Software Foundation. | |
8 | * | |
9 | * This program is distributed in the hope it will be useful, but WITHOUT | |
10 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
11 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | |
12 | * more details. | |
13 | */ | |
76de9937 | 14 | #include <linux/debugfs.h> /* debugfs_create_u32() */ |
62b5f7d0 DH |
15 | #include <linux/mm_types.h> /* mm_struct, vma, etc... */ |
16 | #include <linux/pkeys.h> /* PKEY_* */ | |
17 | #include <uapi/asm-generic/mman-common.h> | |
18 | ||
19 | #include <asm/cpufeature.h> /* boot_cpu_has, ... */ | |
20 | #include <asm/mmu_context.h> /* vma_pkey() */ | |
62b5f7d0 DH |
21 | |
22 | int __execute_only_pkey(struct mm_struct *mm) | |
23 | { | |
e8c24d3a DH |
24 | bool need_to_set_mm_pkey = false; |
25 | int execute_only_pkey = mm->context.execute_only_pkey; | |
62b5f7d0 DH |
26 | int ret; |
27 | ||
e8c24d3a DH |
28 | /* Do we need to assign a pkey for mm's execute-only maps? */ |
29 | if (execute_only_pkey == -1) { | |
30 | /* Go allocate one to use, which might fail */ | |
31 | execute_only_pkey = mm_pkey_alloc(mm); | |
32 | if (execute_only_pkey < 0) | |
33 | return -1; | |
34 | need_to_set_mm_pkey = true; | |
35 | } | |
36 | ||
62b5f7d0 DH |
37 | /* |
38 | * We do not want to go through the relatively costly | |
39 | * dance to set PKRU if we do not need to. Check it | |
40 | * first and assume that if the execute-only pkey is | |
41 | * write-disabled that we do not have to set it | |
42 | * ourselves. We need preempt off so that nobody | |
43 | * can make fpregs inactive. | |
44 | */ | |
45 | preempt_disable(); | |
e8c24d3a | 46 | if (!need_to_set_mm_pkey && |
e4a81bfc | 47 | current->thread.fpu.initialized && |
e8c24d3a | 48 | !__pkru_allows_read(read_pkru(), execute_only_pkey)) { |
62b5f7d0 | 49 | preempt_enable(); |
e8c24d3a | 50 | return execute_only_pkey; |
62b5f7d0 DH |
51 | } |
52 | preempt_enable(); | |
e8c24d3a DH |
53 | |
54 | /* | |
55 | * Set up PKRU so that it denies access for everything | |
56 | * other than execution. | |
57 | */ | |
58 | ret = arch_set_user_pkey_access(current, execute_only_pkey, | |
62b5f7d0 DH |
59 | PKEY_DISABLE_ACCESS); |
60 | /* | |
61 | * If the PKRU-set operation failed somehow, just return | |
62 | * 0 and effectively disable execute-only support. | |
63 | */ | |
e8c24d3a DH |
64 | if (ret) { |
65 | mm_set_pkey_free(mm, execute_only_pkey); | |
66 | return -1; | |
67 | } | |
62b5f7d0 | 68 | |
e8c24d3a DH |
69 | /* We got one, store it and use it from here on out */ |
70 | if (need_to_set_mm_pkey) | |
71 | mm->context.execute_only_pkey = execute_only_pkey; | |
72 | return execute_only_pkey; | |
62b5f7d0 DH |
73 | } |
74 | ||
75 | static inline bool vma_is_pkey_exec_only(struct vm_area_struct *vma) | |
76 | { | |
77 | /* Do this check first since the vm_flags should be hot */ | |
78 | if ((vma->vm_flags & (VM_READ | VM_WRITE | VM_EXEC)) != VM_EXEC) | |
79 | return false; | |
e8c24d3a | 80 | if (vma_pkey(vma) != vma->vm_mm->context.execute_only_pkey) |
62b5f7d0 DH |
81 | return false; |
82 | ||
83 | return true; | |
84 | } | |
85 | ||
86 | /* | |
87 | * This is only called for *plain* mprotect calls. | |
88 | */ | |
89 | int __arch_override_mprotect_pkey(struct vm_area_struct *vma, int prot, int pkey) | |
90 | { | |
91 | /* | |
92 | * Is this an mprotect_pkey() call? If so, never | |
93 | * override the value that came from the user. | |
94 | */ | |
95 | if (pkey != -1) | |
96 | return pkey; | |
0a0b1520 | 97 | |
62b5f7d0 DH |
98 | /* |
99 | * The mapping is execute-only. Go try to get the | |
100 | * execute-only protection key. If we fail to do that, | |
101 | * fall through as if we do not have execute-only | |
0a0b1520 | 102 | * support in this mm. |
62b5f7d0 DH |
103 | */ |
104 | if (prot == PROT_EXEC) { | |
105 | pkey = execute_only_pkey(vma->vm_mm); | |
106 | if (pkey > 0) | |
107 | return pkey; | |
0a0b1520 DH |
108 | } else if (vma_is_pkey_exec_only(vma)) { |
109 | /* | |
110 | * Protections are *not* PROT_EXEC, but the mapping | |
111 | * is using the exec-only pkey. This mapping was | |
112 | * PROT_EXEC and will no longer be. Move back to | |
113 | * the default pkey. | |
114 | */ | |
115 | return ARCH_DEFAULT_PKEY; | |
62b5f7d0 | 116 | } |
0a0b1520 | 117 | |
62b5f7d0 DH |
118 | /* |
119 | * This is a vanilla, non-pkey mprotect (or we failed to | |
120 | * setup execute-only), inherit the pkey from the VMA we | |
121 | * are working on. | |
122 | */ | |
123 | return vma_pkey(vma); | |
124 | } | |
acd547b2 DH |
125 | |
126 | #define PKRU_AD_KEY(pkey) (PKRU_AD_BIT << ((pkey) * PKRU_BITS_PER_PKEY)) | |
127 | ||
128 | /* | |
129 | * Make the default PKRU value (at execve() time) as restrictive | |
130 | * as possible. This ensures that any threads clone()'d early | |
131 | * in the process's lifetime will not accidentally get access | |
132 | * to data which is pkey-protected later on. | |
133 | */ | |
134 | u32 init_pkru_value = PKRU_AD_KEY( 1) | PKRU_AD_KEY( 2) | PKRU_AD_KEY( 3) | | |
135 | PKRU_AD_KEY( 4) | PKRU_AD_KEY( 5) | PKRU_AD_KEY( 6) | | |
136 | PKRU_AD_KEY( 7) | PKRU_AD_KEY( 8) | PKRU_AD_KEY( 9) | | |
137 | PKRU_AD_KEY(10) | PKRU_AD_KEY(11) | PKRU_AD_KEY(12) | | |
138 | PKRU_AD_KEY(13) | PKRU_AD_KEY(14) | PKRU_AD_KEY(15); | |
139 | ||
140 | /* | |
141 | * Called from the FPU code when creating a fresh set of FPU | |
142 | * registers. This is called from a very specific context where | |
143 | * we know the FPU regstiers are safe for use and we can use PKRU | |
e6365084 | 144 | * directly. |
acd547b2 DH |
145 | */ |
146 | void copy_init_pkru_to_fpregs(void) | |
147 | { | |
148 | u32 init_pkru_value_snapshot = READ_ONCE(init_pkru_value); | |
149 | /* | |
150 | * Any write to PKRU takes it out of the XSAVE 'init | |
151 | * state' which increases context switch cost. Avoid | |
152 | * writing 0 when PKRU was already 0. | |
153 | */ | |
154 | if (!init_pkru_value_snapshot && !read_pkru()) | |
155 | return; | |
156 | /* | |
157 | * Override the PKRU state that came from 'init_fpstate' | |
158 | * with the baseline from the process. | |
159 | */ | |
160 | write_pkru(init_pkru_value_snapshot); | |
161 | } | |
76de9937 DH |
162 | |
163 | static ssize_t init_pkru_read_file(struct file *file, char __user *user_buf, | |
164 | size_t count, loff_t *ppos) | |
165 | { | |
166 | char buf[32]; | |
167 | unsigned int len; | |
168 | ||
169 | len = sprintf(buf, "0x%x\n", init_pkru_value); | |
170 | return simple_read_from_buffer(user_buf, count, ppos, buf, len); | |
171 | } | |
172 | ||
173 | static ssize_t init_pkru_write_file(struct file *file, | |
174 | const char __user *user_buf, size_t count, loff_t *ppos) | |
175 | { | |
176 | char buf[32]; | |
177 | ssize_t len; | |
178 | u32 new_init_pkru; | |
179 | ||
180 | len = min(count, sizeof(buf) - 1); | |
181 | if (copy_from_user(buf, user_buf, len)) | |
182 | return -EFAULT; | |
183 | ||
184 | /* Make the buffer a valid string that we can not overrun */ | |
185 | buf[len] = '\0'; | |
186 | if (kstrtouint(buf, 0, &new_init_pkru)) | |
187 | return -EINVAL; | |
188 | ||
189 | /* | |
190 | * Don't allow insane settings that will blow the system | |
191 | * up immediately if someone attempts to disable access | |
192 | * or writes to pkey 0. | |
193 | */ | |
194 | if (new_init_pkru & (PKRU_AD_BIT|PKRU_WD_BIT)) | |
195 | return -EINVAL; | |
196 | ||
197 | WRITE_ONCE(init_pkru_value, new_init_pkru); | |
198 | return count; | |
199 | } | |
200 | ||
201 | static const struct file_operations fops_init_pkru = { | |
202 | .read = init_pkru_read_file, | |
203 | .write = init_pkru_write_file, | |
204 | .llseek = default_llseek, | |
205 | }; | |
206 | ||
207 | static int __init create_init_pkru_value(void) | |
208 | { | |
209 | debugfs_create_file("init_pkru", S_IRUSR | S_IWUSR, | |
210 | arch_debugfs_dir, NULL, &fops_init_pkru); | |
211 | return 0; | |
212 | } | |
213 | late_initcall(create_init_pkru_value); | |
214 | ||
215 | static __init int setup_init_pkru(char *opt) | |
216 | { | |
217 | u32 new_init_pkru; | |
218 | ||
219 | if (kstrtouint(opt, 0, &new_init_pkru)) | |
220 | return 1; | |
221 | ||
222 | WRITE_ONCE(init_pkru_value, new_init_pkru); | |
223 | ||
224 | return 1; | |
225 | } | |
226 | __setup("init_pkru=", setup_init_pkru); |