Commit | Line | Data |
---|---|---|
e01402b1 RB |
1 | /* |
2 | * Copyright (C) 2004, 2005 MIPS Technologies, Inc. All rights reserved. | |
3 | * | |
4 | * This program is free software; you can distribute it and/or modify it | |
5 | * under the terms of the GNU General Public License (Version 2) as | |
6 | * published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope it will be useful, but WITHOUT | |
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License | |
11 | * for more details. | |
12 | * | |
13 | * You should have received a copy of the GNU General Public License along | |
14 | * with this program; if not, write to the Free Software Foundation, Inc., | |
15 | * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA. | |
e01402b1 RB |
16 | */ |
17 | ||
18 | /* | |
19 | * VPE support module | |
20 | * | |
21 | * Provides support for loading a MIPS SP program on VPE1. | |
22 | * The SP enviroment is rather simple, no tlb's. It needs to be relocatable | |
23 | * (or partially linked). You should initialise your stack in the startup | |
24 | * code. This loader looks for the symbol __start and sets up | |
25 | * execution to resume from there. The MIPS SDE kit contains suitable examples. | |
26 | * | |
27 | * To load and run, simply cat a SP 'program file' to /dev/vpe1. | |
28 | * i.e cat spapp >/dev/vpe1. | |
e01402b1 | 29 | */ |
e01402b1 | 30 | #include <linux/kernel.h> |
27a3bbaf | 31 | #include <linux/device.h> |
e01402b1 RB |
32 | #include <linux/module.h> |
33 | #include <linux/fs.h> | |
34 | #include <linux/init.h> | |
35 | #include <asm/uaccess.h> | |
36 | #include <linux/slab.h> | |
37 | #include <linux/list.h> | |
38 | #include <linux/vmalloc.h> | |
39 | #include <linux/elf.h> | |
40 | #include <linux/seq_file.h> | |
41 | #include <linux/syscalls.h> | |
42 | #include <linux/moduleloader.h> | |
43 | #include <linux/interrupt.h> | |
44 | #include <linux/poll.h> | |
45 | #include <linux/bootmem.h> | |
46 | #include <asm/mipsregs.h> | |
340ee4b9 | 47 | #include <asm/mipsmtregs.h> |
e01402b1 RB |
48 | #include <asm/cacheflush.h> |
49 | #include <asm/atomic.h> | |
50 | #include <asm/cpu.h> | |
27a3bbaf | 51 | #include <asm/mips_mt.h> |
e01402b1 RB |
52 | #include <asm/processor.h> |
53 | #include <asm/system.h> | |
2600990e RB |
54 | #include <asm/vpe.h> |
55 | #include <asm/kspd.h> | |
e01402b1 RB |
56 | |
57 | typedef void *vpe_handle; | |
58 | ||
e01402b1 RB |
59 | #ifndef ARCH_SHF_SMALL |
60 | #define ARCH_SHF_SMALL 0 | |
61 | #endif | |
62 | ||
63 | /* If this is set, the section belongs in the init part of the module */ | |
64 | #define INIT_OFFSET_MASK (1UL << (BITS_PER_LONG-1)) | |
65 | ||
41790e04 RB |
66 | /* |
67 | * The number of TCs and VPEs physically available on the core | |
68 | */ | |
69 | static int hw_tcs, hw_vpes; | |
e01402b1 | 70 | static char module_name[] = "vpe"; |
307bd284 | 71 | static int major; |
27a3bbaf | 72 | static const int minor = 1; /* fixed for now */ |
e01402b1 | 73 | |
2600990e RB |
74 | #ifdef CONFIG_MIPS_APSP_KSPD |
75 | static struct kspd_notifications kspd_events; | |
76 | static int kspd_events_reqd = 0; | |
77 | #endif | |
78 | ||
e01402b1 RB |
79 | /* grab the likely amount of memory we will need. */ |
80 | #ifdef CONFIG_MIPS_VPE_LOADER_TOM | |
81 | #define P_SIZE (2 * 1024 * 1024) | |
82 | #else | |
83 | /* add an overhead to the max kmalloc size for non-striped symbols/etc */ | |
84 | #define P_SIZE (256 * 1024) | |
85 | #endif | |
86 | ||
2600990e RB |
87 | extern unsigned long physical_memsize; |
88 | ||
e01402b1 | 89 | #define MAX_VPES 16 |
2600990e | 90 | #define VPE_PATH_MAX 256 |
e01402b1 RB |
91 | |
92 | enum vpe_state { | |
93 | VPE_STATE_UNUSED = 0, | |
94 | VPE_STATE_INUSE, | |
95 | VPE_STATE_RUNNING | |
96 | }; | |
97 | ||
98 | enum tc_state { | |
99 | TC_STATE_UNUSED = 0, | |
100 | TC_STATE_INUSE, | |
101 | TC_STATE_RUNNING, | |
102 | TC_STATE_DYNAMIC | |
103 | }; | |
104 | ||
307bd284 | 105 | struct vpe { |
e01402b1 RB |
106 | enum vpe_state state; |
107 | ||
108 | /* (device) minor associated with this vpe */ | |
109 | int minor; | |
110 | ||
111 | /* elfloader stuff */ | |
112 | void *load_addr; | |
571e0bed | 113 | unsigned long len; |
e01402b1 | 114 | char *pbuffer; |
571e0bed | 115 | unsigned long plen; |
2600990e RB |
116 | unsigned int uid, gid; |
117 | char cwd[VPE_PATH_MAX]; | |
e01402b1 RB |
118 | |
119 | unsigned long __start; | |
120 | ||
121 | /* tc's associated with this vpe */ | |
122 | struct list_head tc; | |
123 | ||
124 | /* The list of vpe's */ | |
125 | struct list_head list; | |
126 | ||
127 | /* shared symbol address */ | |
128 | void *shared_ptr; | |
2600990e RB |
129 | |
130 | /* the list of who wants to know when something major happens */ | |
131 | struct list_head notify; | |
41790e04 RB |
132 | |
133 | unsigned int ntcs; | |
307bd284 RB |
134 | }; |
135 | ||
136 | struct tc { | |
137 | enum tc_state state; | |
138 | int index; | |
139 | ||
07cc0c9e RB |
140 | struct vpe *pvpe; /* parent VPE */ |
141 | struct list_head tc; /* The list of TC's with this VPE */ | |
142 | struct list_head list; /* The global list of tc's */ | |
307bd284 | 143 | }; |
e01402b1 | 144 | |
9cfdf6f1 | 145 | struct { |
e01402b1 RB |
146 | /* Virtual processing elements */ |
147 | struct list_head vpe_list; | |
148 | ||
149 | /* Thread contexts */ | |
150 | struct list_head tc_list; | |
9cfdf6f1 RB |
151 | } vpecontrol = { |
152 | .vpe_list = LIST_HEAD_INIT(vpecontrol.vpe_list), | |
153 | .tc_list = LIST_HEAD_INIT(vpecontrol.tc_list) | |
154 | }; | |
e01402b1 RB |
155 | |
156 | static void release_progmem(void *ptr); | |
e01402b1 RB |
157 | extern void save_gp_address(unsigned int secbase, unsigned int rel); |
158 | ||
159 | /* get the vpe associated with this minor */ | |
160 | struct vpe *get_vpe(int minor) | |
161 | { | |
162 | struct vpe *v; | |
163 | ||
2600990e RB |
164 | if (!cpu_has_mipsmt) |
165 | return NULL; | |
166 | ||
e01402b1 RB |
167 | list_for_each_entry(v, &vpecontrol.vpe_list, list) { |
168 | if (v->minor == minor) | |
169 | return v; | |
170 | } | |
171 | ||
e01402b1 RB |
172 | return NULL; |
173 | } | |
174 | ||
175 | /* get the vpe associated with this minor */ | |
176 | struct tc *get_tc(int index) | |
177 | { | |
178 | struct tc *t; | |
179 | ||
180 | list_for_each_entry(t, &vpecontrol.tc_list, list) { | |
181 | if (t->index == index) | |
182 | return t; | |
183 | } | |
184 | ||
e01402b1 RB |
185 | return NULL; |
186 | } | |
187 | ||
188 | struct tc *get_tc_unused(void) | |
189 | { | |
190 | struct tc *t; | |
191 | ||
192 | list_for_each_entry(t, &vpecontrol.tc_list, list) { | |
193 | if (t->state == TC_STATE_UNUSED) | |
194 | return t; | |
195 | } | |
196 | ||
e01402b1 RB |
197 | return NULL; |
198 | } | |
199 | ||
200 | /* allocate a vpe and associate it with this minor (or index) */ | |
201 | struct vpe *alloc_vpe(int minor) | |
202 | { | |
203 | struct vpe *v; | |
204 | ||
307bd284 | 205 | if ((v = kzalloc(sizeof(struct vpe), GFP_KERNEL)) == NULL) { |
e01402b1 RB |
206 | return NULL; |
207 | } | |
208 | ||
e01402b1 RB |
209 | INIT_LIST_HEAD(&v->tc); |
210 | list_add_tail(&v->list, &vpecontrol.vpe_list); | |
211 | ||
2600990e | 212 | INIT_LIST_HEAD(&v->notify); |
e01402b1 RB |
213 | v->minor = minor; |
214 | return v; | |
215 | } | |
216 | ||
217 | /* allocate a tc. At startup only tc0 is running, all other can be halted. */ | |
218 | struct tc *alloc_tc(int index) | |
219 | { | |
07cc0c9e | 220 | struct tc *tc; |
e01402b1 | 221 | |
07cc0c9e RB |
222 | if ((tc = kzalloc(sizeof(struct tc), GFP_KERNEL)) == NULL) |
223 | goto out; | |
e01402b1 | 224 | |
07cc0c9e RB |
225 | INIT_LIST_HEAD(&tc->tc); |
226 | tc->index = index; | |
227 | list_add_tail(&tc->list, &vpecontrol.tc_list); | |
e01402b1 | 228 | |
07cc0c9e RB |
229 | out: |
230 | return tc; | |
e01402b1 RB |
231 | } |
232 | ||
233 | /* clean up and free everything */ | |
234 | void release_vpe(struct vpe *v) | |
235 | { | |
236 | list_del(&v->list); | |
237 | if (v->load_addr) | |
238 | release_progmem(v); | |
239 | kfree(v); | |
240 | } | |
241 | ||
242 | void dump_mtregs(void) | |
243 | { | |
244 | unsigned long val; | |
245 | ||
246 | val = read_c0_config3(); | |
247 | printk("config3 0x%lx MT %ld\n", val, | |
248 | (val & CONFIG3_MT) >> CONFIG3_MT_SHIFT); | |
249 | ||
e01402b1 RB |
250 | val = read_c0_mvpcontrol(); |
251 | printk("MVPControl 0x%lx, STLB %ld VPC %ld EVP %ld\n", val, | |
252 | (val & MVPCONTROL_STLB) >> MVPCONTROL_STLB_SHIFT, | |
253 | (val & MVPCONTROL_VPC) >> MVPCONTROL_VPC_SHIFT, | |
254 | (val & MVPCONTROL_EVP)); | |
255 | ||
2600990e RB |
256 | val = read_c0_mvpconf0(); |
257 | printk("mvpconf0 0x%lx, PVPE %ld PTC %ld M %ld\n", val, | |
258 | (val & MVPCONF0_PVPE) >> MVPCONF0_PVPE_SHIFT, | |
259 | val & MVPCONF0_PTC, (val & MVPCONF0_M) >> MVPCONF0_M_SHIFT); | |
e01402b1 RB |
260 | } |
261 | ||
262 | /* Find some VPE program space */ | |
571e0bed | 263 | static void *alloc_progmem(unsigned long len) |
e01402b1 | 264 | { |
5408c490 RB |
265 | void *addr; |
266 | ||
e01402b1 | 267 | #ifdef CONFIG_MIPS_VPE_LOADER_TOM |
5408c490 RB |
268 | /* |
269 | * This means you must tell Linux to use less memory than you | |
270 | * physically have, for example by passing a mem= boot argument. | |
271 | */ | |
272 | addr = pfn_to_kaddr(max_pfn); | |
273 | memset(addr, 0, len); | |
e01402b1 | 274 | #else |
5408c490 RB |
275 | /* simple grab some mem for now */ |
276 | addr = kzalloc(len, GFP_KERNEL); | |
e01402b1 | 277 | #endif |
5408c490 RB |
278 | |
279 | return addr; | |
e01402b1 RB |
280 | } |
281 | ||
282 | static void release_progmem(void *ptr) | |
283 | { | |
284 | #ifndef CONFIG_MIPS_VPE_LOADER_TOM | |
285 | kfree(ptr); | |
286 | #endif | |
287 | } | |
288 | ||
289 | /* Update size with this section: return offset. */ | |
290 | static long get_offset(unsigned long *size, Elf_Shdr * sechdr) | |
291 | { | |
292 | long ret; | |
293 | ||
294 | ret = ALIGN(*size, sechdr->sh_addralign ? : 1); | |
295 | *size = ret + sechdr->sh_size; | |
296 | return ret; | |
297 | } | |
298 | ||
299 | /* Lay out the SHF_ALLOC sections in a way not dissimilar to how ld | |
300 | might -- code, read-only data, read-write data, small data. Tally | |
301 | sizes, and place the offsets into sh_entsize fields: high bit means it | |
302 | belongs in init. */ | |
303 | static void layout_sections(struct module *mod, const Elf_Ehdr * hdr, | |
304 | Elf_Shdr * sechdrs, const char *secstrings) | |
305 | { | |
306 | static unsigned long const masks[][2] = { | |
307 | /* NOTE: all executable code must be the first section | |
308 | * in this array; otherwise modify the text_size | |
309 | * finder in the two loops below */ | |
310 | {SHF_EXECINSTR | SHF_ALLOC, ARCH_SHF_SMALL}, | |
311 | {SHF_ALLOC, SHF_WRITE | ARCH_SHF_SMALL}, | |
312 | {SHF_WRITE | SHF_ALLOC, ARCH_SHF_SMALL}, | |
313 | {ARCH_SHF_SMALL | SHF_ALLOC, 0} | |
314 | }; | |
315 | unsigned int m, i; | |
316 | ||
317 | for (i = 0; i < hdr->e_shnum; i++) | |
318 | sechdrs[i].sh_entsize = ~0UL; | |
319 | ||
320 | for (m = 0; m < ARRAY_SIZE(masks); ++m) { | |
321 | for (i = 0; i < hdr->e_shnum; ++i) { | |
322 | Elf_Shdr *s = &sechdrs[i]; | |
323 | ||
324 | // || strncmp(secstrings + s->sh_name, ".init", 5) == 0) | |
325 | if ((s->sh_flags & masks[m][0]) != masks[m][0] | |
326 | || (s->sh_flags & masks[m][1]) | |
327 | || s->sh_entsize != ~0UL) | |
328 | continue; | |
329 | s->sh_entsize = get_offset(&mod->core_size, s); | |
330 | } | |
331 | ||
332 | if (m == 0) | |
333 | mod->core_text_size = mod->core_size; | |
334 | ||
335 | } | |
336 | } | |
337 | ||
338 | ||
339 | /* from module-elf32.c, but subverted a little */ | |
340 | ||
341 | struct mips_hi16 { | |
342 | struct mips_hi16 *next; | |
343 | Elf32_Addr *addr; | |
344 | Elf32_Addr value; | |
345 | }; | |
346 | ||
347 | static struct mips_hi16 *mips_hi16_list; | |
348 | static unsigned int gp_offs, gp_addr; | |
349 | ||
350 | static int apply_r_mips_none(struct module *me, uint32_t *location, | |
351 | Elf32_Addr v) | |
352 | { | |
353 | return 0; | |
354 | } | |
355 | ||
356 | static int apply_r_mips_gprel16(struct module *me, uint32_t *location, | |
357 | Elf32_Addr v) | |
358 | { | |
359 | int rel; | |
360 | ||
361 | if( !(*location & 0xffff) ) { | |
362 | rel = (int)v - gp_addr; | |
363 | } | |
364 | else { | |
365 | /* .sbss + gp(relative) + offset */ | |
366 | /* kludge! */ | |
367 | rel = (int)(short)((int)v + gp_offs + | |
368 | (int)(short)(*location & 0xffff) - gp_addr); | |
369 | } | |
370 | ||
371 | if( (rel > 32768) || (rel < -32768) ) { | |
2600990e RB |
372 | printk(KERN_DEBUG "VPE loader: apply_r_mips_gprel16: " |
373 | "relative address 0x%x out of range of gp register\n", | |
374 | rel); | |
e01402b1 RB |
375 | return -ENOEXEC; |
376 | } | |
377 | ||
378 | *location = (*location & 0xffff0000) | (rel & 0xffff); | |
379 | ||
380 | return 0; | |
381 | } | |
382 | ||
383 | static int apply_r_mips_pc16(struct module *me, uint32_t *location, | |
384 | Elf32_Addr v) | |
385 | { | |
386 | int rel; | |
387 | rel = (((unsigned int)v - (unsigned int)location)); | |
388 | rel >>= 2; // because the offset is in _instructions_ not bytes. | |
389 | rel -= 1; // and one instruction less due to the branch delay slot. | |
390 | ||
391 | if( (rel > 32768) || (rel < -32768) ) { | |
2600990e RB |
392 | printk(KERN_DEBUG "VPE loader: " |
393 | "apply_r_mips_pc16: relative address out of range 0x%x\n", rel); | |
e01402b1 RB |
394 | return -ENOEXEC; |
395 | } | |
396 | ||
397 | *location = (*location & 0xffff0000) | (rel & 0xffff); | |
398 | ||
399 | return 0; | |
400 | } | |
401 | ||
402 | static int apply_r_mips_32(struct module *me, uint32_t *location, | |
403 | Elf32_Addr v) | |
404 | { | |
405 | *location += v; | |
406 | ||
407 | return 0; | |
408 | } | |
409 | ||
410 | static int apply_r_mips_26(struct module *me, uint32_t *location, | |
411 | Elf32_Addr v) | |
412 | { | |
413 | if (v % 4) { | |
2600990e RB |
414 | printk(KERN_DEBUG "VPE loader: apply_r_mips_26 " |
415 | " unaligned relocation\n"); | |
e01402b1 RB |
416 | return -ENOEXEC; |
417 | } | |
418 | ||
307bd284 RB |
419 | /* |
420 | * Not desperately convinced this is a good check of an overflow condition | |
421 | * anyway. But it gets in the way of handling undefined weak symbols which | |
422 | * we want to set to zero. | |
423 | * if ((v & 0xf0000000) != (((unsigned long)location + 4) & 0xf0000000)) { | |
424 | * printk(KERN_ERR | |
425 | * "module %s: relocation overflow\n", | |
426 | * me->name); | |
427 | * return -ENOEXEC; | |
428 | * } | |
429 | */ | |
e01402b1 RB |
430 | |
431 | *location = (*location & ~0x03ffffff) | | |
432 | ((*location + (v >> 2)) & 0x03ffffff); | |
433 | return 0; | |
434 | } | |
435 | ||
436 | static int apply_r_mips_hi16(struct module *me, uint32_t *location, | |
437 | Elf32_Addr v) | |
438 | { | |
439 | struct mips_hi16 *n; | |
440 | ||
441 | /* | |
442 | * We cannot relocate this one now because we don't know the value of | |
443 | * the carry we need to add. Save the information, and let LO16 do the | |
444 | * actual relocation. | |
445 | */ | |
446 | n = kmalloc(sizeof *n, GFP_KERNEL); | |
447 | if (!n) | |
448 | return -ENOMEM; | |
449 | ||
450 | n->addr = location; | |
451 | n->value = v; | |
452 | n->next = mips_hi16_list; | |
453 | mips_hi16_list = n; | |
454 | ||
455 | return 0; | |
456 | } | |
457 | ||
458 | static int apply_r_mips_lo16(struct module *me, uint32_t *location, | |
459 | Elf32_Addr v) | |
460 | { | |
461 | unsigned long insnlo = *location; | |
462 | Elf32_Addr val, vallo; | |
463 | ||
464 | /* Sign extend the addend we extract from the lo insn. */ | |
465 | vallo = ((insnlo & 0xffff) ^ 0x8000) - 0x8000; | |
466 | ||
467 | if (mips_hi16_list != NULL) { | |
468 | struct mips_hi16 *l; | |
469 | ||
470 | l = mips_hi16_list; | |
471 | while (l != NULL) { | |
472 | struct mips_hi16 *next; | |
473 | unsigned long insn; | |
474 | ||
475 | /* | |
476 | * The value for the HI16 had best be the same. | |
477 | */ | |
2600990e RB |
478 | if (v != l->value) { |
479 | printk(KERN_DEBUG "VPE loader: " | |
b1e3afa0 | 480 | "apply_r_mips_lo16/hi16: \t" |
2600990e RB |
481 | "inconsistent value information\n"); |
482 | return -ENOEXEC; | |
e01402b1 RB |
483 | } |
484 | ||
e01402b1 RB |
485 | /* |
486 | * Do the HI16 relocation. Note that we actually don't | |
487 | * need to know anything about the LO16 itself, except | |
488 | * where to find the low 16 bits of the addend needed | |
489 | * by the LO16. | |
490 | */ | |
491 | insn = *l->addr; | |
492 | val = ((insn & 0xffff) << 16) + vallo; | |
493 | val += v; | |
494 | ||
495 | /* | |
496 | * Account for the sign extension that will happen in | |
497 | * the low bits. | |
498 | */ | |
499 | val = ((val >> 16) + ((val & 0x8000) != 0)) & 0xffff; | |
500 | ||
501 | insn = (insn & ~0xffff) | val; | |
502 | *l->addr = insn; | |
503 | ||
504 | next = l->next; | |
505 | kfree(l); | |
506 | l = next; | |
507 | } | |
508 | ||
509 | mips_hi16_list = NULL; | |
510 | } | |
511 | ||
512 | /* | |
513 | * Ok, we're done with the HI16 relocs. Now deal with the LO16. | |
514 | */ | |
515 | val = v + vallo; | |
516 | insnlo = (insnlo & ~0xffff) | (val & 0xffff); | |
517 | *location = insnlo; | |
518 | ||
519 | return 0; | |
e01402b1 RB |
520 | } |
521 | ||
522 | static int (*reloc_handlers[]) (struct module *me, uint32_t *location, | |
523 | Elf32_Addr v) = { | |
524 | [R_MIPS_NONE] = apply_r_mips_none, | |
525 | [R_MIPS_32] = apply_r_mips_32, | |
526 | [R_MIPS_26] = apply_r_mips_26, | |
527 | [R_MIPS_HI16] = apply_r_mips_hi16, | |
528 | [R_MIPS_LO16] = apply_r_mips_lo16, | |
529 | [R_MIPS_GPREL16] = apply_r_mips_gprel16, | |
530 | [R_MIPS_PC16] = apply_r_mips_pc16 | |
531 | }; | |
532 | ||
2600990e | 533 | static char *rstrs[] = { |
e0daad44 | 534 | [R_MIPS_NONE] = "MIPS_NONE", |
2600990e RB |
535 | [R_MIPS_32] = "MIPS_32", |
536 | [R_MIPS_26] = "MIPS_26", | |
537 | [R_MIPS_HI16] = "MIPS_HI16", | |
538 | [R_MIPS_LO16] = "MIPS_LO16", | |
539 | [R_MIPS_GPREL16] = "MIPS_GPREL16", | |
540 | [R_MIPS_PC16] = "MIPS_PC16" | |
541 | }; | |
e01402b1 RB |
542 | |
543 | int apply_relocations(Elf32_Shdr *sechdrs, | |
544 | const char *strtab, | |
545 | unsigned int symindex, | |
546 | unsigned int relsec, | |
547 | struct module *me) | |
548 | { | |
549 | Elf32_Rel *rel = (void *) sechdrs[relsec].sh_addr; | |
550 | Elf32_Sym *sym; | |
551 | uint32_t *location; | |
552 | unsigned int i; | |
553 | Elf32_Addr v; | |
554 | int res; | |
555 | ||
556 | for (i = 0; i < sechdrs[relsec].sh_size / sizeof(*rel); i++) { | |
557 | Elf32_Word r_info = rel[i].r_info; | |
558 | ||
559 | /* This is where to make the change */ | |
560 | location = (void *)sechdrs[sechdrs[relsec].sh_info].sh_addr | |
561 | + rel[i].r_offset; | |
562 | /* This is the symbol it is referring to */ | |
563 | sym = (Elf32_Sym *)sechdrs[symindex].sh_addr | |
564 | + ELF32_R_SYM(r_info); | |
565 | ||
566 | if (!sym->st_value) { | |
567 | printk(KERN_DEBUG "%s: undefined weak symbol %s\n", | |
568 | me->name, strtab + sym->st_name); | |
569 | /* just print the warning, dont barf */ | |
570 | } | |
571 | ||
572 | v = sym->st_value; | |
573 | ||
574 | res = reloc_handlers[ELF32_R_TYPE(r_info)](me, location, v); | |
575 | if( res ) { | |
2600990e RB |
576 | char *r = rstrs[ELF32_R_TYPE(r_info)]; |
577 | printk(KERN_WARNING "VPE loader: .text+0x%x " | |
578 | "relocation type %s for symbol \"%s\" failed\n", | |
579 | rel[i].r_offset, r ? r : "UNKNOWN", | |
580 | strtab + sym->st_name); | |
e01402b1 | 581 | return res; |
2600990e | 582 | } |
e01402b1 RB |
583 | } |
584 | ||
585 | return 0; | |
586 | } | |
587 | ||
588 | void save_gp_address(unsigned int secbase, unsigned int rel) | |
589 | { | |
590 | gp_addr = secbase + rel; | |
591 | gp_offs = gp_addr - (secbase & 0xffff0000); | |
592 | } | |
593 | /* end module-elf32.c */ | |
594 | ||
595 | ||
596 | ||
597 | /* Change all symbols so that sh_value encodes the pointer directly. */ | |
2600990e | 598 | static void simplify_symbols(Elf_Shdr * sechdrs, |
e01402b1 RB |
599 | unsigned int symindex, |
600 | const char *strtab, | |
601 | const char *secstrings, | |
602 | unsigned int nsecs, struct module *mod) | |
603 | { | |
604 | Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; | |
605 | unsigned long secbase, bssbase = 0; | |
606 | unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); | |
2600990e | 607 | int size; |
e01402b1 RB |
608 | |
609 | /* find the .bss section for COMMON symbols */ | |
610 | for (i = 0; i < nsecs; i++) { | |
2600990e | 611 | if (strncmp(secstrings + sechdrs[i].sh_name, ".bss", 4) == 0) { |
e01402b1 | 612 | bssbase = sechdrs[i].sh_addr; |
2600990e RB |
613 | break; |
614 | } | |
e01402b1 RB |
615 | } |
616 | ||
617 | for (i = 1; i < n; i++) { | |
618 | switch (sym[i].st_shndx) { | |
619 | case SHN_COMMON: | |
2600990e RB |
620 | /* Allocate space for the symbol in the .bss section. |
621 | st_value is currently size. | |
e01402b1 RB |
622 | We want it to have the address of the symbol. */ |
623 | ||
624 | size = sym[i].st_value; | |
625 | sym[i].st_value = bssbase; | |
626 | ||
627 | bssbase += size; | |
628 | break; | |
629 | ||
630 | case SHN_ABS: | |
631 | /* Don't need to do anything */ | |
632 | break; | |
633 | ||
634 | case SHN_UNDEF: | |
635 | /* ret = -ENOENT; */ | |
636 | break; | |
637 | ||
638 | case SHN_MIPS_SCOMMON: | |
b1e3afa0 | 639 | printk(KERN_DEBUG "simplify_symbols: ignoring SHN_MIPS_SCOMMON " |
2600990e RB |
640 | "symbol <%s> st_shndx %d\n", strtab + sym[i].st_name, |
641 | sym[i].st_shndx); | |
e01402b1 RB |
642 | // .sbss section |
643 | break; | |
644 | ||
645 | default: | |
646 | secbase = sechdrs[sym[i].st_shndx].sh_addr; | |
647 | ||
648 | if (strncmp(strtab + sym[i].st_name, "_gp", 3) == 0) { | |
649 | save_gp_address(secbase, sym[i].st_value); | |
650 | } | |
651 | ||
652 | sym[i].st_value += secbase; | |
653 | break; | |
654 | } | |
e01402b1 | 655 | } |
e01402b1 RB |
656 | } |
657 | ||
658 | #ifdef DEBUG_ELFLOADER | |
659 | static void dump_elfsymbols(Elf_Shdr * sechdrs, unsigned int symindex, | |
660 | const char *strtab, struct module *mod) | |
661 | { | |
662 | Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; | |
663 | unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); | |
664 | ||
665 | printk(KERN_DEBUG "dump_elfsymbols: n %d\n", n); | |
666 | for (i = 1; i < n; i++) { | |
667 | printk(KERN_DEBUG " i %d name <%s> 0x%x\n", i, | |
668 | strtab + sym[i].st_name, sym[i].st_value); | |
669 | } | |
670 | } | |
671 | #endif | |
672 | ||
e01402b1 | 673 | /* We are prepared so configure and start the VPE... */ |
be6e1437 | 674 | static int vpe_run(struct vpe * v) |
e01402b1 | 675 | { |
07cc0c9e | 676 | unsigned long flags, val, dmt_flag; |
2600990e | 677 | struct vpe_notifications *n; |
07cc0c9e | 678 | unsigned int vpeflags; |
e01402b1 RB |
679 | struct tc *t; |
680 | ||
681 | /* check we are the Master VPE */ | |
07cc0c9e | 682 | local_irq_save(flags); |
e01402b1 RB |
683 | val = read_c0_vpeconf0(); |
684 | if (!(val & VPECONF0_MVP)) { | |
685 | printk(KERN_WARNING | |
2600990e | 686 | "VPE loader: only Master VPE's are allowed to configure MT\n"); |
07cc0c9e RB |
687 | local_irq_restore(flags); |
688 | ||
e01402b1 RB |
689 | return -1; |
690 | } | |
691 | ||
07cc0c9e RB |
692 | dmt_flag = dmt(); |
693 | vpeflags = dvpe(); | |
e01402b1 | 694 | |
2600990e | 695 | if (!list_empty(&v->tc)) { |
e0daad44 | 696 | if ((t = list_entry(v->tc.next, struct tc, tc)) == NULL) { |
07cc0c9e RB |
697 | evpe(vpeflags); |
698 | emt(dmt_flag); | |
699 | local_irq_restore(flags); | |
700 | ||
701 | printk(KERN_WARNING | |
702 | "VPE loader: TC %d is already in use.\n", | |
703 | t->index); | |
e0daad44 RB |
704 | return -ENOEXEC; |
705 | } | |
706 | } else { | |
07cc0c9e RB |
707 | evpe(vpeflags); |
708 | emt(dmt_flag); | |
709 | local_irq_restore(flags); | |
710 | ||
711 | printk(KERN_WARNING | |
712 | "VPE loader: No TC's associated with VPE %d\n", | |
e0daad44 | 713 | v->minor); |
07cc0c9e | 714 | |
e0daad44 RB |
715 | return -ENOEXEC; |
716 | } | |
2600990e | 717 | |
e01402b1 | 718 | /* Put MVPE's into 'configuration state' */ |
340ee4b9 | 719 | set_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 | 720 | |
e01402b1 RB |
721 | settc(t->index); |
722 | ||
e01402b1 RB |
723 | /* should check it is halted, and not activated */ |
724 | if ((read_tc_c0_tcstatus() & TCSTATUS_A) || !(read_tc_c0_tchalt() & TCHALT_H)) { | |
07cc0c9e RB |
725 | evpe(vpeflags); |
726 | emt(dmt_flag); | |
727 | local_irq_restore(flags); | |
728 | ||
729 | printk(KERN_WARNING "VPE loader: TC %d is already active!\n", | |
e01402b1 | 730 | t->index); |
07cc0c9e | 731 | |
e01402b1 RB |
732 | return -ENOEXEC; |
733 | } | |
734 | ||
735 | /* Write the address we want it to start running from in the TCPC register. */ | |
736 | write_tc_c0_tcrestart((unsigned long)v->__start); | |
e01402b1 | 737 | write_tc_c0_tccontext((unsigned long)0); |
07cc0c9e | 738 | |
2600990e RB |
739 | /* |
740 | * Mark the TC as activated, not interrupt exempt and not dynamically | |
741 | * allocatable | |
742 | */ | |
e01402b1 RB |
743 | val = read_tc_c0_tcstatus(); |
744 | val = (val & ~(TCSTATUS_DA | TCSTATUS_IXMT)) | TCSTATUS_A; | |
745 | write_tc_c0_tcstatus(val); | |
746 | ||
747 | write_tc_c0_tchalt(read_tc_c0_tchalt() & ~TCHALT_H); | |
748 | ||
e01402b1 RB |
749 | /* |
750 | * The sde-kit passes 'memsize' to __start in $a3, so set something | |
2600990e | 751 | * here... Or set $a3 to zero and define DFLT_STACK_SIZE and |
e01402b1 RB |
752 | * DFLT_HEAP_SIZE when you compile your program |
753 | */ | |
41790e04 | 754 | mttgpr(6, v->ntcs); |
07cc0c9e | 755 | mttgpr(7, physical_memsize); |
2600990e RB |
756 | |
757 | /* set up VPE1 */ | |
758 | /* | |
759 | * bind the TC to VPE 1 as late as possible so we only have the final | |
760 | * VPE registers to set up, and so an EJTAG probe can trigger on it | |
761 | */ | |
07cc0c9e | 762 | write_tc_c0_tcbind((read_tc_c0_tcbind() & ~TCBIND_CURVPE) | 1); |
e01402b1 | 763 | |
a94d7020 EO |
764 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~(VPECONF0_VPA)); |
765 | ||
766 | back_to_back_c0_hazard(); | |
767 | ||
e0daad44 RB |
768 | /* Set up the XTC bit in vpeconf0 to point at our tc */ |
769 | write_vpe_c0_vpeconf0( (read_vpe_c0_vpeconf0() & ~(VPECONF0_XTC)) | |
770 | | (t->index << VPECONF0_XTC_SHIFT)); | |
e01402b1 | 771 | |
a94d7020 EO |
772 | back_to_back_c0_hazard(); |
773 | ||
e0daad44 RB |
774 | /* enable this VPE */ |
775 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() | VPECONF0_VPA); | |
e01402b1 RB |
776 | |
777 | /* clear out any left overs from a previous program */ | |
2600990e | 778 | write_vpe_c0_status(0); |
e01402b1 RB |
779 | write_vpe_c0_cause(0); |
780 | ||
781 | /* take system out of configuration state */ | |
340ee4b9 | 782 | clear_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 | 783 | |
07cc0c9e | 784 | #ifdef CONFIG_SMP |
e01402b1 | 785 | evpe(EVPE_ENABLE); |
07cc0c9e RB |
786 | #else |
787 | evpe(vpeflags); | |
788 | #endif | |
789 | emt(dmt_flag); | |
790 | local_irq_restore(flags); | |
e01402b1 | 791 | |
07cc0c9e RB |
792 | list_for_each_entry(n, &v->notify, list) |
793 | n->start(minor); | |
2600990e | 794 | |
e01402b1 RB |
795 | return 0; |
796 | } | |
797 | ||
2600990e | 798 | static int find_vpe_symbols(struct vpe * v, Elf_Shdr * sechdrs, |
e01402b1 RB |
799 | unsigned int symindex, const char *strtab, |
800 | struct module *mod) | |
801 | { | |
802 | Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; | |
803 | unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); | |
804 | ||
805 | for (i = 1; i < n; i++) { | |
806 | if (strcmp(strtab + sym[i].st_name, "__start") == 0) { | |
807 | v->__start = sym[i].st_value; | |
808 | } | |
809 | ||
810 | if (strcmp(strtab + sym[i].st_name, "vpe_shared") == 0) { | |
811 | v->shared_ptr = (void *)sym[i].st_value; | |
812 | } | |
813 | } | |
814 | ||
2600990e RB |
815 | if ( (v->__start == 0) || (v->shared_ptr == NULL)) |
816 | return -1; | |
817 | ||
e01402b1 RB |
818 | return 0; |
819 | } | |
820 | ||
307bd284 | 821 | /* |
2600990e RB |
822 | * Allocates a VPE with some program code space(the load address), copies the |
823 | * contents of the program (p)buffer performing relocatations/etc, free's it | |
824 | * when finished. | |
825 | */ | |
be6e1437 | 826 | static int vpe_elfload(struct vpe * v) |
e01402b1 RB |
827 | { |
828 | Elf_Ehdr *hdr; | |
829 | Elf_Shdr *sechdrs; | |
830 | long err = 0; | |
831 | char *secstrings, *strtab = NULL; | |
2600990e | 832 | unsigned int len, i, symindex = 0, strindex = 0, relocate = 0; |
e01402b1 RB |
833 | struct module mod; // so we can re-use the relocations code |
834 | ||
835 | memset(&mod, 0, sizeof(struct module)); | |
2600990e | 836 | strcpy(mod.name, "VPE loader"); |
e01402b1 RB |
837 | |
838 | hdr = (Elf_Ehdr *) v->pbuffer; | |
839 | len = v->plen; | |
840 | ||
841 | /* Sanity checks against insmoding binaries or wrong arch, | |
842 | weird elf version */ | |
843 | if (memcmp(hdr->e_ident, ELFMAG, 4) != 0 | |
2600990e RB |
844 | || (hdr->e_type != ET_REL && hdr->e_type != ET_EXEC) |
845 | || !elf_check_arch(hdr) | |
e01402b1 RB |
846 | || hdr->e_shentsize != sizeof(*sechdrs)) { |
847 | printk(KERN_WARNING | |
2600990e | 848 | "VPE loader: program wrong arch or weird elf version\n"); |
e01402b1 RB |
849 | |
850 | return -ENOEXEC; | |
851 | } | |
852 | ||
2600990e RB |
853 | if (hdr->e_type == ET_REL) |
854 | relocate = 1; | |
855 | ||
e01402b1 | 856 | if (len < hdr->e_shoff + hdr->e_shnum * sizeof(Elf_Shdr)) { |
2600990e RB |
857 | printk(KERN_ERR "VPE loader: program length %u truncated\n", |
858 | len); | |
859 | ||
e01402b1 RB |
860 | return -ENOEXEC; |
861 | } | |
862 | ||
863 | /* Convenience variables */ | |
864 | sechdrs = (void *)hdr + hdr->e_shoff; | |
865 | secstrings = (void *)hdr + sechdrs[hdr->e_shstrndx].sh_offset; | |
866 | sechdrs[0].sh_addr = 0; | |
867 | ||
868 | /* And these should exist, but gcc whinges if we don't init them */ | |
869 | symindex = strindex = 0; | |
870 | ||
2600990e RB |
871 | if (relocate) { |
872 | for (i = 1; i < hdr->e_shnum; i++) { | |
873 | if (sechdrs[i].sh_type != SHT_NOBITS | |
874 | && len < sechdrs[i].sh_offset + sechdrs[i].sh_size) { | |
875 | printk(KERN_ERR "VPE program length %u truncated\n", | |
876 | len); | |
877 | return -ENOEXEC; | |
878 | } | |
e01402b1 | 879 | |
2600990e RB |
880 | /* Mark all sections sh_addr with their address in the |
881 | temporary image. */ | |
882 | sechdrs[i].sh_addr = (size_t) hdr + sechdrs[i].sh_offset; | |
e01402b1 | 883 | |
2600990e RB |
884 | /* Internal symbols and strings. */ |
885 | if (sechdrs[i].sh_type == SHT_SYMTAB) { | |
886 | symindex = i; | |
887 | strindex = sechdrs[i].sh_link; | |
888 | strtab = (char *)hdr + sechdrs[strindex].sh_offset; | |
889 | } | |
e01402b1 | 890 | } |
2600990e | 891 | layout_sections(&mod, hdr, sechdrs, secstrings); |
e01402b1 RB |
892 | } |
893 | ||
e01402b1 | 894 | v->load_addr = alloc_progmem(mod.core_size); |
5408c490 RB |
895 | if (!v->load_addr) |
896 | return -ENOMEM; | |
e01402b1 | 897 | |
5408c490 | 898 | pr_info("VPE loader: loading to %p\n", v->load_addr); |
e01402b1 | 899 | |
2600990e RB |
900 | if (relocate) { |
901 | for (i = 0; i < hdr->e_shnum; i++) { | |
902 | void *dest; | |
e01402b1 | 903 | |
2600990e RB |
904 | if (!(sechdrs[i].sh_flags & SHF_ALLOC)) |
905 | continue; | |
e01402b1 | 906 | |
2600990e | 907 | dest = v->load_addr + sechdrs[i].sh_entsize; |
e01402b1 | 908 | |
2600990e RB |
909 | if (sechdrs[i].sh_type != SHT_NOBITS) |
910 | memcpy(dest, (void *)sechdrs[i].sh_addr, | |
911 | sechdrs[i].sh_size); | |
912 | /* Update sh_addr to point to copy in image. */ | |
913 | sechdrs[i].sh_addr = (unsigned long)dest; | |
e01402b1 | 914 | |
2600990e RB |
915 | printk(KERN_DEBUG " section sh_name %s sh_addr 0x%x\n", |
916 | secstrings + sechdrs[i].sh_name, sechdrs[i].sh_addr); | |
917 | } | |
e01402b1 | 918 | |
2600990e RB |
919 | /* Fix up syms, so that st_value is a pointer to location. */ |
920 | simplify_symbols(sechdrs, symindex, strtab, secstrings, | |
921 | hdr->e_shnum, &mod); | |
922 | ||
923 | /* Now do relocations. */ | |
924 | for (i = 1; i < hdr->e_shnum; i++) { | |
925 | const char *strtab = (char *)sechdrs[strindex].sh_addr; | |
926 | unsigned int info = sechdrs[i].sh_info; | |
927 | ||
928 | /* Not a valid relocation section? */ | |
929 | if (info >= hdr->e_shnum) | |
930 | continue; | |
931 | ||
932 | /* Don't bother with non-allocated sections */ | |
933 | if (!(sechdrs[info].sh_flags & SHF_ALLOC)) | |
934 | continue; | |
935 | ||
936 | if (sechdrs[i].sh_type == SHT_REL) | |
937 | err = apply_relocations(sechdrs, strtab, symindex, i, | |
938 | &mod); | |
939 | else if (sechdrs[i].sh_type == SHT_RELA) | |
940 | err = apply_relocate_add(sechdrs, strtab, symindex, i, | |
941 | &mod); | |
942 | if (err < 0) | |
943 | return err; | |
944 | ||
945 | } | |
946 | } else { | |
bdf5d42c | 947 | struct elf_phdr *phdr = (struct elf_phdr *) ((char *)hdr + hdr->e_phoff); |
2600990e | 948 | |
bdf5d42c RB |
949 | for (i = 0; i < hdr->e_phnum; i++) { |
950 | if (phdr->p_type != PT_LOAD) | |
951 | continue; | |
952 | ||
82923663 RB |
953 | memcpy((void *)phdr->p_paddr, (char *)hdr + phdr->p_offset, phdr->p_filesz); |
954 | memset((void *)phdr->p_paddr + phdr->p_filesz, 0, phdr->p_memsz - phdr->p_filesz); | |
bdf5d42c RB |
955 | phdr++; |
956 | } | |
957 | ||
958 | for (i = 0; i < hdr->e_shnum; i++) { | |
2600990e RB |
959 | /* Internal symbols and strings. */ |
960 | if (sechdrs[i].sh_type == SHT_SYMTAB) { | |
961 | symindex = i; | |
962 | strindex = sechdrs[i].sh_link; | |
963 | strtab = (char *)hdr + sechdrs[strindex].sh_offset; | |
964 | ||
965 | /* mark the symtab's address for when we try to find the | |
966 | magic symbols */ | |
967 | sechdrs[i].sh_addr = (size_t) hdr + sechdrs[i].sh_offset; | |
968 | } | |
e01402b1 RB |
969 | } |
970 | } | |
971 | ||
972 | /* make sure it's physically written out */ | |
973 | flush_icache_range((unsigned long)v->load_addr, | |
974 | (unsigned long)v->load_addr + v->len); | |
975 | ||
976 | if ((find_vpe_symbols(v, sechdrs, symindex, strtab, &mod)) < 0) { | |
2600990e RB |
977 | if (v->__start == 0) { |
978 | printk(KERN_WARNING "VPE loader: program does not contain " | |
979 | "a __start symbol\n"); | |
980 | return -ENOEXEC; | |
981 | } | |
e01402b1 | 982 | |
2600990e RB |
983 | if (v->shared_ptr == NULL) |
984 | printk(KERN_WARNING "VPE loader: " | |
985 | "program does not contain vpe_shared symbol.\n" | |
986 | " Unable to use AMVP (AP/SP) facilities.\n"); | |
e01402b1 RB |
987 | } |
988 | ||
989 | printk(" elf loaded\n"); | |
2600990e | 990 | return 0; |
e01402b1 RB |
991 | } |
992 | ||
2600990e RB |
993 | static void cleanup_tc(struct tc *tc) |
994 | { | |
07cc0c9e RB |
995 | unsigned long flags; |
996 | unsigned int mtflags, vpflags; | |
2600990e RB |
997 | int tmp; |
998 | ||
07cc0c9e RB |
999 | local_irq_save(flags); |
1000 | mtflags = dmt(); | |
1001 | vpflags = dvpe(); | |
2600990e RB |
1002 | /* Put MVPE's into 'configuration state' */ |
1003 | set_c0_mvpcontrol(MVPCONTROL_VPC); | |
1004 | ||
1005 | settc(tc->index); | |
1006 | tmp = read_tc_c0_tcstatus(); | |
1007 | ||
1008 | /* mark not allocated and not dynamically allocatable */ | |
1009 | tmp &= ~(TCSTATUS_A | TCSTATUS_DA); | |
1010 | tmp |= TCSTATUS_IXMT; /* interrupt exempt */ | |
1011 | write_tc_c0_tcstatus(tmp); | |
1012 | ||
1013 | write_tc_c0_tchalt(TCHALT_H); | |
7c3a622d | 1014 | mips_ihb(); |
2600990e RB |
1015 | |
1016 | /* bind it to anything other than VPE1 */ | |
07cc0c9e | 1017 | // write_tc_c0_tcbind(read_tc_c0_tcbind() & ~TCBIND_CURVPE); // | TCBIND_CURVPE |
2600990e RB |
1018 | |
1019 | clear_c0_mvpcontrol(MVPCONTROL_VPC); | |
07cc0c9e RB |
1020 | evpe(vpflags); |
1021 | emt(mtflags); | |
1022 | local_irq_restore(flags); | |
2600990e RB |
1023 | } |
1024 | ||
1025 | static int getcwd(char *buff, int size) | |
1026 | { | |
1027 | mm_segment_t old_fs; | |
1028 | int ret; | |
1029 | ||
1030 | old_fs = get_fs(); | |
1031 | set_fs(KERNEL_DS); | |
1032 | ||
21a151d8 | 1033 | ret = sys_getcwd(buff, size); |
2600990e RB |
1034 | |
1035 | set_fs(old_fs); | |
1036 | ||
1037 | return ret; | |
1038 | } | |
1039 | ||
1040 | /* checks VPE is unused and gets ready to load program */ | |
e01402b1 RB |
1041 | static int vpe_open(struct inode *inode, struct file *filp) |
1042 | { | |
c4c4018b | 1043 | enum vpe_state state; |
2600990e | 1044 | struct vpe_notifications *not; |
07cc0c9e RB |
1045 | struct vpe *v; |
1046 | int ret; | |
e01402b1 | 1047 | |
07cc0c9e RB |
1048 | if (minor != iminor(inode)) { |
1049 | /* assume only 1 device at the moment. */ | |
2600990e | 1050 | printk(KERN_WARNING "VPE loader: only vpe1 is supported\n"); |
e01402b1 RB |
1051 | return -ENODEV; |
1052 | } | |
1053 | ||
07cc0c9e | 1054 | if ((v = get_vpe(tclimit)) == NULL) { |
2600990e | 1055 | printk(KERN_WARNING "VPE loader: unable to get vpe\n"); |
e01402b1 RB |
1056 | return -ENODEV; |
1057 | } | |
1058 | ||
c4c4018b RB |
1059 | state = xchg(&v->state, VPE_STATE_INUSE); |
1060 | if (state != VPE_STATE_UNUSED) { | |
2600990e | 1061 | printk(KERN_DEBUG "VPE loader: tc in use dumping regs\n"); |
e01402b1 | 1062 | |
2600990e | 1063 | list_for_each_entry(not, &v->notify, list) { |
07cc0c9e | 1064 | not->stop(tclimit); |
2600990e | 1065 | } |
e01402b1 | 1066 | |
2600990e | 1067 | release_progmem(v->load_addr); |
07cc0c9e | 1068 | cleanup_tc(get_tc(tclimit)); |
e01402b1 RB |
1069 | } |
1070 | ||
e01402b1 RB |
1071 | /* this of-course trashes what was there before... */ |
1072 | v->pbuffer = vmalloc(P_SIZE); | |
1073 | v->plen = P_SIZE; | |
1074 | v->load_addr = NULL; | |
1075 | v->len = 0; | |
1076 | ||
2600990e RB |
1077 | v->uid = filp->f_uid; |
1078 | v->gid = filp->f_gid; | |
1079 | ||
1080 | #ifdef CONFIG_MIPS_APSP_KSPD | |
1081 | /* get kspd to tell us when a syscall_exit happens */ | |
1082 | if (!kspd_events_reqd) { | |
1083 | kspd_notify(&kspd_events); | |
1084 | kspd_events_reqd++; | |
1085 | } | |
1086 | #endif | |
1087 | ||
1088 | v->cwd[0] = 0; | |
1089 | ret = getcwd(v->cwd, VPE_PATH_MAX); | |
1090 | if (ret < 0) | |
1091 | printk(KERN_WARNING "VPE loader: open, getcwd returned %d\n", ret); | |
1092 | ||
1093 | v->shared_ptr = NULL; | |
1094 | v->__start = 0; | |
07cc0c9e | 1095 | |
e01402b1 RB |
1096 | return 0; |
1097 | } | |
1098 | ||
1099 | static int vpe_release(struct inode *inode, struct file *filp) | |
1100 | { | |
307bd284 | 1101 | struct vpe *v; |
e01402b1 | 1102 | Elf_Ehdr *hdr; |
07cc0c9e | 1103 | int ret = 0; |
e01402b1 | 1104 | |
07cc0c9e RB |
1105 | v = get_vpe(tclimit); |
1106 | if (v == NULL) | |
e01402b1 RB |
1107 | return -ENODEV; |
1108 | ||
e01402b1 RB |
1109 | hdr = (Elf_Ehdr *) v->pbuffer; |
1110 | if (memcmp(hdr->e_ident, ELFMAG, 4) == 0) { | |
07cc0c9e | 1111 | if (vpe_elfload(v) >= 0) { |
e01402b1 | 1112 | vpe_run(v); |
07cc0c9e | 1113 | } else { |
2600990e | 1114 | printk(KERN_WARNING "VPE loader: ELF load failed.\n"); |
e01402b1 RB |
1115 | ret = -ENOEXEC; |
1116 | } | |
1117 | } else { | |
2600990e | 1118 | printk(KERN_WARNING "VPE loader: only elf files are supported\n"); |
e01402b1 RB |
1119 | ret = -ENOEXEC; |
1120 | } | |
1121 | ||
2600990e RB |
1122 | /* It's good to be able to run the SP and if it chokes have a look at |
1123 | the /dev/rt?. But if we reset the pointer to the shared struct we | |
1124 | loose what has happened. So perhaps if garbage is sent to the vpe | |
1125 | device, use it as a trigger for the reset. Hopefully a nice | |
1126 | executable will be along shortly. */ | |
1127 | if (ret < 0) | |
1128 | v->shared_ptr = NULL; | |
1129 | ||
e01402b1 RB |
1130 | // cleanup any temp buffers |
1131 | if (v->pbuffer) | |
1132 | vfree(v->pbuffer); | |
1133 | v->plen = 0; | |
1134 | return ret; | |
1135 | } | |
1136 | ||
1137 | static ssize_t vpe_write(struct file *file, const char __user * buffer, | |
1138 | size_t count, loff_t * ppos) | |
1139 | { | |
e01402b1 | 1140 | size_t ret = count; |
307bd284 | 1141 | struct vpe *v; |
e01402b1 | 1142 | |
07cc0c9e RB |
1143 | if (iminor(file->f_path.dentry->d_inode) != minor) |
1144 | return -ENODEV; | |
1145 | ||
1146 | v = get_vpe(tclimit); | |
1147 | if (v == NULL) | |
e01402b1 RB |
1148 | return -ENODEV; |
1149 | ||
1150 | if (v->pbuffer == NULL) { | |
2600990e | 1151 | printk(KERN_ERR "VPE loader: no buffer for program\n"); |
e01402b1 RB |
1152 | return -ENOMEM; |
1153 | } | |
1154 | ||
1155 | if ((count + v->len) > v->plen) { | |
1156 | printk(KERN_WARNING | |
2600990e | 1157 | "VPE loader: elf size too big. Perhaps strip uneeded symbols\n"); |
e01402b1 RB |
1158 | return -ENOMEM; |
1159 | } | |
1160 | ||
1161 | count -= copy_from_user(v->pbuffer + v->len, buffer, count); | |
2600990e | 1162 | if (!count) |
e01402b1 | 1163 | return -EFAULT; |
e01402b1 RB |
1164 | |
1165 | v->len += count; | |
1166 | return ret; | |
1167 | } | |
1168 | ||
5dfe4c96 | 1169 | static const struct file_operations vpe_fops = { |
e01402b1 RB |
1170 | .owner = THIS_MODULE, |
1171 | .open = vpe_open, | |
1172 | .release = vpe_release, | |
1173 | .write = vpe_write | |
1174 | }; | |
1175 | ||
1176 | /* module wrapper entry points */ | |
1177 | /* give me a vpe */ | |
1178 | vpe_handle vpe_alloc(void) | |
1179 | { | |
1180 | int i; | |
1181 | struct vpe *v; | |
1182 | ||
1183 | /* find a vpe */ | |
1184 | for (i = 1; i < MAX_VPES; i++) { | |
1185 | if ((v = get_vpe(i)) != NULL) { | |
1186 | v->state = VPE_STATE_INUSE; | |
1187 | return v; | |
1188 | } | |
1189 | } | |
1190 | return NULL; | |
1191 | } | |
1192 | ||
1193 | EXPORT_SYMBOL(vpe_alloc); | |
1194 | ||
1195 | /* start running from here */ | |
1196 | int vpe_start(vpe_handle vpe, unsigned long start) | |
1197 | { | |
1198 | struct vpe *v = vpe; | |
1199 | ||
1200 | v->__start = start; | |
1201 | return vpe_run(v); | |
1202 | } | |
1203 | ||
1204 | EXPORT_SYMBOL(vpe_start); | |
1205 | ||
1206 | /* halt it for now */ | |
1207 | int vpe_stop(vpe_handle vpe) | |
1208 | { | |
1209 | struct vpe *v = vpe; | |
1210 | struct tc *t; | |
1211 | unsigned int evpe_flags; | |
1212 | ||
1213 | evpe_flags = dvpe(); | |
1214 | ||
1215 | if ((t = list_entry(v->tc.next, struct tc, tc)) != NULL) { | |
1216 | ||
1217 | settc(t->index); | |
1218 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~VPECONF0_VPA); | |
1219 | } | |
1220 | ||
1221 | evpe(evpe_flags); | |
1222 | ||
1223 | return 0; | |
1224 | } | |
1225 | ||
1226 | EXPORT_SYMBOL(vpe_stop); | |
1227 | ||
1228 | /* I've done with it thank you */ | |
1229 | int vpe_free(vpe_handle vpe) | |
1230 | { | |
1231 | struct vpe *v = vpe; | |
1232 | struct tc *t; | |
1233 | unsigned int evpe_flags; | |
1234 | ||
1235 | if ((t = list_entry(v->tc.next, struct tc, tc)) == NULL) { | |
1236 | return -ENOEXEC; | |
1237 | } | |
1238 | ||
1239 | evpe_flags = dvpe(); | |
1240 | ||
1241 | /* Put MVPE's into 'configuration state' */ | |
340ee4b9 | 1242 | set_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 RB |
1243 | |
1244 | settc(t->index); | |
1245 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~VPECONF0_VPA); | |
1246 | ||
7c3a622d | 1247 | /* halt the TC */ |
e01402b1 | 1248 | write_tc_c0_tchalt(TCHALT_H); |
7c3a622d NS |
1249 | mips_ihb(); |
1250 | ||
1251 | /* mark the TC unallocated */ | |
1252 | write_tc_c0_tcstatus(read_tc_c0_tcstatus() & ~TCSTATUS_A); | |
e01402b1 RB |
1253 | |
1254 | v->state = VPE_STATE_UNUSED; | |
1255 | ||
340ee4b9 | 1256 | clear_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 RB |
1257 | evpe(evpe_flags); |
1258 | ||
1259 | return 0; | |
1260 | } | |
1261 | ||
1262 | EXPORT_SYMBOL(vpe_free); | |
1263 | ||
1264 | void *vpe_get_shared(int index) | |
1265 | { | |
1266 | struct vpe *v; | |
1267 | ||
2600990e | 1268 | if ((v = get_vpe(index)) == NULL) |
e01402b1 | 1269 | return NULL; |
e01402b1 RB |
1270 | |
1271 | return v->shared_ptr; | |
1272 | } | |
1273 | ||
1274 | EXPORT_SYMBOL(vpe_get_shared); | |
1275 | ||
2600990e RB |
1276 | int vpe_getuid(int index) |
1277 | { | |
1278 | struct vpe *v; | |
1279 | ||
1280 | if ((v = get_vpe(index)) == NULL) | |
1281 | return -1; | |
1282 | ||
1283 | return v->uid; | |
1284 | } | |
1285 | ||
1286 | EXPORT_SYMBOL(vpe_getuid); | |
1287 | ||
1288 | int vpe_getgid(int index) | |
1289 | { | |
1290 | struct vpe *v; | |
1291 | ||
1292 | if ((v = get_vpe(index)) == NULL) | |
1293 | return -1; | |
1294 | ||
1295 | return v->gid; | |
1296 | } | |
1297 | ||
1298 | EXPORT_SYMBOL(vpe_getgid); | |
1299 | ||
1300 | int vpe_notify(int index, struct vpe_notifications *notify) | |
1301 | { | |
1302 | struct vpe *v; | |
1303 | ||
1304 | if ((v = get_vpe(index)) == NULL) | |
1305 | return -1; | |
1306 | ||
1307 | list_add(¬ify->list, &v->notify); | |
1308 | return 0; | |
1309 | } | |
1310 | ||
1311 | EXPORT_SYMBOL(vpe_notify); | |
1312 | ||
1313 | char *vpe_getcwd(int index) | |
1314 | { | |
1315 | struct vpe *v; | |
1316 | ||
1317 | if ((v = get_vpe(index)) == NULL) | |
1318 | return NULL; | |
1319 | ||
1320 | return v->cwd; | |
1321 | } | |
1322 | ||
1323 | EXPORT_SYMBOL(vpe_getcwd); | |
1324 | ||
1325 | #ifdef CONFIG_MIPS_APSP_KSPD | |
1326 | static void kspd_sp_exit( int sp_id) | |
1327 | { | |
1328 | cleanup_tc(get_tc(sp_id)); | |
1329 | } | |
1330 | #endif | |
1331 | ||
736fad17 KS |
1332 | static ssize_t store_kill(struct device *dev, struct device_attribute *attr, |
1333 | const char *buf, size_t len) | |
0f5d0df3 RB |
1334 | { |
1335 | struct vpe *vpe = get_vpe(tclimit); | |
1336 | struct vpe_notifications *not; | |
1337 | ||
1338 | list_for_each_entry(not, &vpe->notify, list) { | |
1339 | not->stop(tclimit); | |
1340 | } | |
1341 | ||
1342 | release_progmem(vpe->load_addr); | |
1343 | cleanup_tc(get_tc(tclimit)); | |
1344 | vpe_stop(vpe); | |
1345 | vpe_free(vpe); | |
1346 | ||
1347 | return len; | |
1348 | } | |
1349 | ||
736fad17 KS |
1350 | static ssize_t show_ntcs(struct device *cd, struct device_attribute *attr, |
1351 | char *buf) | |
41790e04 RB |
1352 | { |
1353 | struct vpe *vpe = get_vpe(tclimit); | |
1354 | ||
1355 | return sprintf(buf, "%d\n", vpe->ntcs); | |
1356 | } | |
1357 | ||
736fad17 KS |
1358 | static ssize_t store_ntcs(struct device *dev, struct device_attribute *attr, |
1359 | const char *buf, size_t len) | |
41790e04 RB |
1360 | { |
1361 | struct vpe *vpe = get_vpe(tclimit); | |
1362 | unsigned long new; | |
1363 | char *endp; | |
1364 | ||
1365 | new = simple_strtoul(buf, &endp, 0); | |
1366 | if (endp == buf) | |
1367 | goto out_einval; | |
1368 | ||
1369 | if (new == 0 || new > (hw_tcs - tclimit)) | |
1370 | goto out_einval; | |
1371 | ||
1372 | vpe->ntcs = new; | |
1373 | ||
1374 | return len; | |
1375 | ||
1376 | out_einval: | |
1377 | return -EINVAL;; | |
1378 | } | |
1379 | ||
736fad17 | 1380 | static struct device_attribute vpe_class_attributes[] = { |
0f5d0df3 | 1381 | __ATTR(kill, S_IWUSR, NULL, store_kill), |
41790e04 RB |
1382 | __ATTR(ntcs, S_IRUGO | S_IWUSR, show_ntcs, store_ntcs), |
1383 | {} | |
1384 | }; | |
1385 | ||
736fad17 | 1386 | static void vpe_device_release(struct device *cd) |
41790e04 RB |
1387 | { |
1388 | kfree(cd); | |
1389 | } | |
1390 | ||
1391 | struct class vpe_class = { | |
1392 | .name = "vpe", | |
1393 | .owner = THIS_MODULE, | |
736fad17 KS |
1394 | .dev_release = vpe_device_release, |
1395 | .dev_attrs = vpe_class_attributes, | |
41790e04 RB |
1396 | }; |
1397 | ||
736fad17 | 1398 | struct device vpe_device; |
27a3bbaf | 1399 | |
e01402b1 RB |
1400 | static int __init vpe_module_init(void) |
1401 | { | |
07cc0c9e | 1402 | unsigned int mtflags, vpflags; |
07cc0c9e | 1403 | unsigned long flags, val; |
e01402b1 RB |
1404 | struct vpe *v = NULL; |
1405 | struct tc *t; | |
41790e04 | 1406 | int tc, err; |
e01402b1 RB |
1407 | |
1408 | if (!cpu_has_mipsmt) { | |
1409 | printk("VPE loader: not a MIPS MT capable processor\n"); | |
1410 | return -ENODEV; | |
1411 | } | |
1412 | ||
07cc0c9e RB |
1413 | if (vpelimit == 0) { |
1414 | printk(KERN_WARNING "No VPEs reserved for AP/SP, not " | |
1415 | "initializing VPE loader.\nPass maxvpes=<n> argument as " | |
1416 | "kernel argument\n"); | |
1417 | ||
1418 | return -ENODEV; | |
1419 | } | |
1420 | ||
1421 | if (tclimit == 0) { | |
1422 | printk(KERN_WARNING "No TCs reserved for AP/SP, not " | |
1423 | "initializing VPE loader.\nPass maxtcs=<n> argument as " | |
1424 | "kernel argument\n"); | |
1425 | ||
1426 | return -ENODEV; | |
1427 | } | |
1428 | ||
682e852e AD |
1429 | major = register_chrdev(0, module_name, &vpe_fops); |
1430 | if (major < 0) { | |
e01402b1 | 1431 | printk("VPE loader: unable to register character device\n"); |
307bd284 | 1432 | return major; |
e01402b1 RB |
1433 | } |
1434 | ||
41790e04 RB |
1435 | err = class_register(&vpe_class); |
1436 | if (err) { | |
1437 | printk(KERN_ERR "vpe_class registration failed\n"); | |
27a3bbaf RB |
1438 | goto out_chrdev; |
1439 | } | |
41790e04 | 1440 | |
736fad17 | 1441 | device_initialize(&vpe_device); |
41790e04 RB |
1442 | vpe_device.class = &vpe_class, |
1443 | vpe_device.parent = NULL, | |
736fad17 | 1444 | strlcpy(vpe_device.bus_id, "vpe1", BUS_ID_SIZE); |
41790e04 | 1445 | vpe_device.devt = MKDEV(major, minor); |
736fad17 | 1446 | err = device_add(&vpe_device); |
41790e04 RB |
1447 | if (err) { |
1448 | printk(KERN_ERR "Adding vpe_device failed\n"); | |
1449 | goto out_class; | |
1450 | } | |
27a3bbaf | 1451 | |
07cc0c9e RB |
1452 | local_irq_save(flags); |
1453 | mtflags = dmt(); | |
1454 | vpflags = dvpe(); | |
e01402b1 RB |
1455 | |
1456 | /* Put MVPE's into 'configuration state' */ | |
340ee4b9 | 1457 | set_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 RB |
1458 | |
1459 | /* dump_mtregs(); */ | |
1460 | ||
e01402b1 | 1461 | val = read_c0_mvpconf0(); |
07cc0c9e RB |
1462 | hw_tcs = (val & MVPCONF0_PTC) + 1; |
1463 | hw_vpes = ((val & MVPCONF0_PVPE) >> MVPCONF0_PVPE_SHIFT) + 1; | |
1464 | ||
1465 | for (tc = tclimit; tc < hw_tcs; tc++) { | |
1466 | /* | |
1467 | * Must re-enable multithreading temporarily or in case we | |
1468 | * reschedule send IPIs or similar we might hang. | |
1469 | */ | |
1470 | clear_c0_mvpcontrol(MVPCONTROL_VPC); | |
1471 | evpe(vpflags); | |
1472 | emt(mtflags); | |
1473 | local_irq_restore(flags); | |
1474 | t = alloc_tc(tc); | |
1475 | if (!t) { | |
1476 | err = -ENOMEM; | |
1477 | goto out; | |
1478 | } | |
1479 | ||
1480 | local_irq_save(flags); | |
1481 | mtflags = dmt(); | |
1482 | vpflags = dvpe(); | |
1483 | set_c0_mvpcontrol(MVPCONTROL_VPC); | |
e01402b1 RB |
1484 | |
1485 | /* VPE's */ | |
07cc0c9e RB |
1486 | if (tc < hw_tcs) { |
1487 | settc(tc); | |
e01402b1 | 1488 | |
07cc0c9e | 1489 | if ((v = alloc_vpe(tc)) == NULL) { |
e01402b1 | 1490 | printk(KERN_WARNING "VPE: unable to allocate VPE\n"); |
07cc0c9e RB |
1491 | |
1492 | goto out_reenable; | |
e01402b1 RB |
1493 | } |
1494 | ||
41790e04 RB |
1495 | v->ntcs = hw_tcs - tclimit; |
1496 | ||
2600990e RB |
1497 | /* add the tc to the list of this vpe's tc's. */ |
1498 | list_add(&t->tc, &v->tc); | |
e01402b1 RB |
1499 | |
1500 | /* deactivate all but vpe0 */ | |
07cc0c9e | 1501 | if (tc >= tclimit) { |
e01402b1 RB |
1502 | unsigned long tmp = read_vpe_c0_vpeconf0(); |
1503 | ||
1504 | tmp &= ~VPECONF0_VPA; | |
1505 | ||
1506 | /* master VPE */ | |
1507 | tmp |= VPECONF0_MVP; | |
1508 | write_vpe_c0_vpeconf0(tmp); | |
1509 | } | |
1510 | ||
1511 | /* disable multi-threading with TC's */ | |
1512 | write_vpe_c0_vpecontrol(read_vpe_c0_vpecontrol() & ~VPECONTROL_TE); | |
1513 | ||
07cc0c9e | 1514 | if (tc >= vpelimit) { |
2600990e RB |
1515 | /* |
1516 | * Set config to be the same as vpe0, | |
1517 | * particularly kseg0 coherency alg | |
1518 | */ | |
e01402b1 RB |
1519 | write_vpe_c0_config(read_c0_config()); |
1520 | } | |
e01402b1 RB |
1521 | } |
1522 | ||
1523 | /* TC's */ | |
1524 | t->pvpe = v; /* set the parent vpe */ | |
1525 | ||
07cc0c9e | 1526 | if (tc >= tclimit) { |
e01402b1 RB |
1527 | unsigned long tmp; |
1528 | ||
07cc0c9e | 1529 | settc(tc); |
e01402b1 | 1530 | |
2600990e RB |
1531 | /* Any TC that is bound to VPE0 gets left as is - in case |
1532 | we are running SMTC on VPE0. A TC that is bound to any | |
1533 | other VPE gets bound to VPE0, ideally I'd like to make | |
1534 | it homeless but it doesn't appear to let me bind a TC | |
1535 | to a non-existent VPE. Which is perfectly reasonable. | |
1536 | ||
1537 | The (un)bound state is visible to an EJTAG probe so may | |
1538 | notify GDB... | |
1539 | */ | |
1540 | ||
1541 | if (((tmp = read_tc_c0_tcbind()) & TCBIND_CURVPE)) { | |
1542 | /* tc is bound >vpe0 */ | |
1543 | write_tc_c0_tcbind(tmp & ~TCBIND_CURVPE); | |
1544 | ||
1545 | t->pvpe = get_vpe(0); /* set the parent vpe */ | |
1546 | } | |
e01402b1 | 1547 | |
7c3a622d NS |
1548 | /* halt the TC */ |
1549 | write_tc_c0_tchalt(TCHALT_H); | |
1550 | mips_ihb(); | |
1551 | ||
e01402b1 RB |
1552 | tmp = read_tc_c0_tcstatus(); |
1553 | ||
2600990e | 1554 | /* mark not activated and not dynamically allocatable */ |
e01402b1 RB |
1555 | tmp &= ~(TCSTATUS_A | TCSTATUS_DA); |
1556 | tmp |= TCSTATUS_IXMT; /* interrupt exempt */ | |
1557 | write_tc_c0_tcstatus(tmp); | |
e01402b1 RB |
1558 | } |
1559 | } | |
1560 | ||
07cc0c9e | 1561 | out_reenable: |
e01402b1 | 1562 | /* release config state */ |
340ee4b9 | 1563 | clear_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 | 1564 | |
07cc0c9e RB |
1565 | evpe(vpflags); |
1566 | emt(mtflags); | |
1567 | local_irq_restore(flags); | |
1568 | ||
2600990e RB |
1569 | #ifdef CONFIG_MIPS_APSP_KSPD |
1570 | kspd_events.kspd_sp_exit = kspd_sp_exit; | |
1571 | #endif | |
e01402b1 | 1572 | return 0; |
27a3bbaf | 1573 | |
41790e04 RB |
1574 | out_class: |
1575 | class_unregister(&vpe_class); | |
27a3bbaf RB |
1576 | out_chrdev: |
1577 | unregister_chrdev(major, module_name); | |
1578 | ||
07cc0c9e | 1579 | out: |
27a3bbaf | 1580 | return err; |
e01402b1 RB |
1581 | } |
1582 | ||
1583 | static void __exit vpe_module_exit(void) | |
1584 | { | |
1585 | struct vpe *v, *n; | |
1586 | ||
1587 | list_for_each_entry_safe(v, n, &vpecontrol.vpe_list, list) { | |
1588 | if (v->state != VPE_STATE_UNUSED) { | |
1589 | release_vpe(v); | |
1590 | } | |
1591 | } | |
1592 | ||
736fad17 | 1593 | device_del(&vpe_device); |
e01402b1 RB |
1594 | unregister_chrdev(major, module_name); |
1595 | } | |
1596 | ||
1597 | module_init(vpe_module_init); | |
1598 | module_exit(vpe_module_exit); | |
1599 | MODULE_DESCRIPTION("MIPS VPE Loader"); | |
2600990e | 1600 | MODULE_AUTHOR("Elizabeth Oldham, MIPS Technologies, Inc."); |
e01402b1 | 1601 | MODULE_LICENSE("GPL"); |