]>
Commit | Line | Data |
---|---|---|
e01402b1 RB |
1 | /* |
2 | * Copyright (C) 2004, 2005 MIPS Technologies, Inc. All rights reserved. | |
3 | * | |
4 | * This program is free software; you can distribute it and/or modify it | |
5 | * under the terms of the GNU General Public License (Version 2) as | |
6 | * published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope it will be useful, but WITHOUT | |
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License | |
11 | * for more details. | |
12 | * | |
13 | * You should have received a copy of the GNU General Public License along | |
14 | * with this program; if not, write to the Free Software Foundation, Inc., | |
15 | * 59 Temple Place - Suite 330, Boston MA 02111-1307, USA. | |
e01402b1 RB |
16 | */ |
17 | ||
18 | /* | |
19 | * VPE support module | |
20 | * | |
21 | * Provides support for loading a MIPS SP program on VPE1. | |
22 | * The SP enviroment is rather simple, no tlb's. It needs to be relocatable | |
23 | * (or partially linked). You should initialise your stack in the startup | |
24 | * code. This loader looks for the symbol __start and sets up | |
25 | * execution to resume from there. The MIPS SDE kit contains suitable examples. | |
26 | * | |
27 | * To load and run, simply cat a SP 'program file' to /dev/vpe1. | |
28 | * i.e cat spapp >/dev/vpe1. | |
e01402b1 | 29 | */ |
e01402b1 | 30 | #include <linux/kernel.h> |
27a3bbaf | 31 | #include <linux/device.h> |
e01402b1 RB |
32 | #include <linux/module.h> |
33 | #include <linux/fs.h> | |
34 | #include <linux/init.h> | |
35 | #include <asm/uaccess.h> | |
36 | #include <linux/slab.h> | |
37 | #include <linux/list.h> | |
38 | #include <linux/vmalloc.h> | |
39 | #include <linux/elf.h> | |
40 | #include <linux/seq_file.h> | |
41 | #include <linux/syscalls.h> | |
42 | #include <linux/moduleloader.h> | |
43 | #include <linux/interrupt.h> | |
44 | #include <linux/poll.h> | |
45 | #include <linux/bootmem.h> | |
46 | #include <asm/mipsregs.h> | |
340ee4b9 | 47 | #include <asm/mipsmtregs.h> |
e01402b1 RB |
48 | #include <asm/cacheflush.h> |
49 | #include <asm/atomic.h> | |
50 | #include <asm/cpu.h> | |
27a3bbaf | 51 | #include <asm/mips_mt.h> |
e01402b1 RB |
52 | #include <asm/processor.h> |
53 | #include <asm/system.h> | |
2600990e RB |
54 | #include <asm/vpe.h> |
55 | #include <asm/kspd.h> | |
07cc0c9e | 56 | #include <asm/mips_mt.h> |
e01402b1 RB |
57 | |
58 | typedef void *vpe_handle; | |
59 | ||
e01402b1 RB |
60 | #ifndef ARCH_SHF_SMALL |
61 | #define ARCH_SHF_SMALL 0 | |
62 | #endif | |
63 | ||
64 | /* If this is set, the section belongs in the init part of the module */ | |
65 | #define INIT_OFFSET_MASK (1UL << (BITS_PER_LONG-1)) | |
66 | ||
e01402b1 | 67 | static char module_name[] = "vpe"; |
307bd284 | 68 | static int major; |
27a3bbaf | 69 | static const int minor = 1; /* fixed for now */ |
e01402b1 | 70 | |
2600990e RB |
71 | #ifdef CONFIG_MIPS_APSP_KSPD |
72 | static struct kspd_notifications kspd_events; | |
73 | static int kspd_events_reqd = 0; | |
74 | #endif | |
75 | ||
e01402b1 RB |
76 | /* grab the likely amount of memory we will need. */ |
77 | #ifdef CONFIG_MIPS_VPE_LOADER_TOM | |
78 | #define P_SIZE (2 * 1024 * 1024) | |
79 | #else | |
80 | /* add an overhead to the max kmalloc size for non-striped symbols/etc */ | |
81 | #define P_SIZE (256 * 1024) | |
82 | #endif | |
83 | ||
2600990e RB |
84 | extern unsigned long physical_memsize; |
85 | ||
e01402b1 | 86 | #define MAX_VPES 16 |
2600990e | 87 | #define VPE_PATH_MAX 256 |
e01402b1 RB |
88 | |
89 | enum vpe_state { | |
90 | VPE_STATE_UNUSED = 0, | |
91 | VPE_STATE_INUSE, | |
92 | VPE_STATE_RUNNING | |
93 | }; | |
94 | ||
95 | enum tc_state { | |
96 | TC_STATE_UNUSED = 0, | |
97 | TC_STATE_INUSE, | |
98 | TC_STATE_RUNNING, | |
99 | TC_STATE_DYNAMIC | |
100 | }; | |
101 | ||
307bd284 | 102 | struct vpe { |
e01402b1 RB |
103 | enum vpe_state state; |
104 | ||
105 | /* (device) minor associated with this vpe */ | |
106 | int minor; | |
107 | ||
108 | /* elfloader stuff */ | |
109 | void *load_addr; | |
571e0bed | 110 | unsigned long len; |
e01402b1 | 111 | char *pbuffer; |
571e0bed | 112 | unsigned long plen; |
2600990e RB |
113 | unsigned int uid, gid; |
114 | char cwd[VPE_PATH_MAX]; | |
e01402b1 RB |
115 | |
116 | unsigned long __start; | |
117 | ||
118 | /* tc's associated with this vpe */ | |
119 | struct list_head tc; | |
120 | ||
121 | /* The list of vpe's */ | |
122 | struct list_head list; | |
123 | ||
124 | /* shared symbol address */ | |
125 | void *shared_ptr; | |
2600990e RB |
126 | |
127 | /* the list of who wants to know when something major happens */ | |
128 | struct list_head notify; | |
307bd284 RB |
129 | }; |
130 | ||
131 | struct tc { | |
132 | enum tc_state state; | |
133 | int index; | |
134 | ||
07cc0c9e RB |
135 | struct vpe *pvpe; /* parent VPE */ |
136 | struct list_head tc; /* The list of TC's with this VPE */ | |
137 | struct list_head list; /* The global list of tc's */ | |
307bd284 | 138 | }; |
e01402b1 | 139 | |
9cfdf6f1 | 140 | struct { |
e01402b1 RB |
141 | /* Virtual processing elements */ |
142 | struct list_head vpe_list; | |
143 | ||
144 | /* Thread contexts */ | |
145 | struct list_head tc_list; | |
9cfdf6f1 RB |
146 | } vpecontrol = { |
147 | .vpe_list = LIST_HEAD_INIT(vpecontrol.vpe_list), | |
148 | .tc_list = LIST_HEAD_INIT(vpecontrol.tc_list) | |
149 | }; | |
e01402b1 RB |
150 | |
151 | static void release_progmem(void *ptr); | |
e01402b1 RB |
152 | extern void save_gp_address(unsigned int secbase, unsigned int rel); |
153 | ||
154 | /* get the vpe associated with this minor */ | |
155 | struct vpe *get_vpe(int minor) | |
156 | { | |
157 | struct vpe *v; | |
158 | ||
2600990e RB |
159 | if (!cpu_has_mipsmt) |
160 | return NULL; | |
161 | ||
e01402b1 RB |
162 | list_for_each_entry(v, &vpecontrol.vpe_list, list) { |
163 | if (v->minor == minor) | |
164 | return v; | |
165 | } | |
166 | ||
e01402b1 RB |
167 | return NULL; |
168 | } | |
169 | ||
170 | /* get the vpe associated with this minor */ | |
171 | struct tc *get_tc(int index) | |
172 | { | |
173 | struct tc *t; | |
174 | ||
175 | list_for_each_entry(t, &vpecontrol.tc_list, list) { | |
176 | if (t->index == index) | |
177 | return t; | |
178 | } | |
179 | ||
e01402b1 RB |
180 | return NULL; |
181 | } | |
182 | ||
183 | struct tc *get_tc_unused(void) | |
184 | { | |
185 | struct tc *t; | |
186 | ||
187 | list_for_each_entry(t, &vpecontrol.tc_list, list) { | |
188 | if (t->state == TC_STATE_UNUSED) | |
189 | return t; | |
190 | } | |
191 | ||
e01402b1 RB |
192 | return NULL; |
193 | } | |
194 | ||
195 | /* allocate a vpe and associate it with this minor (or index) */ | |
196 | struct vpe *alloc_vpe(int minor) | |
197 | { | |
198 | struct vpe *v; | |
199 | ||
307bd284 | 200 | if ((v = kzalloc(sizeof(struct vpe), GFP_KERNEL)) == NULL) { |
e01402b1 RB |
201 | return NULL; |
202 | } | |
203 | ||
e01402b1 RB |
204 | INIT_LIST_HEAD(&v->tc); |
205 | list_add_tail(&v->list, &vpecontrol.vpe_list); | |
206 | ||
2600990e | 207 | INIT_LIST_HEAD(&v->notify); |
e01402b1 RB |
208 | v->minor = minor; |
209 | return v; | |
210 | } | |
211 | ||
212 | /* allocate a tc. At startup only tc0 is running, all other can be halted. */ | |
213 | struct tc *alloc_tc(int index) | |
214 | { | |
07cc0c9e | 215 | struct tc *tc; |
e01402b1 | 216 | |
07cc0c9e RB |
217 | if ((tc = kzalloc(sizeof(struct tc), GFP_KERNEL)) == NULL) |
218 | goto out; | |
e01402b1 | 219 | |
07cc0c9e RB |
220 | INIT_LIST_HEAD(&tc->tc); |
221 | tc->index = index; | |
222 | list_add_tail(&tc->list, &vpecontrol.tc_list); | |
e01402b1 | 223 | |
07cc0c9e RB |
224 | out: |
225 | return tc; | |
e01402b1 RB |
226 | } |
227 | ||
228 | /* clean up and free everything */ | |
229 | void release_vpe(struct vpe *v) | |
230 | { | |
231 | list_del(&v->list); | |
232 | if (v->load_addr) | |
233 | release_progmem(v); | |
234 | kfree(v); | |
235 | } | |
236 | ||
237 | void dump_mtregs(void) | |
238 | { | |
239 | unsigned long val; | |
240 | ||
241 | val = read_c0_config3(); | |
242 | printk("config3 0x%lx MT %ld\n", val, | |
243 | (val & CONFIG3_MT) >> CONFIG3_MT_SHIFT); | |
244 | ||
e01402b1 RB |
245 | val = read_c0_mvpcontrol(); |
246 | printk("MVPControl 0x%lx, STLB %ld VPC %ld EVP %ld\n", val, | |
247 | (val & MVPCONTROL_STLB) >> MVPCONTROL_STLB_SHIFT, | |
248 | (val & MVPCONTROL_VPC) >> MVPCONTROL_VPC_SHIFT, | |
249 | (val & MVPCONTROL_EVP)); | |
250 | ||
2600990e RB |
251 | val = read_c0_mvpconf0(); |
252 | printk("mvpconf0 0x%lx, PVPE %ld PTC %ld M %ld\n", val, | |
253 | (val & MVPCONF0_PVPE) >> MVPCONF0_PVPE_SHIFT, | |
254 | val & MVPCONF0_PTC, (val & MVPCONF0_M) >> MVPCONF0_M_SHIFT); | |
e01402b1 RB |
255 | } |
256 | ||
257 | /* Find some VPE program space */ | |
571e0bed | 258 | static void *alloc_progmem(unsigned long len) |
e01402b1 RB |
259 | { |
260 | #ifdef CONFIG_MIPS_VPE_LOADER_TOM | |
261 | /* this means you must tell linux to use less memory than you physically have */ | |
571e0bed | 262 | return pfn_to_kaddr(max_pfn); |
e01402b1 RB |
263 | #else |
264 | // simple grab some mem for now | |
265 | return kmalloc(len, GFP_KERNEL); | |
266 | #endif | |
267 | } | |
268 | ||
269 | static void release_progmem(void *ptr) | |
270 | { | |
271 | #ifndef CONFIG_MIPS_VPE_LOADER_TOM | |
272 | kfree(ptr); | |
273 | #endif | |
274 | } | |
275 | ||
276 | /* Update size with this section: return offset. */ | |
277 | static long get_offset(unsigned long *size, Elf_Shdr * sechdr) | |
278 | { | |
279 | long ret; | |
280 | ||
281 | ret = ALIGN(*size, sechdr->sh_addralign ? : 1); | |
282 | *size = ret + sechdr->sh_size; | |
283 | return ret; | |
284 | } | |
285 | ||
286 | /* Lay out the SHF_ALLOC sections in a way not dissimilar to how ld | |
287 | might -- code, read-only data, read-write data, small data. Tally | |
288 | sizes, and place the offsets into sh_entsize fields: high bit means it | |
289 | belongs in init. */ | |
290 | static void layout_sections(struct module *mod, const Elf_Ehdr * hdr, | |
291 | Elf_Shdr * sechdrs, const char *secstrings) | |
292 | { | |
293 | static unsigned long const masks[][2] = { | |
294 | /* NOTE: all executable code must be the first section | |
295 | * in this array; otherwise modify the text_size | |
296 | * finder in the two loops below */ | |
297 | {SHF_EXECINSTR | SHF_ALLOC, ARCH_SHF_SMALL}, | |
298 | {SHF_ALLOC, SHF_WRITE | ARCH_SHF_SMALL}, | |
299 | {SHF_WRITE | SHF_ALLOC, ARCH_SHF_SMALL}, | |
300 | {ARCH_SHF_SMALL | SHF_ALLOC, 0} | |
301 | }; | |
302 | unsigned int m, i; | |
303 | ||
304 | for (i = 0; i < hdr->e_shnum; i++) | |
305 | sechdrs[i].sh_entsize = ~0UL; | |
306 | ||
307 | for (m = 0; m < ARRAY_SIZE(masks); ++m) { | |
308 | for (i = 0; i < hdr->e_shnum; ++i) { | |
309 | Elf_Shdr *s = &sechdrs[i]; | |
310 | ||
311 | // || strncmp(secstrings + s->sh_name, ".init", 5) == 0) | |
312 | if ((s->sh_flags & masks[m][0]) != masks[m][0] | |
313 | || (s->sh_flags & masks[m][1]) | |
314 | || s->sh_entsize != ~0UL) | |
315 | continue; | |
316 | s->sh_entsize = get_offset(&mod->core_size, s); | |
317 | } | |
318 | ||
319 | if (m == 0) | |
320 | mod->core_text_size = mod->core_size; | |
321 | ||
322 | } | |
323 | } | |
324 | ||
325 | ||
326 | /* from module-elf32.c, but subverted a little */ | |
327 | ||
328 | struct mips_hi16 { | |
329 | struct mips_hi16 *next; | |
330 | Elf32_Addr *addr; | |
331 | Elf32_Addr value; | |
332 | }; | |
333 | ||
334 | static struct mips_hi16 *mips_hi16_list; | |
335 | static unsigned int gp_offs, gp_addr; | |
336 | ||
337 | static int apply_r_mips_none(struct module *me, uint32_t *location, | |
338 | Elf32_Addr v) | |
339 | { | |
340 | return 0; | |
341 | } | |
342 | ||
343 | static int apply_r_mips_gprel16(struct module *me, uint32_t *location, | |
344 | Elf32_Addr v) | |
345 | { | |
346 | int rel; | |
347 | ||
348 | if( !(*location & 0xffff) ) { | |
349 | rel = (int)v - gp_addr; | |
350 | } | |
351 | else { | |
352 | /* .sbss + gp(relative) + offset */ | |
353 | /* kludge! */ | |
354 | rel = (int)(short)((int)v + gp_offs + | |
355 | (int)(short)(*location & 0xffff) - gp_addr); | |
356 | } | |
357 | ||
358 | if( (rel > 32768) || (rel < -32768) ) { | |
2600990e RB |
359 | printk(KERN_DEBUG "VPE loader: apply_r_mips_gprel16: " |
360 | "relative address 0x%x out of range of gp register\n", | |
361 | rel); | |
e01402b1 RB |
362 | return -ENOEXEC; |
363 | } | |
364 | ||
365 | *location = (*location & 0xffff0000) | (rel & 0xffff); | |
366 | ||
367 | return 0; | |
368 | } | |
369 | ||
370 | static int apply_r_mips_pc16(struct module *me, uint32_t *location, | |
371 | Elf32_Addr v) | |
372 | { | |
373 | int rel; | |
374 | rel = (((unsigned int)v - (unsigned int)location)); | |
375 | rel >>= 2; // because the offset is in _instructions_ not bytes. | |
376 | rel -= 1; // and one instruction less due to the branch delay slot. | |
377 | ||
378 | if( (rel > 32768) || (rel < -32768) ) { | |
2600990e RB |
379 | printk(KERN_DEBUG "VPE loader: " |
380 | "apply_r_mips_pc16: relative address out of range 0x%x\n", rel); | |
e01402b1 RB |
381 | return -ENOEXEC; |
382 | } | |
383 | ||
384 | *location = (*location & 0xffff0000) | (rel & 0xffff); | |
385 | ||
386 | return 0; | |
387 | } | |
388 | ||
389 | static int apply_r_mips_32(struct module *me, uint32_t *location, | |
390 | Elf32_Addr v) | |
391 | { | |
392 | *location += v; | |
393 | ||
394 | return 0; | |
395 | } | |
396 | ||
397 | static int apply_r_mips_26(struct module *me, uint32_t *location, | |
398 | Elf32_Addr v) | |
399 | { | |
400 | if (v % 4) { | |
2600990e RB |
401 | printk(KERN_DEBUG "VPE loader: apply_r_mips_26 " |
402 | " unaligned relocation\n"); | |
e01402b1 RB |
403 | return -ENOEXEC; |
404 | } | |
405 | ||
307bd284 RB |
406 | /* |
407 | * Not desperately convinced this is a good check of an overflow condition | |
408 | * anyway. But it gets in the way of handling undefined weak symbols which | |
409 | * we want to set to zero. | |
410 | * if ((v & 0xf0000000) != (((unsigned long)location + 4) & 0xf0000000)) { | |
411 | * printk(KERN_ERR | |
412 | * "module %s: relocation overflow\n", | |
413 | * me->name); | |
414 | * return -ENOEXEC; | |
415 | * } | |
416 | */ | |
e01402b1 RB |
417 | |
418 | *location = (*location & ~0x03ffffff) | | |
419 | ((*location + (v >> 2)) & 0x03ffffff); | |
420 | return 0; | |
421 | } | |
422 | ||
423 | static int apply_r_mips_hi16(struct module *me, uint32_t *location, | |
424 | Elf32_Addr v) | |
425 | { | |
426 | struct mips_hi16 *n; | |
427 | ||
428 | /* | |
429 | * We cannot relocate this one now because we don't know the value of | |
430 | * the carry we need to add. Save the information, and let LO16 do the | |
431 | * actual relocation. | |
432 | */ | |
433 | n = kmalloc(sizeof *n, GFP_KERNEL); | |
434 | if (!n) | |
435 | return -ENOMEM; | |
436 | ||
437 | n->addr = location; | |
438 | n->value = v; | |
439 | n->next = mips_hi16_list; | |
440 | mips_hi16_list = n; | |
441 | ||
442 | return 0; | |
443 | } | |
444 | ||
445 | static int apply_r_mips_lo16(struct module *me, uint32_t *location, | |
446 | Elf32_Addr v) | |
447 | { | |
448 | unsigned long insnlo = *location; | |
449 | Elf32_Addr val, vallo; | |
450 | ||
451 | /* Sign extend the addend we extract from the lo insn. */ | |
452 | vallo = ((insnlo & 0xffff) ^ 0x8000) - 0x8000; | |
453 | ||
454 | if (mips_hi16_list != NULL) { | |
455 | struct mips_hi16 *l; | |
456 | ||
457 | l = mips_hi16_list; | |
458 | while (l != NULL) { | |
459 | struct mips_hi16 *next; | |
460 | unsigned long insn; | |
461 | ||
462 | /* | |
463 | * The value for the HI16 had best be the same. | |
464 | */ | |
2600990e RB |
465 | if (v != l->value) { |
466 | printk(KERN_DEBUG "VPE loader: " | |
467 | "apply_r_mips_lo16/hi16: " | |
468 | "inconsistent value information\n"); | |
469 | return -ENOEXEC; | |
e01402b1 RB |
470 | } |
471 | ||
e01402b1 RB |
472 | /* |
473 | * Do the HI16 relocation. Note that we actually don't | |
474 | * need to know anything about the LO16 itself, except | |
475 | * where to find the low 16 bits of the addend needed | |
476 | * by the LO16. | |
477 | */ | |
478 | insn = *l->addr; | |
479 | val = ((insn & 0xffff) << 16) + vallo; | |
480 | val += v; | |
481 | ||
482 | /* | |
483 | * Account for the sign extension that will happen in | |
484 | * the low bits. | |
485 | */ | |
486 | val = ((val >> 16) + ((val & 0x8000) != 0)) & 0xffff; | |
487 | ||
488 | insn = (insn & ~0xffff) | val; | |
489 | *l->addr = insn; | |
490 | ||
491 | next = l->next; | |
492 | kfree(l); | |
493 | l = next; | |
494 | } | |
495 | ||
496 | mips_hi16_list = NULL; | |
497 | } | |
498 | ||
499 | /* | |
500 | * Ok, we're done with the HI16 relocs. Now deal with the LO16. | |
501 | */ | |
502 | val = v + vallo; | |
503 | insnlo = (insnlo & ~0xffff) | (val & 0xffff); | |
504 | *location = insnlo; | |
505 | ||
506 | return 0; | |
e01402b1 RB |
507 | } |
508 | ||
509 | static int (*reloc_handlers[]) (struct module *me, uint32_t *location, | |
510 | Elf32_Addr v) = { | |
511 | [R_MIPS_NONE] = apply_r_mips_none, | |
512 | [R_MIPS_32] = apply_r_mips_32, | |
513 | [R_MIPS_26] = apply_r_mips_26, | |
514 | [R_MIPS_HI16] = apply_r_mips_hi16, | |
515 | [R_MIPS_LO16] = apply_r_mips_lo16, | |
516 | [R_MIPS_GPREL16] = apply_r_mips_gprel16, | |
517 | [R_MIPS_PC16] = apply_r_mips_pc16 | |
518 | }; | |
519 | ||
2600990e | 520 | static char *rstrs[] = { |
e0daad44 | 521 | [R_MIPS_NONE] = "MIPS_NONE", |
2600990e RB |
522 | [R_MIPS_32] = "MIPS_32", |
523 | [R_MIPS_26] = "MIPS_26", | |
524 | [R_MIPS_HI16] = "MIPS_HI16", | |
525 | [R_MIPS_LO16] = "MIPS_LO16", | |
526 | [R_MIPS_GPREL16] = "MIPS_GPREL16", | |
527 | [R_MIPS_PC16] = "MIPS_PC16" | |
528 | }; | |
e01402b1 RB |
529 | |
530 | int apply_relocations(Elf32_Shdr *sechdrs, | |
531 | const char *strtab, | |
532 | unsigned int symindex, | |
533 | unsigned int relsec, | |
534 | struct module *me) | |
535 | { | |
536 | Elf32_Rel *rel = (void *) sechdrs[relsec].sh_addr; | |
537 | Elf32_Sym *sym; | |
538 | uint32_t *location; | |
539 | unsigned int i; | |
540 | Elf32_Addr v; | |
541 | int res; | |
542 | ||
543 | for (i = 0; i < sechdrs[relsec].sh_size / sizeof(*rel); i++) { | |
544 | Elf32_Word r_info = rel[i].r_info; | |
545 | ||
546 | /* This is where to make the change */ | |
547 | location = (void *)sechdrs[sechdrs[relsec].sh_info].sh_addr | |
548 | + rel[i].r_offset; | |
549 | /* This is the symbol it is referring to */ | |
550 | sym = (Elf32_Sym *)sechdrs[symindex].sh_addr | |
551 | + ELF32_R_SYM(r_info); | |
552 | ||
553 | if (!sym->st_value) { | |
554 | printk(KERN_DEBUG "%s: undefined weak symbol %s\n", | |
555 | me->name, strtab + sym->st_name); | |
556 | /* just print the warning, dont barf */ | |
557 | } | |
558 | ||
559 | v = sym->st_value; | |
560 | ||
561 | res = reloc_handlers[ELF32_R_TYPE(r_info)](me, location, v); | |
562 | if( res ) { | |
2600990e RB |
563 | char *r = rstrs[ELF32_R_TYPE(r_info)]; |
564 | printk(KERN_WARNING "VPE loader: .text+0x%x " | |
565 | "relocation type %s for symbol \"%s\" failed\n", | |
566 | rel[i].r_offset, r ? r : "UNKNOWN", | |
567 | strtab + sym->st_name); | |
e01402b1 | 568 | return res; |
2600990e | 569 | } |
e01402b1 RB |
570 | } |
571 | ||
572 | return 0; | |
573 | } | |
574 | ||
575 | void save_gp_address(unsigned int secbase, unsigned int rel) | |
576 | { | |
577 | gp_addr = secbase + rel; | |
578 | gp_offs = gp_addr - (secbase & 0xffff0000); | |
579 | } | |
580 | /* end module-elf32.c */ | |
581 | ||
582 | ||
583 | ||
584 | /* Change all symbols so that sh_value encodes the pointer directly. */ | |
2600990e | 585 | static void simplify_symbols(Elf_Shdr * sechdrs, |
e01402b1 RB |
586 | unsigned int symindex, |
587 | const char *strtab, | |
588 | const char *secstrings, | |
589 | unsigned int nsecs, struct module *mod) | |
590 | { | |
591 | Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; | |
592 | unsigned long secbase, bssbase = 0; | |
593 | unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); | |
2600990e | 594 | int size; |
e01402b1 RB |
595 | |
596 | /* find the .bss section for COMMON symbols */ | |
597 | for (i = 0; i < nsecs; i++) { | |
2600990e | 598 | if (strncmp(secstrings + sechdrs[i].sh_name, ".bss", 4) == 0) { |
e01402b1 | 599 | bssbase = sechdrs[i].sh_addr; |
2600990e RB |
600 | break; |
601 | } | |
e01402b1 RB |
602 | } |
603 | ||
604 | for (i = 1; i < n; i++) { | |
605 | switch (sym[i].st_shndx) { | |
606 | case SHN_COMMON: | |
2600990e RB |
607 | /* Allocate space for the symbol in the .bss section. |
608 | st_value is currently size. | |
e01402b1 RB |
609 | We want it to have the address of the symbol. */ |
610 | ||
611 | size = sym[i].st_value; | |
612 | sym[i].st_value = bssbase; | |
613 | ||
614 | bssbase += size; | |
615 | break; | |
616 | ||
617 | case SHN_ABS: | |
618 | /* Don't need to do anything */ | |
619 | break; | |
620 | ||
621 | case SHN_UNDEF: | |
622 | /* ret = -ENOENT; */ | |
623 | break; | |
624 | ||
625 | case SHN_MIPS_SCOMMON: | |
2600990e RB |
626 | printk(KERN_DEBUG "simplify_symbols: ignoring SHN_MIPS_SCOMMON" |
627 | "symbol <%s> st_shndx %d\n", strtab + sym[i].st_name, | |
628 | sym[i].st_shndx); | |
e01402b1 RB |
629 | // .sbss section |
630 | break; | |
631 | ||
632 | default: | |
633 | secbase = sechdrs[sym[i].st_shndx].sh_addr; | |
634 | ||
635 | if (strncmp(strtab + sym[i].st_name, "_gp", 3) == 0) { | |
636 | save_gp_address(secbase, sym[i].st_value); | |
637 | } | |
638 | ||
639 | sym[i].st_value += secbase; | |
640 | break; | |
641 | } | |
e01402b1 | 642 | } |
e01402b1 RB |
643 | } |
644 | ||
645 | #ifdef DEBUG_ELFLOADER | |
646 | static void dump_elfsymbols(Elf_Shdr * sechdrs, unsigned int symindex, | |
647 | const char *strtab, struct module *mod) | |
648 | { | |
649 | Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; | |
650 | unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); | |
651 | ||
652 | printk(KERN_DEBUG "dump_elfsymbols: n %d\n", n); | |
653 | for (i = 1; i < n; i++) { | |
654 | printk(KERN_DEBUG " i %d name <%s> 0x%x\n", i, | |
655 | strtab + sym[i].st_name, sym[i].st_value); | |
656 | } | |
657 | } | |
658 | #endif | |
659 | ||
e01402b1 | 660 | /* We are prepared so configure and start the VPE... */ |
be6e1437 | 661 | static int vpe_run(struct vpe * v) |
e01402b1 | 662 | { |
07cc0c9e | 663 | unsigned long flags, val, dmt_flag; |
2600990e | 664 | struct vpe_notifications *n; |
07cc0c9e | 665 | unsigned int vpeflags; |
e01402b1 RB |
666 | struct tc *t; |
667 | ||
668 | /* check we are the Master VPE */ | |
07cc0c9e | 669 | local_irq_save(flags); |
e01402b1 RB |
670 | val = read_c0_vpeconf0(); |
671 | if (!(val & VPECONF0_MVP)) { | |
672 | printk(KERN_WARNING | |
2600990e | 673 | "VPE loader: only Master VPE's are allowed to configure MT\n"); |
07cc0c9e RB |
674 | local_irq_restore(flags); |
675 | ||
e01402b1 RB |
676 | return -1; |
677 | } | |
678 | ||
07cc0c9e RB |
679 | dmt_flag = dmt(); |
680 | vpeflags = dvpe(); | |
e01402b1 | 681 | |
2600990e | 682 | if (!list_empty(&v->tc)) { |
e0daad44 | 683 | if ((t = list_entry(v->tc.next, struct tc, tc)) == NULL) { |
07cc0c9e RB |
684 | evpe(vpeflags); |
685 | emt(dmt_flag); | |
686 | local_irq_restore(flags); | |
687 | ||
688 | printk(KERN_WARNING | |
689 | "VPE loader: TC %d is already in use.\n", | |
690 | t->index); | |
e0daad44 RB |
691 | return -ENOEXEC; |
692 | } | |
693 | } else { | |
07cc0c9e RB |
694 | evpe(vpeflags); |
695 | emt(dmt_flag); | |
696 | local_irq_restore(flags); | |
697 | ||
698 | printk(KERN_WARNING | |
699 | "VPE loader: No TC's associated with VPE %d\n", | |
e0daad44 | 700 | v->minor); |
07cc0c9e | 701 | |
e0daad44 RB |
702 | return -ENOEXEC; |
703 | } | |
2600990e | 704 | |
e01402b1 | 705 | /* Put MVPE's into 'configuration state' */ |
340ee4b9 | 706 | set_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 | 707 | |
e01402b1 RB |
708 | settc(t->index); |
709 | ||
e01402b1 RB |
710 | /* should check it is halted, and not activated */ |
711 | if ((read_tc_c0_tcstatus() & TCSTATUS_A) || !(read_tc_c0_tchalt() & TCHALT_H)) { | |
07cc0c9e RB |
712 | evpe(vpeflags); |
713 | emt(dmt_flag); | |
714 | local_irq_restore(flags); | |
715 | ||
716 | printk(KERN_WARNING "VPE loader: TC %d is already active!\n", | |
e01402b1 | 717 | t->index); |
07cc0c9e | 718 | |
e01402b1 RB |
719 | return -ENOEXEC; |
720 | } | |
721 | ||
722 | /* Write the address we want it to start running from in the TCPC register. */ | |
723 | write_tc_c0_tcrestart((unsigned long)v->__start); | |
e01402b1 | 724 | write_tc_c0_tccontext((unsigned long)0); |
07cc0c9e | 725 | |
2600990e RB |
726 | /* |
727 | * Mark the TC as activated, not interrupt exempt and not dynamically | |
728 | * allocatable | |
729 | */ | |
e01402b1 RB |
730 | val = read_tc_c0_tcstatus(); |
731 | val = (val & ~(TCSTATUS_DA | TCSTATUS_IXMT)) | TCSTATUS_A; | |
732 | write_tc_c0_tcstatus(val); | |
733 | ||
734 | write_tc_c0_tchalt(read_tc_c0_tchalt() & ~TCHALT_H); | |
735 | ||
e01402b1 RB |
736 | /* |
737 | * The sde-kit passes 'memsize' to __start in $a3, so set something | |
2600990e | 738 | * here... Or set $a3 to zero and define DFLT_STACK_SIZE and |
e01402b1 RB |
739 | * DFLT_HEAP_SIZE when you compile your program |
740 | */ | |
07cc0c9e | 741 | mttgpr(7, physical_memsize); |
2600990e RB |
742 | |
743 | /* set up VPE1 */ | |
744 | /* | |
745 | * bind the TC to VPE 1 as late as possible so we only have the final | |
746 | * VPE registers to set up, and so an EJTAG probe can trigger on it | |
747 | */ | |
07cc0c9e | 748 | write_tc_c0_tcbind((read_tc_c0_tcbind() & ~TCBIND_CURVPE) | 1); |
e01402b1 | 749 | |
a94d7020 EO |
750 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~(VPECONF0_VPA)); |
751 | ||
752 | back_to_back_c0_hazard(); | |
753 | ||
e0daad44 RB |
754 | /* Set up the XTC bit in vpeconf0 to point at our tc */ |
755 | write_vpe_c0_vpeconf0( (read_vpe_c0_vpeconf0() & ~(VPECONF0_XTC)) | |
756 | | (t->index << VPECONF0_XTC_SHIFT)); | |
e01402b1 | 757 | |
a94d7020 EO |
758 | back_to_back_c0_hazard(); |
759 | ||
e0daad44 RB |
760 | /* enable this VPE */ |
761 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() | VPECONF0_VPA); | |
e01402b1 RB |
762 | |
763 | /* clear out any left overs from a previous program */ | |
2600990e | 764 | write_vpe_c0_status(0); |
e01402b1 RB |
765 | write_vpe_c0_cause(0); |
766 | ||
767 | /* take system out of configuration state */ | |
340ee4b9 | 768 | clear_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 | 769 | |
07cc0c9e | 770 | #ifdef CONFIG_SMP |
e01402b1 | 771 | evpe(EVPE_ENABLE); |
07cc0c9e RB |
772 | #else |
773 | evpe(vpeflags); | |
774 | #endif | |
775 | emt(dmt_flag); | |
776 | local_irq_restore(flags); | |
e01402b1 | 777 | |
07cc0c9e RB |
778 | list_for_each_entry(n, &v->notify, list) |
779 | n->start(minor); | |
2600990e | 780 | |
e01402b1 RB |
781 | return 0; |
782 | } | |
783 | ||
2600990e | 784 | static int find_vpe_symbols(struct vpe * v, Elf_Shdr * sechdrs, |
e01402b1 RB |
785 | unsigned int symindex, const char *strtab, |
786 | struct module *mod) | |
787 | { | |
788 | Elf_Sym *sym = (void *)sechdrs[symindex].sh_addr; | |
789 | unsigned int i, n = sechdrs[symindex].sh_size / sizeof(Elf_Sym); | |
790 | ||
791 | for (i = 1; i < n; i++) { | |
792 | if (strcmp(strtab + sym[i].st_name, "__start") == 0) { | |
793 | v->__start = sym[i].st_value; | |
794 | } | |
795 | ||
796 | if (strcmp(strtab + sym[i].st_name, "vpe_shared") == 0) { | |
797 | v->shared_ptr = (void *)sym[i].st_value; | |
798 | } | |
799 | } | |
800 | ||
2600990e RB |
801 | if ( (v->__start == 0) || (v->shared_ptr == NULL)) |
802 | return -1; | |
803 | ||
e01402b1 RB |
804 | return 0; |
805 | } | |
806 | ||
307bd284 | 807 | /* |
2600990e RB |
808 | * Allocates a VPE with some program code space(the load address), copies the |
809 | * contents of the program (p)buffer performing relocatations/etc, free's it | |
810 | * when finished. | |
811 | */ | |
be6e1437 | 812 | static int vpe_elfload(struct vpe * v) |
e01402b1 RB |
813 | { |
814 | Elf_Ehdr *hdr; | |
815 | Elf_Shdr *sechdrs; | |
816 | long err = 0; | |
817 | char *secstrings, *strtab = NULL; | |
2600990e | 818 | unsigned int len, i, symindex = 0, strindex = 0, relocate = 0; |
e01402b1 RB |
819 | struct module mod; // so we can re-use the relocations code |
820 | ||
821 | memset(&mod, 0, sizeof(struct module)); | |
2600990e | 822 | strcpy(mod.name, "VPE loader"); |
e01402b1 RB |
823 | |
824 | hdr = (Elf_Ehdr *) v->pbuffer; | |
825 | len = v->plen; | |
826 | ||
827 | /* Sanity checks against insmoding binaries or wrong arch, | |
828 | weird elf version */ | |
829 | if (memcmp(hdr->e_ident, ELFMAG, 4) != 0 | |
2600990e RB |
830 | || (hdr->e_type != ET_REL && hdr->e_type != ET_EXEC) |
831 | || !elf_check_arch(hdr) | |
e01402b1 RB |
832 | || hdr->e_shentsize != sizeof(*sechdrs)) { |
833 | printk(KERN_WARNING | |
2600990e | 834 | "VPE loader: program wrong arch or weird elf version\n"); |
e01402b1 RB |
835 | |
836 | return -ENOEXEC; | |
837 | } | |
838 | ||
2600990e RB |
839 | if (hdr->e_type == ET_REL) |
840 | relocate = 1; | |
841 | ||
e01402b1 | 842 | if (len < hdr->e_shoff + hdr->e_shnum * sizeof(Elf_Shdr)) { |
2600990e RB |
843 | printk(KERN_ERR "VPE loader: program length %u truncated\n", |
844 | len); | |
845 | ||
e01402b1 RB |
846 | return -ENOEXEC; |
847 | } | |
848 | ||
849 | /* Convenience variables */ | |
850 | sechdrs = (void *)hdr + hdr->e_shoff; | |
851 | secstrings = (void *)hdr + sechdrs[hdr->e_shstrndx].sh_offset; | |
852 | sechdrs[0].sh_addr = 0; | |
853 | ||
854 | /* And these should exist, but gcc whinges if we don't init them */ | |
855 | symindex = strindex = 0; | |
856 | ||
2600990e RB |
857 | if (relocate) { |
858 | for (i = 1; i < hdr->e_shnum; i++) { | |
859 | if (sechdrs[i].sh_type != SHT_NOBITS | |
860 | && len < sechdrs[i].sh_offset + sechdrs[i].sh_size) { | |
861 | printk(KERN_ERR "VPE program length %u truncated\n", | |
862 | len); | |
863 | return -ENOEXEC; | |
864 | } | |
e01402b1 | 865 | |
2600990e RB |
866 | /* Mark all sections sh_addr with their address in the |
867 | temporary image. */ | |
868 | sechdrs[i].sh_addr = (size_t) hdr + sechdrs[i].sh_offset; | |
e01402b1 | 869 | |
2600990e RB |
870 | /* Internal symbols and strings. */ |
871 | if (sechdrs[i].sh_type == SHT_SYMTAB) { | |
872 | symindex = i; | |
873 | strindex = sechdrs[i].sh_link; | |
874 | strtab = (char *)hdr + sechdrs[strindex].sh_offset; | |
875 | } | |
e01402b1 | 876 | } |
2600990e | 877 | layout_sections(&mod, hdr, sechdrs, secstrings); |
e01402b1 RB |
878 | } |
879 | ||
e01402b1 RB |
880 | v->load_addr = alloc_progmem(mod.core_size); |
881 | memset(v->load_addr, 0, mod.core_size); | |
882 | ||
2600990e | 883 | printk("VPE loader: loading to %p\n", v->load_addr); |
e01402b1 | 884 | |
2600990e RB |
885 | if (relocate) { |
886 | for (i = 0; i < hdr->e_shnum; i++) { | |
887 | void *dest; | |
e01402b1 | 888 | |
2600990e RB |
889 | if (!(sechdrs[i].sh_flags & SHF_ALLOC)) |
890 | continue; | |
e01402b1 | 891 | |
2600990e | 892 | dest = v->load_addr + sechdrs[i].sh_entsize; |
e01402b1 | 893 | |
2600990e RB |
894 | if (sechdrs[i].sh_type != SHT_NOBITS) |
895 | memcpy(dest, (void *)sechdrs[i].sh_addr, | |
896 | sechdrs[i].sh_size); | |
897 | /* Update sh_addr to point to copy in image. */ | |
898 | sechdrs[i].sh_addr = (unsigned long)dest; | |
e01402b1 | 899 | |
2600990e RB |
900 | printk(KERN_DEBUG " section sh_name %s sh_addr 0x%x\n", |
901 | secstrings + sechdrs[i].sh_name, sechdrs[i].sh_addr); | |
902 | } | |
e01402b1 | 903 | |
2600990e RB |
904 | /* Fix up syms, so that st_value is a pointer to location. */ |
905 | simplify_symbols(sechdrs, symindex, strtab, secstrings, | |
906 | hdr->e_shnum, &mod); | |
907 | ||
908 | /* Now do relocations. */ | |
909 | for (i = 1; i < hdr->e_shnum; i++) { | |
910 | const char *strtab = (char *)sechdrs[strindex].sh_addr; | |
911 | unsigned int info = sechdrs[i].sh_info; | |
912 | ||
913 | /* Not a valid relocation section? */ | |
914 | if (info >= hdr->e_shnum) | |
915 | continue; | |
916 | ||
917 | /* Don't bother with non-allocated sections */ | |
918 | if (!(sechdrs[info].sh_flags & SHF_ALLOC)) | |
919 | continue; | |
920 | ||
921 | if (sechdrs[i].sh_type == SHT_REL) | |
922 | err = apply_relocations(sechdrs, strtab, symindex, i, | |
923 | &mod); | |
924 | else if (sechdrs[i].sh_type == SHT_RELA) | |
925 | err = apply_relocate_add(sechdrs, strtab, symindex, i, | |
926 | &mod); | |
927 | if (err < 0) | |
928 | return err; | |
929 | ||
930 | } | |
931 | } else { | |
932 | for (i = 0; i < hdr->e_shnum; i++) { | |
933 | ||
934 | /* Internal symbols and strings. */ | |
935 | if (sechdrs[i].sh_type == SHT_SYMTAB) { | |
936 | symindex = i; | |
937 | strindex = sechdrs[i].sh_link; | |
938 | strtab = (char *)hdr + sechdrs[strindex].sh_offset; | |
939 | ||
940 | /* mark the symtab's address for when we try to find the | |
941 | magic symbols */ | |
942 | sechdrs[i].sh_addr = (size_t) hdr + sechdrs[i].sh_offset; | |
943 | } | |
944 | ||
945 | /* filter sections we dont want in the final image */ | |
946 | if (!(sechdrs[i].sh_flags & SHF_ALLOC) || | |
947 | (sechdrs[i].sh_type == SHT_MIPS_REGINFO)) { | |
948 | printk( KERN_DEBUG " ignoring section, " | |
949 | "name %s type %x address 0x%x \n", | |
950 | secstrings + sechdrs[i].sh_name, | |
951 | sechdrs[i].sh_type, sechdrs[i].sh_addr); | |
952 | continue; | |
953 | } | |
954 | ||
955 | if (sechdrs[i].sh_addr < (unsigned int)v->load_addr) { | |
956 | printk( KERN_WARNING "VPE loader: " | |
957 | "fully linked image has invalid section, " | |
958 | "name %s type %x address 0x%x, before load " | |
959 | "address of 0x%x\n", | |
960 | secstrings + sechdrs[i].sh_name, | |
961 | sechdrs[i].sh_type, sechdrs[i].sh_addr, | |
962 | (unsigned int)v->load_addr); | |
963 | return -ENOEXEC; | |
964 | } | |
965 | ||
966 | printk(KERN_DEBUG " copying section sh_name %s, sh_addr 0x%x " | |
967 | "size 0x%x0 from x%p\n", | |
968 | secstrings + sechdrs[i].sh_name, sechdrs[i].sh_addr, | |
969 | sechdrs[i].sh_size, hdr + sechdrs[i].sh_offset); | |
970 | ||
971 | if (sechdrs[i].sh_type != SHT_NOBITS) | |
972 | memcpy((void *)sechdrs[i].sh_addr, | |
973 | (char *)hdr + sechdrs[i].sh_offset, | |
974 | sechdrs[i].sh_size); | |
975 | else | |
976 | memset((void *)sechdrs[i].sh_addr, 0, sechdrs[i].sh_size); | |
e01402b1 RB |
977 | } |
978 | } | |
979 | ||
980 | /* make sure it's physically written out */ | |
981 | flush_icache_range((unsigned long)v->load_addr, | |
982 | (unsigned long)v->load_addr + v->len); | |
983 | ||
984 | if ((find_vpe_symbols(v, sechdrs, symindex, strtab, &mod)) < 0) { | |
2600990e RB |
985 | if (v->__start == 0) { |
986 | printk(KERN_WARNING "VPE loader: program does not contain " | |
987 | "a __start symbol\n"); | |
988 | return -ENOEXEC; | |
989 | } | |
e01402b1 | 990 | |
2600990e RB |
991 | if (v->shared_ptr == NULL) |
992 | printk(KERN_WARNING "VPE loader: " | |
993 | "program does not contain vpe_shared symbol.\n" | |
994 | " Unable to use AMVP (AP/SP) facilities.\n"); | |
e01402b1 RB |
995 | } |
996 | ||
997 | printk(" elf loaded\n"); | |
2600990e | 998 | return 0; |
e01402b1 RB |
999 | } |
1000 | ||
2600990e RB |
1001 | static void cleanup_tc(struct tc *tc) |
1002 | { | |
07cc0c9e RB |
1003 | unsigned long flags; |
1004 | unsigned int mtflags, vpflags; | |
2600990e RB |
1005 | int tmp; |
1006 | ||
07cc0c9e RB |
1007 | local_irq_save(flags); |
1008 | mtflags = dmt(); | |
1009 | vpflags = dvpe(); | |
2600990e RB |
1010 | /* Put MVPE's into 'configuration state' */ |
1011 | set_c0_mvpcontrol(MVPCONTROL_VPC); | |
1012 | ||
1013 | settc(tc->index); | |
1014 | tmp = read_tc_c0_tcstatus(); | |
1015 | ||
1016 | /* mark not allocated and not dynamically allocatable */ | |
1017 | tmp &= ~(TCSTATUS_A | TCSTATUS_DA); | |
1018 | tmp |= TCSTATUS_IXMT; /* interrupt exempt */ | |
1019 | write_tc_c0_tcstatus(tmp); | |
1020 | ||
1021 | write_tc_c0_tchalt(TCHALT_H); | |
1022 | ||
1023 | /* bind it to anything other than VPE1 */ | |
07cc0c9e | 1024 | // write_tc_c0_tcbind(read_tc_c0_tcbind() & ~TCBIND_CURVPE); // | TCBIND_CURVPE |
2600990e RB |
1025 | |
1026 | clear_c0_mvpcontrol(MVPCONTROL_VPC); | |
07cc0c9e RB |
1027 | evpe(vpflags); |
1028 | emt(mtflags); | |
1029 | local_irq_restore(flags); | |
2600990e RB |
1030 | } |
1031 | ||
1032 | static int getcwd(char *buff, int size) | |
1033 | { | |
1034 | mm_segment_t old_fs; | |
1035 | int ret; | |
1036 | ||
1037 | old_fs = get_fs(); | |
1038 | set_fs(KERNEL_DS); | |
1039 | ||
1040 | ret = sys_getcwd(buff,size); | |
1041 | ||
1042 | set_fs(old_fs); | |
1043 | ||
1044 | return ret; | |
1045 | } | |
1046 | ||
1047 | /* checks VPE is unused and gets ready to load program */ | |
e01402b1 RB |
1048 | static int vpe_open(struct inode *inode, struct file *filp) |
1049 | { | |
c4c4018b | 1050 | enum vpe_state state; |
2600990e | 1051 | struct vpe_notifications *not; |
07cc0c9e RB |
1052 | struct vpe *v; |
1053 | int ret; | |
e01402b1 | 1054 | |
07cc0c9e RB |
1055 | if (minor != iminor(inode)) { |
1056 | /* assume only 1 device at the moment. */ | |
2600990e | 1057 | printk(KERN_WARNING "VPE loader: only vpe1 is supported\n"); |
e01402b1 RB |
1058 | return -ENODEV; |
1059 | } | |
1060 | ||
07cc0c9e | 1061 | if ((v = get_vpe(tclimit)) == NULL) { |
2600990e | 1062 | printk(KERN_WARNING "VPE loader: unable to get vpe\n"); |
e01402b1 RB |
1063 | return -ENODEV; |
1064 | } | |
1065 | ||
c4c4018b RB |
1066 | state = xchg(&v->state, VPE_STATE_INUSE); |
1067 | if (state != VPE_STATE_UNUSED) { | |
2600990e | 1068 | printk(KERN_DEBUG "VPE loader: tc in use dumping regs\n"); |
e01402b1 | 1069 | |
2600990e | 1070 | list_for_each_entry(not, &v->notify, list) { |
07cc0c9e | 1071 | not->stop(tclimit); |
2600990e | 1072 | } |
e01402b1 | 1073 | |
2600990e | 1074 | release_progmem(v->load_addr); |
07cc0c9e | 1075 | cleanup_tc(get_tc(tclimit)); |
e01402b1 RB |
1076 | } |
1077 | ||
e01402b1 RB |
1078 | /* this of-course trashes what was there before... */ |
1079 | v->pbuffer = vmalloc(P_SIZE); | |
1080 | v->plen = P_SIZE; | |
1081 | v->load_addr = NULL; | |
1082 | v->len = 0; | |
1083 | ||
2600990e RB |
1084 | v->uid = filp->f_uid; |
1085 | v->gid = filp->f_gid; | |
1086 | ||
1087 | #ifdef CONFIG_MIPS_APSP_KSPD | |
1088 | /* get kspd to tell us when a syscall_exit happens */ | |
1089 | if (!kspd_events_reqd) { | |
1090 | kspd_notify(&kspd_events); | |
1091 | kspd_events_reqd++; | |
1092 | } | |
1093 | #endif | |
1094 | ||
1095 | v->cwd[0] = 0; | |
1096 | ret = getcwd(v->cwd, VPE_PATH_MAX); | |
1097 | if (ret < 0) | |
1098 | printk(KERN_WARNING "VPE loader: open, getcwd returned %d\n", ret); | |
1099 | ||
1100 | v->shared_ptr = NULL; | |
1101 | v->__start = 0; | |
07cc0c9e | 1102 | |
e01402b1 RB |
1103 | return 0; |
1104 | } | |
1105 | ||
1106 | static int vpe_release(struct inode *inode, struct file *filp) | |
1107 | { | |
307bd284 | 1108 | struct vpe *v; |
e01402b1 | 1109 | Elf_Ehdr *hdr; |
07cc0c9e | 1110 | int ret = 0; |
e01402b1 | 1111 | |
07cc0c9e RB |
1112 | v = get_vpe(tclimit); |
1113 | if (v == NULL) | |
e01402b1 RB |
1114 | return -ENODEV; |
1115 | ||
e01402b1 RB |
1116 | hdr = (Elf_Ehdr *) v->pbuffer; |
1117 | if (memcmp(hdr->e_ident, ELFMAG, 4) == 0) { | |
07cc0c9e | 1118 | if (vpe_elfload(v) >= 0) { |
e01402b1 | 1119 | vpe_run(v); |
07cc0c9e | 1120 | } else { |
2600990e | 1121 | printk(KERN_WARNING "VPE loader: ELF load failed.\n"); |
e01402b1 RB |
1122 | ret = -ENOEXEC; |
1123 | } | |
1124 | } else { | |
2600990e | 1125 | printk(KERN_WARNING "VPE loader: only elf files are supported\n"); |
e01402b1 RB |
1126 | ret = -ENOEXEC; |
1127 | } | |
1128 | ||
2600990e RB |
1129 | /* It's good to be able to run the SP and if it chokes have a look at |
1130 | the /dev/rt?. But if we reset the pointer to the shared struct we | |
1131 | loose what has happened. So perhaps if garbage is sent to the vpe | |
1132 | device, use it as a trigger for the reset. Hopefully a nice | |
1133 | executable will be along shortly. */ | |
1134 | if (ret < 0) | |
1135 | v->shared_ptr = NULL; | |
1136 | ||
e01402b1 RB |
1137 | // cleanup any temp buffers |
1138 | if (v->pbuffer) | |
1139 | vfree(v->pbuffer); | |
1140 | v->plen = 0; | |
1141 | return ret; | |
1142 | } | |
1143 | ||
1144 | static ssize_t vpe_write(struct file *file, const char __user * buffer, | |
1145 | size_t count, loff_t * ppos) | |
1146 | { | |
e01402b1 | 1147 | size_t ret = count; |
307bd284 | 1148 | struct vpe *v; |
e01402b1 | 1149 | |
07cc0c9e RB |
1150 | if (iminor(file->f_path.dentry->d_inode) != minor) |
1151 | return -ENODEV; | |
1152 | ||
1153 | v = get_vpe(tclimit); | |
1154 | if (v == NULL) | |
e01402b1 RB |
1155 | return -ENODEV; |
1156 | ||
1157 | if (v->pbuffer == NULL) { | |
2600990e | 1158 | printk(KERN_ERR "VPE loader: no buffer for program\n"); |
e01402b1 RB |
1159 | return -ENOMEM; |
1160 | } | |
1161 | ||
1162 | if ((count + v->len) > v->plen) { | |
1163 | printk(KERN_WARNING | |
2600990e | 1164 | "VPE loader: elf size too big. Perhaps strip uneeded symbols\n"); |
e01402b1 RB |
1165 | return -ENOMEM; |
1166 | } | |
1167 | ||
1168 | count -= copy_from_user(v->pbuffer + v->len, buffer, count); | |
2600990e | 1169 | if (!count) |
e01402b1 | 1170 | return -EFAULT; |
e01402b1 RB |
1171 | |
1172 | v->len += count; | |
1173 | return ret; | |
1174 | } | |
1175 | ||
5dfe4c96 | 1176 | static const struct file_operations vpe_fops = { |
e01402b1 RB |
1177 | .owner = THIS_MODULE, |
1178 | .open = vpe_open, | |
1179 | .release = vpe_release, | |
1180 | .write = vpe_write | |
1181 | }; | |
1182 | ||
1183 | /* module wrapper entry points */ | |
1184 | /* give me a vpe */ | |
1185 | vpe_handle vpe_alloc(void) | |
1186 | { | |
1187 | int i; | |
1188 | struct vpe *v; | |
1189 | ||
1190 | /* find a vpe */ | |
1191 | for (i = 1; i < MAX_VPES; i++) { | |
1192 | if ((v = get_vpe(i)) != NULL) { | |
1193 | v->state = VPE_STATE_INUSE; | |
1194 | return v; | |
1195 | } | |
1196 | } | |
1197 | return NULL; | |
1198 | } | |
1199 | ||
1200 | EXPORT_SYMBOL(vpe_alloc); | |
1201 | ||
1202 | /* start running from here */ | |
1203 | int vpe_start(vpe_handle vpe, unsigned long start) | |
1204 | { | |
1205 | struct vpe *v = vpe; | |
1206 | ||
1207 | v->__start = start; | |
1208 | return vpe_run(v); | |
1209 | } | |
1210 | ||
1211 | EXPORT_SYMBOL(vpe_start); | |
1212 | ||
1213 | /* halt it for now */ | |
1214 | int vpe_stop(vpe_handle vpe) | |
1215 | { | |
1216 | struct vpe *v = vpe; | |
1217 | struct tc *t; | |
1218 | unsigned int evpe_flags; | |
1219 | ||
1220 | evpe_flags = dvpe(); | |
1221 | ||
1222 | if ((t = list_entry(v->tc.next, struct tc, tc)) != NULL) { | |
1223 | ||
1224 | settc(t->index); | |
1225 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~VPECONF0_VPA); | |
1226 | } | |
1227 | ||
1228 | evpe(evpe_flags); | |
1229 | ||
1230 | return 0; | |
1231 | } | |
1232 | ||
1233 | EXPORT_SYMBOL(vpe_stop); | |
1234 | ||
1235 | /* I've done with it thank you */ | |
1236 | int vpe_free(vpe_handle vpe) | |
1237 | { | |
1238 | struct vpe *v = vpe; | |
1239 | struct tc *t; | |
1240 | unsigned int evpe_flags; | |
1241 | ||
1242 | if ((t = list_entry(v->tc.next, struct tc, tc)) == NULL) { | |
1243 | return -ENOEXEC; | |
1244 | } | |
1245 | ||
1246 | evpe_flags = dvpe(); | |
1247 | ||
1248 | /* Put MVPE's into 'configuration state' */ | |
340ee4b9 | 1249 | set_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 RB |
1250 | |
1251 | settc(t->index); | |
1252 | write_vpe_c0_vpeconf0(read_vpe_c0_vpeconf0() & ~VPECONF0_VPA); | |
1253 | ||
1254 | /* mark the TC unallocated and halt'ed */ | |
1255 | write_tc_c0_tcstatus(read_tc_c0_tcstatus() & ~TCSTATUS_A); | |
1256 | write_tc_c0_tchalt(TCHALT_H); | |
1257 | ||
1258 | v->state = VPE_STATE_UNUSED; | |
1259 | ||
340ee4b9 | 1260 | clear_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 RB |
1261 | evpe(evpe_flags); |
1262 | ||
1263 | return 0; | |
1264 | } | |
1265 | ||
1266 | EXPORT_SYMBOL(vpe_free); | |
1267 | ||
1268 | void *vpe_get_shared(int index) | |
1269 | { | |
1270 | struct vpe *v; | |
1271 | ||
2600990e | 1272 | if ((v = get_vpe(index)) == NULL) |
e01402b1 | 1273 | return NULL; |
e01402b1 RB |
1274 | |
1275 | return v->shared_ptr; | |
1276 | } | |
1277 | ||
1278 | EXPORT_SYMBOL(vpe_get_shared); | |
1279 | ||
2600990e RB |
1280 | int vpe_getuid(int index) |
1281 | { | |
1282 | struct vpe *v; | |
1283 | ||
1284 | if ((v = get_vpe(index)) == NULL) | |
1285 | return -1; | |
1286 | ||
1287 | return v->uid; | |
1288 | } | |
1289 | ||
1290 | EXPORT_SYMBOL(vpe_getuid); | |
1291 | ||
1292 | int vpe_getgid(int index) | |
1293 | { | |
1294 | struct vpe *v; | |
1295 | ||
1296 | if ((v = get_vpe(index)) == NULL) | |
1297 | return -1; | |
1298 | ||
1299 | return v->gid; | |
1300 | } | |
1301 | ||
1302 | EXPORT_SYMBOL(vpe_getgid); | |
1303 | ||
1304 | int vpe_notify(int index, struct vpe_notifications *notify) | |
1305 | { | |
1306 | struct vpe *v; | |
1307 | ||
1308 | if ((v = get_vpe(index)) == NULL) | |
1309 | return -1; | |
1310 | ||
1311 | list_add(¬ify->list, &v->notify); | |
1312 | return 0; | |
1313 | } | |
1314 | ||
1315 | EXPORT_SYMBOL(vpe_notify); | |
1316 | ||
1317 | char *vpe_getcwd(int index) | |
1318 | { | |
1319 | struct vpe *v; | |
1320 | ||
1321 | if ((v = get_vpe(index)) == NULL) | |
1322 | return NULL; | |
1323 | ||
1324 | return v->cwd; | |
1325 | } | |
1326 | ||
1327 | EXPORT_SYMBOL(vpe_getcwd); | |
1328 | ||
1329 | #ifdef CONFIG_MIPS_APSP_KSPD | |
1330 | static void kspd_sp_exit( int sp_id) | |
1331 | { | |
1332 | cleanup_tc(get_tc(sp_id)); | |
1333 | } | |
1334 | #endif | |
1335 | ||
27a3bbaf RB |
1336 | static struct device *vpe_dev; |
1337 | ||
e01402b1 RB |
1338 | static int __init vpe_module_init(void) |
1339 | { | |
07cc0c9e RB |
1340 | unsigned int mtflags, vpflags; |
1341 | int hw_tcs, hw_vpes, tc, err = 0; | |
1342 | unsigned long flags, val; | |
e01402b1 | 1343 | struct vpe *v = NULL; |
27a3bbaf | 1344 | struct device *dev; |
e01402b1 | 1345 | struct tc *t; |
e01402b1 RB |
1346 | |
1347 | if (!cpu_has_mipsmt) { | |
1348 | printk("VPE loader: not a MIPS MT capable processor\n"); | |
1349 | return -ENODEV; | |
1350 | } | |
1351 | ||
07cc0c9e RB |
1352 | if (vpelimit == 0) { |
1353 | printk(KERN_WARNING "No VPEs reserved for AP/SP, not " | |
1354 | "initializing VPE loader.\nPass maxvpes=<n> argument as " | |
1355 | "kernel argument\n"); | |
1356 | ||
1357 | return -ENODEV; | |
1358 | } | |
1359 | ||
1360 | if (tclimit == 0) { | |
1361 | printk(KERN_WARNING "No TCs reserved for AP/SP, not " | |
1362 | "initializing VPE loader.\nPass maxtcs=<n> argument as " | |
1363 | "kernel argument\n"); | |
1364 | ||
1365 | return -ENODEV; | |
1366 | } | |
1367 | ||
682e852e AD |
1368 | major = register_chrdev(0, module_name, &vpe_fops); |
1369 | if (major < 0) { | |
e01402b1 | 1370 | printk("VPE loader: unable to register character device\n"); |
307bd284 | 1371 | return major; |
e01402b1 RB |
1372 | } |
1373 | ||
27a3bbaf | 1374 | dev = device_create(mt_class, NULL, MKDEV(major, minor), |
07cc0c9e | 1375 | "vpe%d", minor); |
27a3bbaf RB |
1376 | if (IS_ERR(dev)) { |
1377 | err = PTR_ERR(dev); | |
1378 | goto out_chrdev; | |
1379 | } | |
1380 | vpe_dev = dev; | |
1381 | ||
07cc0c9e RB |
1382 | local_irq_save(flags); |
1383 | mtflags = dmt(); | |
1384 | vpflags = dvpe(); | |
e01402b1 RB |
1385 | |
1386 | /* Put MVPE's into 'configuration state' */ | |
340ee4b9 | 1387 | set_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 RB |
1388 | |
1389 | /* dump_mtregs(); */ | |
1390 | ||
e01402b1 | 1391 | val = read_c0_mvpconf0(); |
07cc0c9e RB |
1392 | hw_tcs = (val & MVPCONF0_PTC) + 1; |
1393 | hw_vpes = ((val & MVPCONF0_PVPE) >> MVPCONF0_PVPE_SHIFT) + 1; | |
1394 | ||
1395 | for (tc = tclimit; tc < hw_tcs; tc++) { | |
1396 | /* | |
1397 | * Must re-enable multithreading temporarily or in case we | |
1398 | * reschedule send IPIs or similar we might hang. | |
1399 | */ | |
1400 | clear_c0_mvpcontrol(MVPCONTROL_VPC); | |
1401 | evpe(vpflags); | |
1402 | emt(mtflags); | |
1403 | local_irq_restore(flags); | |
1404 | t = alloc_tc(tc); | |
1405 | if (!t) { | |
1406 | err = -ENOMEM; | |
1407 | goto out; | |
1408 | } | |
1409 | ||
1410 | local_irq_save(flags); | |
1411 | mtflags = dmt(); | |
1412 | vpflags = dvpe(); | |
1413 | set_c0_mvpcontrol(MVPCONTROL_VPC); | |
e01402b1 RB |
1414 | |
1415 | /* VPE's */ | |
07cc0c9e RB |
1416 | if (tc < hw_tcs) { |
1417 | settc(tc); | |
e01402b1 | 1418 | |
07cc0c9e | 1419 | if ((v = alloc_vpe(tc)) == NULL) { |
e01402b1 | 1420 | printk(KERN_WARNING "VPE: unable to allocate VPE\n"); |
07cc0c9e RB |
1421 | |
1422 | goto out_reenable; | |
e01402b1 RB |
1423 | } |
1424 | ||
2600990e RB |
1425 | /* add the tc to the list of this vpe's tc's. */ |
1426 | list_add(&t->tc, &v->tc); | |
e01402b1 RB |
1427 | |
1428 | /* deactivate all but vpe0 */ | |
07cc0c9e | 1429 | if (tc >= tclimit) { |
e01402b1 RB |
1430 | unsigned long tmp = read_vpe_c0_vpeconf0(); |
1431 | ||
1432 | tmp &= ~VPECONF0_VPA; | |
1433 | ||
1434 | /* master VPE */ | |
1435 | tmp |= VPECONF0_MVP; | |
1436 | write_vpe_c0_vpeconf0(tmp); | |
1437 | } | |
1438 | ||
1439 | /* disable multi-threading with TC's */ | |
1440 | write_vpe_c0_vpecontrol(read_vpe_c0_vpecontrol() & ~VPECONTROL_TE); | |
1441 | ||
07cc0c9e | 1442 | if (tc >= vpelimit) { |
2600990e RB |
1443 | /* |
1444 | * Set config to be the same as vpe0, | |
1445 | * particularly kseg0 coherency alg | |
1446 | */ | |
e01402b1 RB |
1447 | write_vpe_c0_config(read_c0_config()); |
1448 | } | |
e01402b1 RB |
1449 | } |
1450 | ||
1451 | /* TC's */ | |
1452 | t->pvpe = v; /* set the parent vpe */ | |
1453 | ||
07cc0c9e | 1454 | if (tc >= tclimit) { |
e01402b1 RB |
1455 | unsigned long tmp; |
1456 | ||
07cc0c9e | 1457 | settc(tc); |
e01402b1 | 1458 | |
2600990e RB |
1459 | /* Any TC that is bound to VPE0 gets left as is - in case |
1460 | we are running SMTC on VPE0. A TC that is bound to any | |
1461 | other VPE gets bound to VPE0, ideally I'd like to make | |
1462 | it homeless but it doesn't appear to let me bind a TC | |
1463 | to a non-existent VPE. Which is perfectly reasonable. | |
1464 | ||
1465 | The (un)bound state is visible to an EJTAG probe so may | |
1466 | notify GDB... | |
1467 | */ | |
1468 | ||
1469 | if (((tmp = read_tc_c0_tcbind()) & TCBIND_CURVPE)) { | |
1470 | /* tc is bound >vpe0 */ | |
1471 | write_tc_c0_tcbind(tmp & ~TCBIND_CURVPE); | |
1472 | ||
1473 | t->pvpe = get_vpe(0); /* set the parent vpe */ | |
1474 | } | |
e01402b1 RB |
1475 | |
1476 | tmp = read_tc_c0_tcstatus(); | |
1477 | ||
2600990e | 1478 | /* mark not activated and not dynamically allocatable */ |
e01402b1 RB |
1479 | tmp &= ~(TCSTATUS_A | TCSTATUS_DA); |
1480 | tmp |= TCSTATUS_IXMT; /* interrupt exempt */ | |
1481 | write_tc_c0_tcstatus(tmp); | |
1482 | ||
1483 | write_tc_c0_tchalt(TCHALT_H); | |
1484 | } | |
1485 | } | |
1486 | ||
07cc0c9e | 1487 | out_reenable: |
e01402b1 | 1488 | /* release config state */ |
340ee4b9 | 1489 | clear_c0_mvpcontrol(MVPCONTROL_VPC); |
e01402b1 | 1490 | |
07cc0c9e RB |
1491 | evpe(vpflags); |
1492 | emt(mtflags); | |
1493 | local_irq_restore(flags); | |
1494 | ||
2600990e RB |
1495 | #ifdef CONFIG_MIPS_APSP_KSPD |
1496 | kspd_events.kspd_sp_exit = kspd_sp_exit; | |
1497 | #endif | |
e01402b1 | 1498 | return 0; |
27a3bbaf RB |
1499 | |
1500 | out_chrdev: | |
1501 | unregister_chrdev(major, module_name); | |
1502 | ||
07cc0c9e | 1503 | out: |
27a3bbaf | 1504 | return err; |
e01402b1 RB |
1505 | } |
1506 | ||
1507 | static void __exit vpe_module_exit(void) | |
1508 | { | |
1509 | struct vpe *v, *n; | |
1510 | ||
1511 | list_for_each_entry_safe(v, n, &vpecontrol.vpe_list, list) { | |
1512 | if (v->state != VPE_STATE_UNUSED) { | |
1513 | release_vpe(v); | |
1514 | } | |
1515 | } | |
1516 | ||
27a3bbaf | 1517 | device_destroy(mt_class, MKDEV(major, minor)); |
e01402b1 RB |
1518 | unregister_chrdev(major, module_name); |
1519 | } | |
1520 | ||
1521 | module_init(vpe_module_init); | |
1522 | module_exit(vpe_module_exit); | |
1523 | MODULE_DESCRIPTION("MIPS VPE Loader"); | |
2600990e | 1524 | MODULE_AUTHOR("Elizabeth Oldham, MIPS Technologies, Inc."); |
e01402b1 | 1525 | MODULE_LICENSE("GPL"); |