diff options
author | Alan Modra <amodra@gmail.com> | 2006-10-25 06:49:21 +0000 |
---|---|---|
committer | Alan Modra <amodra@gmail.com> | 2006-10-25 06:49:21 +0000 |
commit | e9f531299306c33f3e110bd66e7f9daa29845e23 (patch) | |
tree | 7c95ff771856236efdfef25f95099f15c970e518 /ld/emultempl | |
parent | 78de3ccc2a96d619e8a7f9bc1dc41d4b92286120 (diff) | |
download | binutils-gdb-e9f531299306c33f3e110bd66e7f9daa29845e23.tar.gz |
New Cell SPU port.
Diffstat (limited to 'ld/emultempl')
-rw-r--r-- | ld/emultempl/spu_inc.s | 7 | ||||
-rw-r--r-- | ld/emultempl/spu_ovl.S | 275 | ||||
-rw-r--r-- | ld/emultempl/spu_ovl.o | bin | 0 -> 1440 bytes | |||
-rw-r--r-- | ld/emultempl/spuelf.em | 297 |
4 files changed, 579 insertions, 0 deletions
diff --git a/ld/emultempl/spu_inc.s b/ld/emultempl/spu_inc.s new file mode 100644 index 00000000000..243bd1061e9 --- /dev/null +++ b/ld/emultempl/spu_inc.s @@ -0,0 +1,7 @@ + .text + .globl _binary_builtin_ovl_mgr_start + .globl _binary_builtin_ovl_mgr_end + +_binary_builtin_ovl_mgr_start: + .incbin "spu_ovl.o" +_binary_builtin_ovl_mgr_end: diff --git a/ld/emultempl/spu_ovl.S b/ld/emultempl/spu_ovl.S new file mode 100644 index 00000000000..75d0470db50 --- /dev/null +++ b/ld/emultempl/spu_ovl.S @@ -0,0 +1,275 @@ +/* Overlay manager for SPU. + + Copyright 2006 Free Software Foundation, Inc. + + This file is part of GLD, the Gnu Linker. + + GLD is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2, or (at your option) + any later version. + + GLD is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with GLD; see the file COPYING. If not, write to the Free + Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA + 02110-1301, USA. */ + +/** + * MFC DMA defn's. + */ +#define MFC_GET_CMD 0x40 +#define MFC_MAX_DMA_SIZE 0x4000 +#define MFC_TAG_UPDATE_ALL 2 +#define MFC_TAG_ID 0 + + +/** + * Temporary register allocations. + * These are saved/restored here. + */ +#define tab $75 +#define cgbits $75 +#define add64 $75 +#define ealo $75 +#define newmask $75 +#define tagstat $75 +#define bchn $75 +#define rv1 $75 + +#define off $76 +#define off64 $76 +#define maxsize $76 +#define oldmask $76 +#define sz $76 +#define lnkr $76 +#define rv2 $76 + +#define cur $77 +#define cmp $77 +#define buf $77 +#define genwi $77 +#define tagid $77 +#define cmd $77 +#define rv3 $77 + +#define cgshuf $78 + +#define vma $6 + +#define map $7 +#define size $7 +#define cmp2 $7 + +#define ea64 $8 +#define retval $8 + +#ifdef OVLY_IRQ_SAVE +#define irqtmp $8 +#define irq_stat $9 +#endif + + .extern _ovly_table + .extern _ovly_buf_table + + .text + .align 4 +__rv_pattern: + .word 0x00010203, 0x1c1d1e1f, 0x00010203, 0x10111213 +__cg_pattern: + .word 0x04050607, 0x80808080, 0x80808080, 0x80808080 + +/** + * __ovly_return - stub for returning from overlay functions. + * + * inputs: + * $lr link register + * + * outputs: + * $78 old partition number, to be reloaded + * $79 return address in old partion number + */ + .global __ovly_return + .type __ovly_return, @function + + .word 0 +__ovly_return: + shlqbyi $78, $lr, 4 + shlqbyi $79, $lr, 8 + biz $78, $79 + +/** + * __ovly_load - copy an overlay partion to local store. + * + * inputs: + * $78 partition number to be loaded. + * $79 branch target in new partition. + * $lr link register, containing return addr. + * + * outputs: + * $lr new link register, returning through __ovly_return. + * + * Copy a new overlay partition into local store, or return + * immediately if the partition is already resident. + */ + .global __ovly_load + .type __ovly_load, @function + +__ovly_load: +/* Save temporary registers to stack. */ + stqd $6, -16($sp) + stqd $7, -32($sp) + stqd $8, -48($sp) + +#ifdef OVLY_IRQ_SAVE +/* Save irq state, then disable interrupts. */ + stqd $9, -64($sp) + ila irqtmp, __ovly_irq_save + rdch irq_stat, $SPU_RdMachStat + bid irqtmp +__ovly_irq_save: +#endif + +/* Set branch hint to overlay target. */ + hbr __ovly_load_ret, $79 + +/* Get caller's overlay index by back chaining through stack frames. + * Loop until end of stack (back chain all-zeros) or + * encountered a link register we set here. */ + lqd bchn, 0($sp) + ila retval, __ovly_return + +__ovly_backchain_loop: + lqd lnkr, 16(bchn) + lqd bchn, 0(bchn) + ceq cmp, lnkr, retval + ceqi cmp2, bchn, 0 + or cmp, cmp, cmp2 + brz cmp, __ovly_backchain_loop + +/* If we reached the zero back-chain, then lnkr is bogus. Clear the + * part of lnkr that we use later (slot 3). */ + rotqbyi cmp2, cmp2, 4 + andc lnkr, lnkr, cmp2 + +/* Set lr = {__ovly_return, prev ovl ndx, caller return adr, callee ovl ndx}. */ + lqd rv1, (__rv_pattern-__ovly_return+4)(retval) + shufb rv2, retval, lnkr, rv1 + shufb rv3, $lr, $78, rv1 + fsmbi rv1, 0xff + selb $lr, rv2, rv3, rv1 + +/* Branch to $79 if non-overlay */ + brz $78, __ovly_load_restore + +/* Load values from _ovly_table[$78]. + * extern struct { + * u32 vma; + * u32 size; + * u32 file_offset; + * u32 buf; + * } _ovly_table[]; + */ + shli off, $78, 4 + ila tab, _ovly_table - 16 + lqx vma, tab, off + rotqbyi buf, vma, 12 + +/* Load values from _ovly_buf_table[buf]. + * extern struct { + * u32 mapped; + * } _ovly_buf_table[]; + */ + ila tab, _ovly_buf_table + ai off, buf, -1 + shli off, off, 2 + lqx map, tab, off + rotqby cur, map, off + +/* Branch to $79 now if overlay is already mapped. */ + ceq cmp, $78, cur + brnz cmp, __ovly_load_restore + +/* Set _ovly_buf_table[buf].mapped = $78. */ + cwx genwi, tab, off + shufb map, $78, map, genwi + stqx map, tab, off + +/* A new partition needs to be loaded. Prepare for DMA loop. + * _EAR_ is the 64b base EA, filled in at run time by the + * loader, and indicating the value for SPU executable image start. + */ + lqd cgshuf, (__cg_pattern-__ovly_return+4)(retval) + rotqbyi size, vma, 4 + rotqbyi sz, vma, 8 + lqa ea64, _EAR_ + +__ovly_xfer_loop: +/* 64b add to compute next ea64. */ + rotqmbyi off64, sz, -4 + cg cgbits, ea64, off64 + shufb add64, cgbits, cgbits, cgshuf + addx add64, ea64, off64 + ori ea64, add64, 0 + +/* Setup DMA parameters, then issue DMA request. */ + rotqbyi ealo, add64, 4 + ila maxsize, MFC_MAX_DMA_SIZE + cgt cmp, size, maxsize + selb sz, size, maxsize, cmp + ila tagid, MFC_TAG_ID + wrch $MFC_LSA, vma + wrch $MFC_EAH, ea64 + wrch $MFC_EAL, ealo + wrch $MFC_Size, sz + wrch $MFC_TagId, tagid + ila cmd, MFC_GET_CMD + wrch $MFC_Cmd, cmd + +/* Increment vma, decrement size, branch back as needed. */ + a vma, vma, sz + sf size, sz, size + brnz size, __ovly_xfer_loop + +/* Save app's tagmask, wait for DMA complete, restore mask. */ + rdch oldmask, $MFC_RdTagMask +#if MFC_TAG_ID < 16 + ilh newmask, 1 << MFC_TAG_ID +#else + ilhu newmask, 1 << (MFC_TAG_ID - 16) +#endif + wrch $MFC_WrTagMask, newmask + ila tagstat, MFC_TAG_UPDATE_ALL + wrch $MFC_WrTagUpdate, tagstat + rdch tagstat, $MFC_RdTagStat + sync + wrch $MFC_WrTagMask, oldmask + + .global _ovly_debug_event + .type _ovly_debug_event, @function +_ovly_debug_event: +/* GDB inserts debugger trap here. */ + nop + +__ovly_load_restore: +#ifdef OVLY_IRQ_SAVE +/* Conditionally re-enable interrupts. */ + andi irq_stat, irq_stat, 1 + ila irqtmp, __ovly_irq_restore + binze irq_stat, irqtmp +__ovly_irq_restore: + lqd $9, -64($sp) +#endif + +/* Restore saved registers. */ + lqd $8, -48($sp) + lqd $7, -32($sp) + lqd $6, -16($sp) + +__ovly_load_ret: +/* Branch to target address. */ + bi $79 diff --git a/ld/emultempl/spu_ovl.o b/ld/emultempl/spu_ovl.o Binary files differnew file mode 100644 index 00000000000..1d48c00fafa --- /dev/null +++ b/ld/emultempl/spu_ovl.o diff --git a/ld/emultempl/spuelf.em b/ld/emultempl/spuelf.em new file mode 100644 index 00000000000..de6a914a883 --- /dev/null +++ b/ld/emultempl/spuelf.em @@ -0,0 +1,297 @@ +# This shell script emits a C file. -*- C -*- +# Copyright 2006 Free Software Foundation, Inc. +# +# This file is part of GLD, the Gnu Linker. +# +# This program is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2 of the License, or +# (at your option) any later version. +# +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License along +# with this program; if not, write to the Free Software Foundation, Inc., +# 51 Franklin Street - Fifth Floor, Boston, MA 02110-1301, USA. +# + +# This file is sourced from elf32.em, and defines extra spu specific +# features. +# +cat >>e${EMULATION_NAME}.c <<EOF +#include "ldctor.h" +#include "elf32-spu.h" + +/* Non-zero if no overlay processing should be done. */ +static int no_overlays = 0; + +/* Non-zero if we want stubs on all calls out of overlay regions. */ +static int non_overlay_stubs = 0; + +/* Whether to emit symbols for stubs. */ +static int emit_stub_syms = 0; + +/* Range of valid addresses for loadable sections. */ +static bfd_vma local_store_lo = 0; +static bfd_vma local_store_hi = 0x3ffff; + +extern void *_binary_builtin_ovl_mgr_start; +extern void *_binary_builtin_ovl_mgr_end; + +static const struct _ovl_stream ovl_mgr_stream = { + &_binary_builtin_ovl_mgr_start, + &_binary_builtin_ovl_mgr_end +}; + +static asection *toe = NULL; + + +static int +is_spu_target (void) +{ + extern const bfd_target bfd_elf32_spu_vec; + + return link_info.hash->creator == &bfd_elf32_spu_vec; +} + +/* Create our note section. */ + +static void +spu_after_open (void) +{ + if (is_spu_target () + && !link_info.relocatable + && link_info.input_bfds != NULL + && !spu_elf_create_sections (output_bfd, &link_info)) + einfo ("%X%P: can not create note section: %E\n"); + + gld${EMULATION_NAME}_after_open (); +} + +/* Add section S at the end of output section OUTPUT_NAME. + + Really, we should be duplicating ldlang.c map_input_to_output_sections + logic here, ie. using the linker script to find where the section + goes. That's rather a lot of code, and we don't want to run + map_input_to_output_sections again because most sections are already + mapped. So cheat, and put the section in a fixed place, ignoring any + attempt via a linker script to put .stub, .ovtab, and built-in + overlay manager code somewhere else. */ + +static void +spu_place_special_section (asection *s, const char *output_name) +{ + lang_output_section_statement_type *os; + + os = lang_output_section_find (output_name); + if (os == NULL) + { + const char *save = s->name; + s->name = output_name; + gld${EMULATION_NAME}_place_orphan (s); + s->name = save; + } + else + lang_add_section (&os->children, s, os); + + s->output_section->size += s->size; +} + +/* Load built-in overlay manager, and tweak overlay section alignment. */ + +static void +spu_elf_load_ovl_mgr (void) +{ + lang_output_section_statement_type *os; + struct elf_link_hash_entry *h; + + h = elf_link_hash_lookup (elf_hash_table (&link_info), + "__ovly_load", FALSE, FALSE, FALSE); + + if (h != NULL + && (h->root.type == bfd_link_hash_defined + || h->root.type == bfd_link_hash_defweak) + && h->def_regular) + { + /* User supplied __ovly_load. */ + } + else + { + lang_input_statement_type *ovl_is; + + ovl_is = lang_add_input_file ("builtin ovl_mgr", + lang_input_file_is_file_enum, + NULL); + + if (!spu_elf_open_builtin_lib (&ovl_is->the_bfd, &ovl_mgr_stream)) + einfo ("%X%P: can not open built-in overlay manager: %E\n"); + else + { + asection *in; + + if (!load_symbols (ovl_is, NULL)) + einfo ("%X%P: can not load built-in overlay manager: %E\n"); + + /* Map overlay manager sections to output sections. */ + for (in = ovl_is->the_bfd->sections; in != NULL; in = in->next) + if ((in->flags & (SEC_ALLOC | SEC_LOAD)) + == (SEC_ALLOC | SEC_LOAD)) + spu_place_special_section (in, ".text"); + } + } + + /* Ensure alignment of overlay sections is sufficient. */ + for (os = &lang_output_section_statement.head->output_section_statement; + os != NULL; + os = os->next) + if (os->bfd_section != NULL + && spu_elf_section_data (os->bfd_section) != NULL + && spu_elf_section_data (os->bfd_section)->ovl_index != 0) + { + if (os->bfd_section->alignment_power < 4) + os->bfd_section->alignment_power = 4; + + /* Also ensure size rounds up. */ + os->block_value = 16; + } +} + +/* Go find if we need to do anything special for overlays. */ + +static void +spu_before_allocation (void) +{ + if (is_spu_target () + && !link_info.relocatable + && !no_overlays) + { + /* Size the sections. This is premature, but we need to know the + rough layout so that overlays can be found. */ + expld.phase = lang_mark_phase_enum; + expld.dataseg.phase = exp_dataseg_none; + one_lang_size_sections_pass (NULL, TRUE); + + /* Find overlays by inspecting section vmas. */ + if (spu_elf_find_overlays (output_bfd, &link_info)) + { + asection *stub, *ovtab; + + if (!spu_elf_size_stubs (output_bfd, &link_info, non_overlay_stubs, + &stub, &ovtab, &toe)) + einfo ("%X%P: can not size overlay stubs: %E\n"); + + if (stub != NULL) + { + spu_place_special_section (stub, ".text"); + spu_place_special_section (ovtab, ".data"); + spu_place_special_section (toe, ".toe"); + + spu_elf_load_ovl_mgr (); + } + } + + /* We must not cache anything from the preliminary sizing. */ + lang_reset_memory_regions (); + } + + gld${EMULATION_NAME}_before_allocation (); +} + +/* Final emulation specific call. */ + +static void +gld${EMULATION_NAME}_finish (void) +{ + int need_laying_out; + + need_laying_out = bfd_elf_discard_info (output_bfd, &link_info); + + gld${EMULATION_NAME}_map_segments (need_laying_out); + + if (is_spu_target () && local_store_lo < local_store_hi) + { + asection *s; + + s = spu_elf_check_vma (output_bfd, local_store_lo, local_store_hi); + if (s != NULL) + einfo ("%X%P: %A exceeds local store range\n", s); + } + + if (toe != NULL + && !spu_elf_build_stubs (&link_info, + emit_stub_syms || link_info.emitrelocations, + toe)) + einfo ("%X%P: can not build overlay stubs: %E\n"); + + finish_default (); +} + +EOF + +# Define some shell vars to insert bits of code into the standard elf +# parse_args and list_options functions. +# +PARSE_AND_LIST_PROLOGUE=' +#define OPTION_SPU_PLUGIN 301 +#define OPTION_SPU_NO_OVERLAYS (OPTION_SPU_PLUGIN + 1) +#define OPTION_SPU_STUB_SYMS (OPTION_SPU_NO_OVERLAYS + 1) +#define OPTION_SPU_NON_OVERLAY_STUBS (OPTION_SPU_STUB_SYMS + 1) +#define OPTION_SPU_LOCAL_STORE (OPTION_SPU_NON_OVERLAY_STUBS + 1) +' + +PARSE_AND_LIST_LONGOPTS=' + { "plugin", no_argument, NULL, OPTION_SPU_PLUGIN }, + { "no-overlays", no_argument, NULL, OPTION_SPU_NO_OVERLAYS }, + { "emit-stub-syms", no_argument, NULL, OPTION_SPU_STUB_SYMS }, + { "extra-overlay-stubs", no_argument, NULL, OPTION_SPU_NON_OVERLAY_STUBS }, + { "local-store", required_argument, NULL, OPTION_SPU_LOCAL_STORE }, +' + +PARSE_AND_LIST_OPTIONS=' + fprintf (file, _("\ + --plugin Make SPU plugin.\n\ + --no-overlays No overlay handling.\n\ + --emit-stub-syms Add symbols on overlay call stubs.\n\ + --extra-overlay-stubs Add stubs on all calls out of overlay regions.\n\ + --local-store=lo:hi Valid address range.\n" + )); +' + +PARSE_AND_LIST_ARGS_CASES=' + case OPTION_SPU_PLUGIN: + spu_elf_plugin (1); + break; + + case OPTION_SPU_NO_OVERLAYS: + no_overlays = 1; + break; + + case OPTION_SPU_STUB_SYMS: + emit_stub_syms = 1; + break; + + case OPTION_SPU_NON_OVERLAY_STUBS: + non_overlay_stubs = 1; + break; + + case OPTION_SPU_LOCAL_STORE: + { + char *end; + local_store_lo = strtoul (optarg, &end, 0); + if (*end == '\'':'\'') + { + local_store_hi = strtoul (end + 1, &end, 0); + if (*end == 0) + break; + } + einfo (_("%P%F: invalid --local-store address range `%s'\''\n"), optarg); + } + break; +' + +LDEMUL_AFTER_OPEN=spu_after_open +LDEMUL_BEFORE_ALLOCATION=spu_before_allocation +LDEMUL_FINISH=gld${EMULATION_NAME}_finish |