summaryrefslogtreecommitdiff
path: root/gcc/config/pa
diff options
context:
space:
mode:
authordanglin <danglin@138bc75d-0d04-0410-961f-82ee72b054a4>2016-06-26 18:09:01 +0000
committerdanglin <danglin@138bc75d-0d04-0410-961f-82ee72b054a4>2016-06-26 18:09:01 +0000
commita1e99c57a0a1ff043c71d7354f484b2f2d6e7c2e (patch)
treef5ada84ba9de1dc2c58d40fd9c2a468a77596d73 /gcc/config/pa
parent0aa73965c1736eeb5a632a021959bab255d417b6 (diff)
downloadgcc-a1e99c57a0a1ff043c71d7354f484b2f2d6e7c2e.tar.gz
* config/pa/pa.c (pa_output_indirect_call): Rework to combine
output_asm_insn calls and shorten long lines. Output .CALL argument descriptor using pa_output_arg_descriptor. Add various inline $$dyncall and other optimizations. (pa_attr_length_indirect_call): Adjust ordering and lengths. git-svn-id: svn+ssh://gcc.gnu.org/svn/gcc/trunk@237790 138bc75d-0d04-0410-961f-82ee72b054a4
Diffstat (limited to 'gcc/config/pa')
-rw-r--r--gcc/config/pa/pa.c122
1 files changed, 99 insertions, 23 deletions
diff --git a/gcc/config/pa/pa.c b/gcc/config/pa/pa.c
index 8ce6b57341e..1047f3d61eb 100644
--- a/gcc/config/pa/pa.c
+++ b/gcc/config/pa/pa.c
@@ -8111,72 +8111,148 @@ pa_attr_length_indirect_call (rtx_insn *insn)
if (TARGET_64BIT)
return 12;
- if (TARGET_FAST_INDIRECT_CALLS
- || (!TARGET_LONG_CALLS
- && !TARGET_PORTABLE_RUNTIME
- && ((TARGET_PA_20 && !TARGET_SOM && distance < 7600000)
- || distance < MAX_PCREL17F_OFFSET)))
+ if (TARGET_FAST_INDIRECT_CALLS)
return 8;
- if (flag_pic)
- return 20;
-
if (TARGET_PORTABLE_RUNTIME)
return 16;
+ /* Inline version of $$dyncall. */
+ if ((TARGET_NO_SPACE_REGS || TARGET_PA_20) && !optimize_size)
+ return 20;
+
+ if (!TARGET_LONG_CALLS
+ && ((TARGET_PA_20 && !TARGET_SOM && distance < 7600000)
+ || distance < MAX_PCREL17F_OFFSET))
+ return 8;
+
/* Out of reach, can use ble. */
- return 12;
+ if (!flag_pic)
+ return 12;
+
+ /* Inline version of $$dyncall. */
+ if (TARGET_NO_SPACE_REGS || TARGET_PA_20)
+ return 20;
+
+ if (!optimize_size)
+ return 36;
+
+ /* Long PIC pc-relative call. */
+ return 20;
}
const char *
pa_output_indirect_call (rtx_insn *insn, rtx call_dest)
{
rtx xoperands[4];
+ int length;
if (TARGET_64BIT)
{
xoperands[0] = call_dest;
- output_asm_insn ("ldd 16(%0),%%r2", xoperands);
- output_asm_insn ("bve,l (%%r2),%%r2\n\tldd 24(%0),%%r27", xoperands);
+ output_asm_insn ("ldd 16(%0),%%r2\n\t"
+ "bve,l (%%r2),%%r2\n\t"
+ "ldd 24(%0),%%r27", xoperands);
return "";
}
/* First the special case for kernels, level 0 systems, etc. */
if (TARGET_FAST_INDIRECT_CALLS)
- return "ble 0(%%sr4,%%r22)\n\tcopy %%r31,%%r2";
+ {
+ pa_output_arg_descriptor (insn);
+ if (TARGET_PA_20)
+ return "bve,l,n (%%r22),%%r2\n\tnop";
+ return "ble 0(%%sr4,%%r22)\n\tcopy %%r31,%%r2";
+ }
+
+ if (TARGET_PORTABLE_RUNTIME)
+ {
+ output_asm_insn ("ldil L'$$dyncall,%%r31\n\t"
+ "ldo R'$$dyncall(%%r31),%%r31", xoperands);
+ pa_output_arg_descriptor (insn);
+ return "blr %%r0,%%r2\n\tbv,n %%r0(%%r31)";
+ }
+
+ /* Maybe emit a fast inline version of $$dyncall. */
+ if ((TARGET_NO_SPACE_REGS || TARGET_PA_20) && !optimize_size)
+ {
+ output_asm_insn ("bb,>=,n %%r22,30,.+12\n\t"
+ "ldw 2(%%r22),%%r19\n\t"
+ "ldw -2(%%r22),%%r22", xoperands);
+ pa_output_arg_descriptor (insn);
+ if (TARGET_NO_SPACE_REGS)
+ {
+ if (TARGET_PA_20)
+ return "bve,l,n (%%r22),%%r2\n\tnop";
+ return "ble 0(%%sr4,%%r22)\n\tcopy %%r31,%%r2";
+ }
+ return "bve,l (%%r22),%%r2\n\tstw %%r2,-24(%%sp)";
+ }
/* Now the normal case -- we can reach $$dyncall directly or
we're sure that we can get there via a long-branch stub.
No need to check target flags as the length uniquely identifies
the remaining cases. */
- if (pa_attr_length_indirect_call (insn) == 8)
+ length = pa_attr_length_indirect_call (insn);
+ if (length == 8)
{
+ pa_output_arg_descriptor (insn);
+
/* The HP linker sometimes substitutes a BLE for BL/B,L calls to
$$dyncall. Since BLE uses %r31 as the link register, the 22-bit
variant of the B,L instruction can't be used on the SOM target. */
if (TARGET_PA_20 && !TARGET_SOM)
- return ".CALL\tARGW0=GR\n\tb,l $$dyncall,%%r2\n\tcopy %%r2,%%r31";
+ return "b,l,n $$dyncall,%%r2\n\tnop";
else
- return ".CALL\tARGW0=GR\n\tbl $$dyncall,%%r31\n\tcopy %%r31,%%r2";
+ return "bl $$dyncall,%%r31\n\tcopy %%r31,%%r2";
}
/* Long millicode call, but we are not generating PIC or portable runtime
code. */
- if (pa_attr_length_indirect_call (insn) == 12)
- return ".CALL\tARGW0=GR\n\tldil L'$$dyncall,%%r2\n\tble R'$$dyncall(%%sr4,%%r2)\n\tcopy %%r31,%%r2";
-
- /* Long millicode call for portable runtime. */
- if (pa_attr_length_indirect_call (insn) == 16)
- return "ldil L'$$dyncall,%%r31\n\tldo R'$$dyncall(%%r31),%%r31\n\tblr %%r0,%%r2\n\tbv,n %%r0(%%r31)";
+ if (length == 12)
+ {
+ output_asm_insn ("ldil L'$$dyncall,%%r2", xoperands);
+ pa_output_arg_descriptor (insn);
+ return "ble R'$$dyncall(%%sr4,%%r2)\n\tcopy %%r31,%%r2";
+ }
+ /* Maybe emit a fast inline version of $$dyncall. The long PIC
+ pc-relative call sequence is five instructions. The inline PA 2.0
+ version of $$dyncall is also five instructions. The PA 1.X versions
+ are longer but still an overall win. */
+ if (TARGET_NO_SPACE_REGS || TARGET_PA_20 || !optimize_size)
+ {
+ output_asm_insn ("bb,>=,n %%r22,30,.+12\n\t"
+ "ldw 2(%%r22),%%r19\n\t"
+ "ldw -2(%%r22),%%r22", xoperands);
+ if (TARGET_NO_SPACE_REGS)
+ {
+ pa_output_arg_descriptor (insn);
+ if (TARGET_PA_20)
+ return "bve,l,n (%%r22),%%r2\n\tnop";
+ return "ble 0(%%sr4,%%r22)\n\tcopy %%r31,%%r2";
+ }
+ if (TARGET_PA_20)
+ {
+ pa_output_arg_descriptor (insn);
+ return "bve,l (%%r22),%%r2\n\tstw %%r2,-24(%%sp)";
+ }
+ output_asm_insn ("bl .+8,%%r2\n\t"
+ "ldo 16(%%r2),%%r2\n\t"
+ "ldsid (%%r22),%%r1\n\t"
+ "mtsp %%r1,%%sr0", xoperands);
+ pa_output_arg_descriptor (insn);
+ return "be 0(%%sr0,%%r22)\n\tstw %%r2,-24(%%sp)";
+ }
+
/* We need a long PIC call to $$dyncall. */
xoperands[0] = gen_rtx_SYMBOL_REF (Pmode, "$$dyncall");
xoperands[1] = gen_rtx_REG (Pmode, 2);
xoperands[2] = gen_rtx_REG (Pmode, 1);
pa_output_pic_pcrel_sequence (xoperands);
- output_asm_insn ("bv %%r0(%%r1)", xoperands);
- return "ldo {12|20}(%%r2),%%r2";
+ pa_output_arg_descriptor (insn);
+ return "bv %%r0(%%r1)\n\tldo {12|20}(%%r2),%%r2";
}
/* In HPUX 8.0's shared library scheme, special relocations are needed