From a6f12d7c1db7321252ff53f79229d0598ae0df4b Mon Sep 17 00:00:00 2001
From: Richard Kenner <kenner@gcc.gnu.org>
Date: Mon, 26 Oct 1992 16:01:33 -0500
Subject: [PATCH] Initial revision

From-SVN: r2615
---
 gcc/config/alpha/alpha.c | 1521 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 1521 insertions(+)
 create mode 100644 gcc/config/alpha/alpha.c

diff --git a/gcc/config/alpha/alpha.c b/gcc/config/alpha/alpha.c
new file mode 100644
index 00000000000..4ec88cc581b
--- /dev/null
+++ b/gcc/config/alpha/alpha.c
@@ -0,0 +1,1521 @@
+/* Subroutines used for code generation on the DEC Alpha.
+   Copyright (C) 1992 Free Software Foundation, Inc.
+   Contributed by Richard Kenner (kenner@nyu.edu)
+
+This file is part of GNU CC.
+
+GNU CC is free software; you can redistribute it and/or modify
+it under the terms of the GNU General Public License as published by
+the Free Software Foundation; either version 2, or (at your option)
+any later version.
+
+GNU CC is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with GNU CC; see the file COPYING.  If not, write to
+the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.  */
+
+
+#include <stdio.h>
+#include "config.h"
+#include "rtl.h"
+#include "regs.h"
+#include "hard-reg-set.h"
+#include "real.h"
+#include "insn-config.h"
+#include "conditions.h"
+#include "insn-flags.h"
+#include "output.h"
+#include "insn-attr.h"
+#include "flags.h"
+#include "recog.h"
+#include "reload.h"
+#include "expr.h"
+#include "obstack.h"
+#include "tree.h"
+
+/* Save information from a "cmpxx" operation until the branch or scc is
+   emitted.  */
+
+rtx alpha_compare_op0, alpha_compare_op1;
+int alpha_compare_fp_p;
+
+/* Save the name of the current function as used by the assembler.  This
+   is used by the epilogue.  */
+
+char *alpha_function_name;
+
+/* Nonzero if the current function needs gp.  */
+
+int alpha_function_needs_gp;
+
+/* Returns 1 if VALUE is a mask that contains full bytes of zero or ones.  */
+
+int
+zap_mask (value)
+     HOST_WIDE_INT value;
+{
+  int i;
+
+  for (i = 0; i < HOST_BITS_PER_WIDE_INT / HOST_BITS_PER_CHAR;
+       i++, value >>= 8)
+    if ((value & 0xff) != 0 && (value & 0xff) != 0xff)
+      return 0;
+
+  return 1;
+}
+
+/* Returns 1 if OP is either the constant zero or a register.  If a
+   register, it must be in the proper mode unless MODE is VOIDmode.  */
+
+int
+reg_or_0_operand (op, mode)
+      register rtx op;
+      enum machine_mode mode;
+{
+  return op == const0_rtx || register_operand (op, mode);
+}
+
+/* Return 1 if OP is an 8-bit constant or any register.  */
+
+int
+reg_or_8bit_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return ((GET_CODE (op) == CONST_INT
+	   && (unsigned HOST_WIDE_INT) INTVAL (op) < 0x100)
+	  || register_operand (op, mode));
+}
+
+/* Return 1 if the operand is a valid second operand to an add insn.  */
+
+int
+add_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  if (GET_CODE (op) == CONST_INT)
+    return ((unsigned HOST_WIDE_INT) (INTVAL (op) + 0x8000) < 0x10000
+	    || ((INTVAL (op) & 0xffff) == 0
+		&& (INTVAL (op) >> 31 == -1
+		    || INTVAL (op) >> 31 == 0)));
+
+  return register_operand (op, mode);
+}
+
+/* Return 1 if the operand is a valid second operand to a sign-extending
+   add insn.  */
+
+int
+sext_add_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  if (GET_CODE (op) == CONST_INT)
+    return ((unsigned HOST_WIDE_INT) INTVAL (op) < 255
+	    || (unsigned HOST_WIDE_INT) (- INTVAL (op)) < 255);
+
+  return register_operand (op, mode);
+}
+
+/* Return 1 if OP is the constant 4 or 8.  */
+
+int
+const48_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return (GET_CODE (op) == CONST_INT
+	  && (INTVAL (op) == 4 || INTVAL (op) == 8));
+}
+
+/* Return 1 if OP is a valid first operand to an AND insn.  */
+
+int
+and_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  if (GET_CODE (op) == CONST_DOUBLE && GET_MODE (op) == VOIDmode)
+    return (zap_mask (CONST_DOUBLE_LOW (op))
+	    && zap_mask (CONST_DOUBLE_HIGH (op)));
+
+  if (GET_CODE (op) == CONST_INT)
+    return ((unsigned HOST_WIDE_INT) INTVAL (op) < 0x100
+	    || (unsigned HOST_WIDE_INT) ~ INTVAL (op) < 0x100
+	    || zap_mask (INTVAL (op)));
+
+  return register_operand (op, mode);
+}
+
+/* Return 1 if OP is a constant that is the width, in bits, of an integral
+   mode smaller than DImode.  */
+
+int
+mode_width_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return (GET_CODE (op) == CONST_INT
+	  && (INTVAL (op) == 8 || INTVAL (op) == 16 || INTVAL (op) == 32));
+}
+
+/* Return 1 if OP is a constant that is the width of an integral machine mode
+   smaller than an integer.  */
+
+int
+mode_mask_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+#if HOST_BITS_PER_WIDE_INT == 32
+  if (GET_CODE (op) == CONST_DOUBLE)
+    return CONST_DOUBLE_HIGH (op) == 0 && CONST_DOUBLE_LOW (op) == -1;
+#endif
+
+  if (GET_CODE (op) == CONST_INT)
+    return (INTVAL (op) == 0xff
+	    || INTVAL (op) == 0xffff
+#if HOST_BITS_PER_WIDE_INT == 64
+	    || INTVAL (op) == 0xffffffff
+#endif
+	    );
+}
+
+/* Return 1 if OP is a multiple of 8 less than 64.  */
+
+int
+mul8_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return (GET_CODE (op) == CONST_INT
+	  && (unsigned HOST_WIDE_INT) INTVAL (op) < 64
+	  && (INTVAL (op) & 7) == 0);
+}
+
+/* Return 1 if OP is the constant zero in floating-point.  */
+
+int
+fp0_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return (GET_MODE (op) == mode
+	  && GET_MODE_CLASS (mode) == MODE_FLOAT && op == CONST0_RTX (mode));
+}
+
+/* Return 1 if OP is the floating-point constant zero or a register.  */
+
+int
+reg_or_fp0_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return fp0_operand (op, mode) || register_operand (op, mode);
+}
+
+/* Return 1 if OP is a register or a constant integer.  */
+
+
+int
+reg_or_cint_operand (op, mode)
+    register rtx op;
+    enum machine_mode mode;
+{
+     return GET_CODE (op) == CONST_INT || register_operand (op, mode);
+}
+
+/* Return 1 if OP is a valid operand for the source of a move insn.  */
+
+int
+input_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  if (mode != VOIDmode && GET_MODE (op) != VOIDmode && mode != GET_MODE (op))
+    return 0;
+
+  if (GET_MODE_CLASS (mode) == MODE_FLOAT && GET_MODE (op) != mode)
+    return 0;
+
+  switch (GET_CODE (op))
+    {
+    case LABEL_REF:
+    case SYMBOL_REF:
+    case CONST:
+      return mode == DImode;
+
+    case REG:
+      return 1;
+
+    case SUBREG:
+      if (register_operand (op, mode))
+	return 1;
+      /* ... fall through ... */
+    case MEM:
+      return mode != HImode && mode != QImode && general_operand (op, mode);
+
+    case CONST_DOUBLE:
+      return GET_MODE_CLASS (mode) == MODE_FLOAT && op == CONST0_RTX (mode);
+
+    case CONST_INT:
+      return mode == QImode || mode == HImode || add_operand (op, mode);
+    }
+
+  return 0;
+}
+
+/* Return 1 if OP is a SYMBOL_REF for the current function.  */
+
+int
+current_function_operand (op, mode)
+     rtx op;
+     enum machine_mode mode;
+{
+  return (GET_CODE (op) == SYMBOL_REF
+	  && ! strcmp (XSTR (op, 0), current_function_name));
+}
+
+/* Return 1 if OP is a valid Alpha comparison operator.  Here we know which
+   comparisons are valid in which insn.  */
+
+int
+alpha_comparison_operator (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  enum rtx_code code = GET_CODE (op);
+
+  if (mode != GET_MODE (op) || GET_RTX_CLASS (code) != '<')
+    return 0;
+
+  return (code == EQ || code == LE || code == LT
+	  || (mode == DImode && (code == LEU || code == LTU)));
+}
+
+/* Return 1 if OP is a signed comparison operation.  */
+
+int
+signed_comparison_operator (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  switch (GET_CODE (op))
+    {
+    case EQ:  case NE:  case LE:  case LT:  case GE:   case GT:
+      return 1;
+    }
+
+  return 0;
+}
+
+/* Return 1 if this is a divide or modulus operator.  */
+
+int
+divmod_operator (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  switch (GET_CODE (op))
+    {
+    case DIV:  case MOD:  case UDIV:  case UMOD:
+      return 1;
+    }
+
+  return 0;
+}
+
+/* Return 1 if this memory address is a known aligned register plus
+   a constant.  It must be a valid address.  This means that we can do
+   this as an aligned reference plus some offset.
+
+   Take into account what reload will do.
+
+   We could say that out-of-range stack slots are alignable, but that would
+   complicate get_aligned_mem and it isn't worth the trouble since few
+   functions have large stack space.  */
+
+int
+aligned_memory_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  if (GET_CODE (op) == SUBREG)
+    {
+      if (GET_MODE (op) != mode)
+	return 0;
+      op = SUBREG_REG (op);
+      mode = GET_MODE (op);
+    }
+
+  if (reload_in_progress && GET_CODE (op) == REG
+      && REGNO (op) >= FIRST_PSEUDO_REGISTER)
+    op = reg_equiv_mem[REGNO (op)];
+
+  if (GET_CODE (op) != MEM || GET_MODE (op) != mode
+      || ! memory_address_p (mode, XEXP (op, 0)))
+    return 0;
+
+  op = XEXP (op, 0);
+
+  if (GET_CODE (op) == PLUS)
+    op = XEXP (op, 0);
+
+  return (GET_CODE (op) == REG
+	  && (REGNO (op) == STACK_POINTER_REGNUM || op == frame_pointer_rtx
+	      || (REGNO (op) >= FIRST_VIRTUAL_REGISTER
+		  && REGNO (op) <= LAST_VIRTUAL_REGISTER)));
+}
+
+/* Similar, but return 1 if OP is a MEM which is not alignable.  */
+
+int
+unaligned_memory_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  if (GET_CODE (op) == SUBREG)
+    {
+      if (GET_MODE (op) != mode)
+	return 0;
+      op = SUBREG_REG (op);
+      mode = GET_MODE (op);
+    }
+
+  if (reload_in_progress && GET_CODE (op) == REG
+      && REGNO (op) >= FIRST_PSEUDO_REGISTER)
+    op = reg_equiv_mem[REGNO (op)];
+
+  if (GET_CODE (op) != MEM || GET_MODE (op) != mode)
+    return 0;
+
+  op = XEXP (op, 0);
+
+  if (! memory_address_p (mode, op))
+    return 1;
+
+  if (GET_CODE (op) == PLUS)
+    op = XEXP (op, 0);
+
+  return (GET_CODE (op) != REG
+	  || (REGNO (op) != STACK_POINTER_REGNUM && op != frame_pointer_rtx
+	      && (REGNO (op) < FIRST_VIRTUAL_REGISTER
+		  || REGNO (op) > LAST_VIRTUAL_REGISTER)));
+}
+
+/* Return 1 if OP is any memory location.  During reload a pseudo matches.  */
+
+int
+any_memory_operand (op, mode)
+     register rtx op;
+     enum machine_mode mode;
+{
+  return (GET_CODE (op) == MEM
+	  || (GET_CODE (op) == SUBREG && GET_CODE (SUBREG_REG (op)) == REG)
+	  || (reload_in_progress && GET_CODE (op) == REG
+	      && REGNO (op) >= FIRST_PSEUDO_REGISTER)
+	  || (reload_in_progress && GET_CODE (op) == SUBREG
+	      && GET_CODE (SUBREG_REG (op)) == REG
+	      && REGNO (SUBREG_REG (op)) >= FIRST_PSEUDO_REGISTER));
+}
+
+/* REF is an alignable memory location.  Place an aligned SImode
+   reference into *PALIGNED_MEM and the number of bits to shift into
+   *PBITNUM.  */
+
+void
+get_aligned_mem (ref, paligned_mem, pbitnum)
+     rtx ref;
+     rtx *paligned_mem, *pbitnum;
+{
+  rtx base;
+  HOST_WIDE_INT offset = 0;
+
+  if (GET_CODE (ref) == SUBREG)
+    {
+      offset = SUBREG_WORD (ref) * UNITS_PER_WORD;
+      if (BYTES_BIG_ENDIAN)
+	offset -= (MIN (UNITS_PER_WORD, GET_MODE_SIZE (GET_MODE (ref)))
+		   - MIN (UNITS_PER_WORD,
+			  GET_MODE_SIZE (GET_MODE (SUBREG_REG (ref)))));
+      ref = SUBREG_REG (ref);
+    }
+
+  if (GET_CODE (ref) == REG)
+    ref = reg_equiv_mem[REGNO (ref)];
+
+  if (reload_in_progress)
+    base = find_replacement (&XEXP (ref, 0));
+  else
+    base = XEXP (ref, 0);
+
+  if (GET_CODE (base) == PLUS)
+    offset += INTVAL (XEXP (base, 1)), base = XEXP (base, 0);
+
+  *paligned_mem = gen_rtx (MEM, SImode,
+			   plus_constant (base, offset & ~3));
+  MEM_IN_STRUCT_P (*paligned_mem) = MEM_IN_STRUCT_P (ref);
+  MEM_VOLATILE_P (*paligned_mem) = MEM_VOLATILE_P (ref);
+  RTX_UNCHANGING_P (*paligned_mem) = RTX_UNCHANGING_P (ref);
+
+  *pbitnum = GEN_INT ((offset & 3) * 8);
+}
+
+/* Similar, but just get the address.  Handle the two reload cases.  */
+
+rtx
+get_unaligned_address (ref)
+     rtx ref;
+{
+  rtx base;
+  HOST_WIDE_INT offset = 0;
+
+  if (GET_CODE (ref) == SUBREG)
+    {
+      offset = SUBREG_WORD (ref) * UNITS_PER_WORD;
+      if (BYTES_BIG_ENDIAN)
+	offset -= (MIN (UNITS_PER_WORD, GET_MODE_SIZE (GET_MODE (ref)))
+		   - MIN (UNITS_PER_WORD,
+			  GET_MODE_SIZE (GET_MODE (SUBREG_REG (ref)))));
+      ref = SUBREG_REG (ref);
+    }
+
+  if (GET_CODE (ref) == REG)
+    ref = reg_equiv_mem[REGNO (ref)];
+
+  if (reload_in_progress)
+    base = find_replacement (&XEXP (ref, 0));
+  else
+    base = XEXP (ref, 0);
+
+  if (GET_CODE (base) == PLUS)
+    offset += INTVAL (XEXP (base, 1)), base = XEXP (base, 0);
+
+  return plus_constant (base, offset);
+}
+
+/* Subfunction of the following function.  Update the flags of any MEM
+   found in part of X.  */
+
+static void
+alpha_set_memflags_1 (x, in_struct_p, volatile_p, unchanging_p)
+     rtx x;
+     int in_struct_p, volatile_p, unchanging_p;
+{
+  int i;
+
+  switch (GET_CODE (x))
+    {
+    case SEQUENCE:
+    case PARALLEL:
+      for (i = XVECLEN (x, 0) - 1; i >= 0; i--)
+	alpha_set_memflags_1 (XVECEXP (x, 0, i), in_struct_p, volatile_p,
+			      unchanging_p);
+      break;
+
+    case INSN:
+      alpha_set_memflags_1 (PATTERN (x), in_struct_p, volatile_p,
+			    unchanging_p);
+      break;
+
+    case SET:
+      alpha_set_memflags_1 (SET_DEST (x), in_struct_p, volatile_p,
+			    unchanging_p);
+      alpha_set_memflags_1 (SET_SRC (x), in_struct_p, volatile_p,
+			    unchanging_p);
+      break;
+
+    case MEM:
+      MEM_IN_STRUCT_P (x) = in_struct_p;
+      MEM_VOLATILE_P (x) = volatile_p;
+      RTX_UNCHANGING_P (x) = unchanging_p;
+      break;
+    }
+}
+
+/* Given INSN, which is either an INSN or a SEQUENCE generated to
+   perform a memory operation, look for any MEMs in either a SET_DEST or
+   a SET_SRC and copy the in-struct, unchanging, and volatile flags from
+   REF into each of the MEMs found.  If REF is not a MEM, don't do
+   anything.  */
+
+void
+alpha_set_memflags (insn, ref)
+     rtx insn;
+     rtx ref;
+{
+  /* Note that it is always safe to get these flags, though they won't
+     be what we think if REF is not a MEM.  */
+  int in_struct_p = MEM_IN_STRUCT_P (ref);
+  int volatile_p = MEM_VOLATILE_P (ref);
+  int unchanging_p = RTX_UNCHANGING_P (ref);
+
+  if (GET_CODE (ref) != MEM
+      || (! in_struct_p && ! volatile_p && ! unchanging_p))
+    return;
+
+  alpha_set_memflags_1 (insn, in_struct_p, volatile_p, unchanging_p);
+}
+
+/* Try to output insns to set TARGET equal to the constant C if it can be
+   done in less than N insns.  Returns 1 if it can be done and the
+   insns have been emitted.  If it would take more than N insns, zero is
+   returned and no insns and emitted.  */
+
+int
+alpha_emit_set_const (target, c, n)
+     rtx target;
+     HOST_WIDE_INT c;
+     int n;
+{
+  HOST_WIDE_INT new = c;
+  int i, bits;
+
+#if HOST_BITS_PER_WIDE_INT == 64
+  /* We are only called for SImode and DImode.  If this is SImode, ensure that
+     we are sign extended to a full word.  This does not make any sense when
+     cross-compiling on a narrow machine.  */
+
+  if (GET_MODE (target) == SImode)
+    c = (c & 0xffffffff) - 2 * (c & 0x80000000);
+#endif
+
+  /* If this is a sign-extended 32-bit constant, we can do this in at most
+     three insns, so do it if we have enough insns left.  We always have
+     a sign-extended 32-bit constant when compiling on a narrow machine.  */
+
+  if (HOST_BITS_PER_WIDE_INT != 64
+      || c >> 31 == -1 || c >> 31 == 0)
+    {
+      HOST_WIDE_INT low = (c & 0xffff) - 2 * (c & 0x8000);
+      HOST_WIDE_INT tmp1 = c - low;
+      HOST_WIDE_INT high
+	= ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+      HOST_WIDE_INT tmp2 = c - (high << 16) - low;
+      HOST_WIDE_INT extra = 0;
+
+      if (tmp2)
+	{
+	  extra = 0x4000;
+	  tmp1 -= 0x40000000;
+	  high = ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+	}
+
+      if (c == low || (low == 0 && extra == 0))
+	{
+	  emit_move_insn (target, GEN_INT (c));
+	  return 1;
+	}
+      else if (n >= 2 + (extra != 0))
+	{
+	  emit_move_insn (target, GEN_INT (low));
+	  if (extra != 0)
+	    emit_insn (gen_add2_insn (target, GEN_INT (extra << 16)));
+
+	  emit_insn (gen_add2_insn (target, GEN_INT (high << 16)));
+	  return 1;
+	}
+    }
+
+  /* If we couldn't do it that way, try some other methods (that depend on
+     being able to compute in the target's word size).  But if we have no
+     instructions left, don't bother.  Also, don't even try if this is 
+     SImode (in which case we should have already done something, but
+     do a sanity check here).  */
+
+  if (n == 1 || HOST_BITS_PER_WIDE_INT < 64 || GET_MODE (target) != DImode)
+    return 0;
+
+  /* First, see if can load a value into the target that is the same as the
+     constant except that all bytes that are 0 are changed to be 0xff.  If we
+     can, then we can do a ZAPNOT to obtain the desired constant.  */
+
+  for (i = 0; i < 64; i += 8)
+    if ((new & ((HOST_WIDE_INT) 0xff << i)) == 0)
+      new |= (HOST_WIDE_INT) 0xff << i;
+
+  if (alpha_emit_set_const (target, new, n - 1))
+    {
+      emit_insn (gen_anddi3 (target, target, GEN_INT (c | ~ new)));
+      return 1;
+    }
+
+  /* Find, see if we can load a related constant and then shift and possibly
+     negate it to get the constant we want.  Try this once each increasing
+     numbers of insns.  */
+
+  for (i = 1; i < n; i++)
+    {
+      /* First try complementing.  */
+      if (alpha_emit_set_const (target, ~ c, i))
+	{
+	  emit_insn (gen_one_cmpldi2 (target, target));
+	  return 1;
+	}
+
+      /* First try to form a constant and do a left shift.  We can do this
+	 if some low-order bits are zero; the exact_log2 call below tells
+	 us that information.  The bits we are shifting out could be any
+	 value, but here we'll just try the 0- and sign-extended forms of
+	 the constant.  To try to increase the chance of having the same
+	 constant in more than one insn, start at the highest number of
+	 bits to shift, but try all possibilities in case a ZAPNOT will
+	 be useful.  */
+
+      if ((bits = exact_log2 (c & - c)) > 0)
+	for (; bits > 0; bits--)
+	  if (alpha_emit_set_const (target, c >> bits, i)
+	      || alpha_emit_set_const (target,
+				       ((unsigned HOST_WIDE_INT) c) >> bits,
+				       i))
+	    {
+	      emit_insn (gen_ashldi3 (target, target, GEN_INT (bits)));
+	      return 1;
+	    }
+
+      /* Now try high-order zero bits.  Here we try the shifted-in bits as
+	 all zero and all ones.  */
+
+      if ((bits = HOST_BITS_PER_WIDE_INT - floor_log2 (c) - 1) > 0)
+	for (; bits > 0; bits--)
+	  if (alpha_emit_set_const (target, c << bits, i)
+	      || alpha_emit_set_const (target,
+				       ((c << bits)
+					| (((HOST_WIDE_INT) 1 << bits) - 1)),
+				       i))
+	    {
+	      emit_insn (gen_lshrdi3 (target, target, GEN_INT (bits)));
+	      return 1;
+	    }
+
+      /* Now try high-order 1 bits.  We get that with a sign-extension.
+	 But one bit isn't enough here.  */
+      
+      if ((bits = HOST_BITS_PER_WIDE_INT - floor_log2 (~ c) - 2) > 0)
+	for (; bits > 0; bits--)
+	  if (alpha_emit_set_const (target, c << bits, i)
+	      || alpha_emit_set_const (target,
+				       ((c << bits)
+					| (((HOST_WIDE_INT) 1 << bits) - 1)),
+				       i))
+	    {
+	      emit_insn (gen_ashrdi3 (target, target, GEN_INT (bits)));
+	      return 1;
+	    }
+    }
+
+  return 0;
+}
+
+/* Adjust the cost of a scheduling dependency.  Return the new cost of
+   a dependency LINK or INSN on DEP_INSN.  COST is the current cost.  */
+
+int
+alpha_adjust_cost (insn, link, dep_insn, cost)
+     rtx insn;
+     rtx link;
+     rtx dep_insn;
+     int cost;
+{
+  rtx set;
+
+  /* If the dependence is an anti-dependence, there is no cost.  For an
+     output dependence, there is sometimes a cost, but it doesn't seem
+     worth handling those few cases.  */
+
+  if (REG_NOTE_KIND (link) != 0)
+    return 0;
+
+  /* If INSN is a store insn and DEP_INSN is setting the data being stored,
+     we can sometimes lower the cost.  */
+
+  if (recog_memoized (insn) >= 0 && get_attr_type (insn) == TYPE_ST
+      && (set = single_set (dep_insn)) != 0
+      && GET_CODE (PATTERN (insn)) == SET
+      && rtx_equal_p (SET_DEST (set), SET_SRC (PATTERN (insn))))
+    switch (get_attr_type (dep_insn))
+      {
+      case TYPE_LD:
+	/* No savings here.  */
+	return cost;
+
+      case TYPE_IMULL:
+      case TYPE_IMULQ:
+	/* In these cases, we save one cycle.  */
+	return cost - 2;
+
+      default:
+	/* In all other cases, we save two cycles.  */
+	return MAX (0, cost - 4);
+      }
+
+  /* Another case that needs adjustment is an arithmetic or logical
+     operation.  It's cost is usually one cycle, but we default it to
+     two in the MD file.  The only case that it is actually two is
+     for the address in loads and stores.  */
+
+  if (recog_memoized (dep_insn) >= 0
+      && get_attr_type (dep_insn) == TYPE_IADDLOG)
+    switch (get_attr_type (insn))
+      {
+      case TYPE_LD:
+      case TYPE_ST:
+	return cost;
+
+      default:
+	return 2;
+      }
+
+  /* The final case is when a compare feeds into an integer branch.  The cost
+     is only one cycle in that case.  */
+
+  if (recog_memoized (dep_insn) >= 0
+      && get_attr_type (dep_insn) == TYPE_ICMP
+      && recog_memoized (insn) >= 0
+      && get_attr_type (insn) == TYPE_IBR)
+    return 2;
+
+  /* Otherwise, return the default cost. */
+
+  return cost;
+}
+
+/* Print an operand.  Recognize special options, documented below.  */
+
+void
+print_operand (file, x, code)
+    FILE *file;
+    rtx x;
+    char code;
+{
+  int i;
+
+  switch (code)
+    {
+    case 'r':
+      /* If this operand is the constant zero, write it as "$31".  */
+      if (GET_CODE (x) == REG)
+	fprintf (file, "%s", reg_names[REGNO (x)]);
+      else if (x == CONST0_RTX (GET_MODE (x)))
+	fprintf (file, "$31");
+      else
+	output_operand_lossage ("invalid %%r value");
+
+      break;
+
+    case 'R':
+      /* Similar, but for floating-point.  */
+      if (GET_CODE (x) == REG)
+	fprintf (file, "%s", reg_names[REGNO (x)]);
+      else if (x == CONST0_RTX (GET_MODE (x)))
+	fprintf (file, "$f31");
+      else
+	output_operand_lossage ("invalid %%R value");
+
+      break;
+
+    case 'N':
+      /* Write the 1's complement of a constant.  */
+      if (GET_CODE (x) != CONST_INT)
+	output_operand_lossage ("invalid %%N value");
+
+      fprintf (file, "%ld", ~ INTVAL (x));
+      break;
+
+    case 'P':
+      /* Write 1 << C, for a constant C.  */
+      if (GET_CODE (x) != CONST_INT)
+	output_operand_lossage ("invalid %%P value");
+
+      fprintf (file, "%ld", (HOST_WIDE_INT) 1 << INTVAL (x));
+      break;
+
+    case 'h':
+      /* Write the high-order 16 bits of a constant, sign-extended.  */
+      if (GET_CODE (x) != CONST_INT)
+	output_operand_lossage ("invalid %%h value");
+
+      fprintf (file, "%ld", INTVAL (x) >> 16);
+      break;
+
+    case 'L':
+      /* Write the low-order 16 bits of a constant, sign-extended.  */
+      if (GET_CODE (x) != CONST_INT)
+	output_operand_lossage ("invalid %%L value");
+
+      fprintf (file, "%ld", (INTVAL (x) & 0xffff) - 2 * (INTVAL (x) & 0x8000));
+      break;
+
+    case 'm':
+      /* Write mask for ZAP insn.  */
+      if (GET_CODE (x) == CONST_DOUBLE)
+	{
+	  HOST_WIDE_INT mask = 0;
+	  HOST_WIDE_INT value;
+
+	  value = CONST_DOUBLE_LOW (x);
+	  for (i = 0; i < HOST_BITS_PER_WIDE_INT / HOST_BITS_PER_CHAR;
+	       i++, value >>= 8)
+	    if (value & 0xff)
+	      mask |= (1 << i);
+
+	  value = CONST_DOUBLE_HIGH (x);
+	  for (i = 0; i < HOST_BITS_PER_WIDE_INT / HOST_BITS_PER_CHAR;
+	       i++, value >>= 8)
+	    if (value & 0xff)
+	      mask |= (1 << (i + sizeof (int)));
+
+	  fprintf (file, "%ld", mask & 0xff);
+	}
+
+      else if (GET_CODE (x) == CONST_INT)
+	{
+	  HOST_WIDE_INT mask = 0, value = INTVAL (x);
+
+	  for (i = 0; i < 8; i++, value >>= 8)
+	    if (value & 0xff)
+	      mask |= (1 << i);
+
+	  fprintf (file, "%ld", mask);
+	}
+      else
+	output_operand_lossage ("invalid %%m value");
+      break;
+
+    case 'M':
+      /* 'b', 'w', or 'l' as the value of the constant.  */
+      if (GET_CODE (x) != CONST_INT
+	  || (INTVAL (x) != 8 && INTVAL (x) != 16 && INTVAL (x) != 32))
+	output_operand_lossage ("invalid %%M value");
+
+      fprintf (file, "%s",
+	       INTVAL (x) == 8 ? "b" : INTVAL (x) == 16 ? "w" : "l");
+      break;
+
+    case 'U':
+      /* Similar, except do it from the mask.  */
+      if (GET_CODE (x) == CONST_INT && INTVAL (x) == 0xff)
+	fprintf (file, "b");
+      else if (GET_CODE (x) == CONST_INT && INTVAL (x) == 0xffff)
+	fprintf (file, "w");
+#if HOST_BITS_PER_WIDE_INT == 32
+      else if (GET_CODE (x) == CONST_DOUBLE
+	       && CONST_DOUBLE_HIGH (x) == 0
+	       && CONST_DOUBLE_LOW (x) == -1)
+	fprintf (file, "l");
+#else
+      else if (GET_CODE (x) == CONST_INT && INTVAL (x) == 0xffffffff)
+	fprintf (file, "l");
+#endif
+      else
+	output_operand_lossage ("invalid %%U value");
+      break;
+
+    case 's':
+      /* Write the constant value divided by 8.  */
+      if (GET_CODE (x) != CONST_INT
+	  && (unsigned HOST_WIDE_INT) INTVAL (x) >= 64
+	  && (INTVAL (x) & 7) != 8)
+	output_operand_lossage ("invalid %%s value");
+
+      fprintf (file, "%ld", INTVAL (x) / 8);
+      break;
+
+    case 'S':
+      /* Same, except compute (64 - c) / 8 */
+
+      if (GET_CODE (x) != CONST_INT
+	  && (unsigned HOST_WIDE_INT) INTVAL (x) >= 64
+	  && (INTVAL (x) & 7) != 8)
+	output_operand_lossage ("invalid %%s value");
+
+      fprintf (file, "%ld", (64 - INTVAL (x)) / 8);
+      break;
+
+    case 'C':
+      /* Write out comparison name.  */
+      if (GET_RTX_CLASS (GET_CODE (x)) != '<')
+	output_operand_lossage ("invalid %%C value");
+
+      if (GET_CODE (x) == LEU)
+	fprintf (file, "ule");
+      else if (GET_CODE (x) == LTU)
+	fprintf (file, "ult");
+      else
+	fprintf (file, "%s", GET_RTX_NAME (GET_CODE (x)));
+      break;
+
+    case 'D':
+      /* Similar, but write reversed code.  We can't get an unsigned code
+	 here.  */
+      if (GET_RTX_CLASS (GET_CODE (x)) != '<')
+	output_operand_lossage ("invalid %%D value");
+
+      fprintf (file, "%s", GET_RTX_NAME (reverse_condition (GET_CODE (x))));
+      break;
+
+    case 'E':
+      /* Write the divide or modulus operator.  */
+      switch (GET_CODE (x))
+	{
+	case DIV:
+	  fprintf (file, "div%s", GET_MODE (x) == SImode ? "l" : "q");
+	  break;
+	case UDIV:
+	  fprintf (file, "div%su", GET_MODE (x) == SImode ? "l" : "q");
+	  break;
+	case MOD:
+	  fprintf (file, "rem%s", GET_MODE (x) == SImode ? "l" : "q");
+	  break;
+	case UMOD:
+	  fprintf (file, "rem%su", GET_MODE (x) == SImode ? "l" : "q");
+	  break;
+	default:
+	  output_operand_lossage ("invalid %%E value");
+	  break;
+	}
+      break;
+
+    case 'F':
+      /* Write the symbol; if the current function uses GP, write a
+	 modified version.  */
+      if (GET_CODE (x) != SYMBOL_REF)
+	output_operand_lossage ("invalid %%F value");
+
+      output_addr_const (file, x);
+      if (alpha_function_needs_gp)
+	fprintf (file, "..ng");
+      break;
+
+    case 'A':
+      /* Write "_u" for unaligned access.  */
+      if (GET_CODE (x) == MEM && GET_CODE (XEXP (x, 0)) == AND)
+	fprintf (file, "_u");
+      break;
+
+    case 0:
+      if (GET_CODE (x) == REG)
+	fprintf (file, "%s", reg_names[REGNO (x)]);
+      else if (GET_CODE (x) == MEM)
+	output_address (XEXP (x, 0));
+      else
+	output_addr_const (file, x);
+      break;
+
+    default:
+      output_operand_lossage ("invalid %%xn code");
+    }
+}
+
+/* Do what is necessary for `va_start'.  The argument is ignored;
+   We look at the current function to determine if stdargs or varargs
+   is used and fill in an initial va_list.  A pointer to this constructor
+   is returned.  */
+
+struct rtx_def *
+alpha_builtin_saveregs (arglist)
+     tree arglist;
+{
+  rtx block, addr, argsize;
+  tree fntype = TREE_TYPE (current_function_decl);
+  int stdargs = (TYPE_ARG_TYPES (fntype) != 0
+		 && (TREE_VALUE (tree_last (TYPE_ARG_TYPES (fntype)))
+		     != void_type_node));
+  int nregs = current_function_args_info;
+
+  /* If we have a variable-sized argument already, we will have used all
+     the registers, so set up to indicate that.  */
+
+  if (GET_CODE (current_function_arg_offset_rtx) != CONST_INT)
+    {
+      argsize = plus_constant (current_function_arg_offset_rtx,
+			       ((6 - stdargs) * UNITS_PER_WORD
+				+ UNITS_PER_WORD - 1));
+      argsize = expand_shift (RSHIFT_EXPR, Pmode, argsize,
+			      build_int_2 (3, 0), argsize, 0);
+    }
+  else
+    {
+      /* If we are using memory, deduct the stdarg adjustment from it,
+	 otherwise from the number of registers.  Then compute the current
+	 argument number.  */
+
+      int memargs = ((INTVAL (current_function_arg_offset_rtx)
+		      + UNITS_PER_WORD - 1)
+		     / UNITS_PER_WORD);
+
+      if (memargs)
+	memargs -= stdargs;
+      else
+	nregs -= stdargs;
+
+      argsize = GEN_INT (MIN (nregs, 6) + memargs);
+    }
+
+  /* Allocate the va_list constructor */
+  block = assign_stack_local (BLKmode, 4 * UNITS_PER_WORD, BITS_PER_WORD);
+  RTX_UNCHANGING_P (block) = 1;
+  RTX_UNCHANGING_P (XEXP (block, 0)) = 1;
+
+  /* Store the argsize as the __va_arg member.  */
+  emit_move_insn (change_address (block, DImode, XEXP (block, 0)),
+		  argsize);
+
+  /* Store the arg pointer in the __va_stack member.  */
+  emit_move_insn (change_address (block, Pmode,
+				  plus_constant (XEXP (block, 0),
+						 UNITS_PER_WORD)),
+		  virtual_incoming_args_rtx);
+
+  /* Allocate the integer register space, and store it as the
+     __va_ireg member.  */
+  addr = assign_stack_local (BLKmode, 6 * UNITS_PER_WORD, -1);
+  MEM_IN_STRUCT_P (addr) = 1;
+  RTX_UNCHANGING_P (addr) = 1;
+  RTX_UNCHANGING_P (XEXP (addr, 0)) = 1;
+
+  emit_move_insn (change_address (block, Pmode,
+				  plus_constant (XEXP (block, 0),
+						 2 * UNITS_PER_WORD)),
+		  copy_to_reg (XEXP (addr, 0)));
+
+  /* Now store the incoming integer registers.  */
+  if (nregs < 6)
+      move_block_from_reg
+	(16 + nregs,
+	 change_address (addr, Pmode,
+			 plus_constant (XEXP (addr, 0),
+					nregs * UNITS_PER_WORD)),
+	 6 - nregs);
+
+  /* Allocate the FP register space, and store it as the
+     __va_freg member.  */
+  addr = assign_stack_local (BLKmode, 6 * UNITS_PER_WORD, -1);
+  MEM_IN_STRUCT_P (addr) = 1;
+  RTX_UNCHANGING_P (addr) = 1;
+  RTX_UNCHANGING_P (XEXP (addr, 0)) = 1;
+
+  emit_move_insn (change_address (block, Pmode,
+				  plus_constant (XEXP (block, 0),
+						 3 * UNITS_PER_WORD)),
+		  copy_to_reg (XEXP (addr, 0)));
+
+  /* Now store the incoming floating-point registers.   If we are not
+     to use the floating-point registers, store the integer registers
+     in those locations too.  */
+  if (nregs < 6)
+      move_block_from_reg
+	(16 + 32 * (TARGET_FPREGS != 0) + nregs,
+	 change_address (addr, Pmode,
+			 plus_constant (XEXP (addr, 0),
+					nregs * UNITS_PER_WORD)),
+	 6 - nregs);
+
+  /* Return the address of the va_list constructor, but don't put it in a
+     register.  This fails when not optimizing and produces worse code when
+     optimizing.  */
+  return XEXP (block, 0);
+}
+
+/* This page contains routines that are used to determine what the function
+   prologue and epilogue code will do and write them out.  */
+
+/* Compute the size of the save area in the stack.  */
+
+int
+alpha_sa_size ()
+{
+  int size = 0;
+  int i;
+
+  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
+    if (! fixed_regs[i] && ! call_used_regs[i] && regs_ever_live[i])
+      size++;
+
+  return size * 8;
+}
+
+/* Return non-zero if this function needs gp.  It does if it has
+   an LDSYM insn.  */
+
+int
+alpha_need_gp ()
+{
+  rtx insn;
+
+  for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
+    if (GET_RTX_CLASS (GET_CODE (insn)) == 'i'
+	&& GET_CODE (PATTERN (insn)) != USE
+	&& GET_CODE (PATTERN (insn)) != CLOBBER
+	&& get_attr_type (insn) == TYPE_LDSYM)
+      return 1;
+
+  return 0;
+}
+
+/* Return 1 if GP is dead at after INSN.  */
+
+int
+alpha_gp_dead_after (insn)
+     rtx insn;
+{
+  int jump_count = 0;
+  int found = 0;
+  rtx p;
+
+  /* If we aren't optimizing, don't do this optimization.  More importantly,
+     JUMP_LABEL isn't properly set when not optimizing.  */
+
+  if (optimize == 0)
+    return 0;
+
+  /* If we are followed by a BARRIER, we don't return.  */
+  if (NEXT_INSN (insn) && GET_CODE (NEXT_INSN (insn)) == BARRIER)
+    return 1;
+
+  /* Otherwise search for a use of GP before a return.  */
+
+  for (p = next_active_insn (insn); p; p = next_active_insn (p))
+    {
+      if (get_attr_type (p) == TYPE_LDSYM
+	  || get_attr_type (p) == TYPE_JSR)
+	{
+	  found = 1;
+	  break;
+	}
+
+      if (GET_CODE (p) == JUMP_INSN)
+	{
+	  if (GET_CODE (PATTERN (p)) == RETURN)
+	    break;
+
+	  if (! simplejump_p (p) || jump_count++ > 10)
+	    {
+	      found = 1;
+	      break;
+	    }
+
+	  p = JUMP_LABEL (p);
+	}
+    }
+
+  /* Restore any operands destroyed by the attribute calls above.  */
+  insn_extract (insn);
+
+  return ! found;
+}
+
+/* Return 1 if this function can directly return via $26.  */
+
+int
+direct_return ()
+{
+  return (reload_completed && alpha_sa_size () == 0
+	  && get_frame_size () == 0
+	  && current_function_pretend_args_size == 0);
+}
+
+/* Write function prologue.  */
+
+void
+output_prolog (file, size)
+     FILE *file;
+     int size;
+{
+  HOST_WIDE_INT frame_size = ((size + current_function_outgoing_args_size
+			       + current_function_pretend_args_size
+			       + alpha_sa_size () + 15) & ~15);
+  int reg_offset = current_function_outgoing_args_size;
+  int start_reg_offset = reg_offset;
+  unsigned reg_mask = 0;
+  int i;
+
+  /* If we need a GP, load it first.  */
+  alpha_function_needs_gp = alpha_need_gp ();
+
+  if (alpha_function_needs_gp)
+    {
+      rtx insn;
+
+      fprintf (file, "\tldgp $29,0($27)\n");
+
+      /* If we have a recursive call, put a special label here.  */
+      for (insn = get_insns (); insn; insn = NEXT_INSN (insn))
+	if (GET_CODE (insn) == CALL_INSN
+	    && get_attr_type (insn) != TYPE_JSR)
+	  {
+	    fprintf (file, "%s..ng:\n", current_function_name);
+	    break;
+	  }
+    }
+
+  /* Adjust the stack by the frame size.  If the frame size is > 32768
+     bytes, we have to load it into a register first and then subtract
+     from sp.  Note that we are only allowed to adjust sp once in the
+     prologue.  */
+
+  if (frame_size > 32768)
+    {
+      HOST_WIDE_INT low = (frame_size & 0xffff) - 2 * (frame_size & 0x8000);
+      HOST_WIDE_INT tmp1 = frame_size - low;
+      HOST_WIDE_INT high
+	= ((tmp1 >> 16) & 0xfff) - 2 * ((tmp1 >> 16) & 0x8000);
+      HOST_WIDE_INT tmp2 = frame_size - (high << 16) - low;
+      HOST_WIDE_INT extra = 0;
+      int in_reg = 31;
+
+      /* We haven't written code to handle frames > 4GB.  */
+#if HOST_BITS_PER_LONG_INT == 64
+      if ((unsigned HOST_WIDE_INT) frame_size >> 32 != 0)
+	abort ();
+#endif
+
+      if (tmp2)
+	{
+	  extra = 0x4000;
+	  tmp1 -= 0x40000000;
+	  high = ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+	}
+
+      if (low != 0)
+	{
+	  fprintf (file, "\tlda $28,%d($%d)\n", low, in_reg);
+	  in_reg = 28;
+	}
+
+      if (extra)
+	{
+	  fprintf (file, "\tldah $28,%d($%d)\n", extra, in_reg);
+	  in_reg = 28;
+	}
+
+      fprintf (file, "\tldah $28,%d($%d)\n", high, in_reg);
+
+      fprintf (file, "\tsubq $30,$28,$30\n");
+    }
+  else if (frame_size)
+    fprintf (file, "\tlda $30,-%d($30)\n", frame_size);
+
+  /* Write out the .frame line.  If we need a frame pointer, we use
+     an offset of zero.  */
+
+  if (frame_pointer_needed)
+    fprintf (file, "\t.frame $15,0,$26\n");
+  else
+    fprintf (file, "\t.frame $30,%d,$26\n", frame_size);
+
+    
+  /* Save register 26 if it is used.  */
+  if (regs_ever_live[26])
+    {
+      reg_mask |= 1 << 26;
+      fprintf (file, "\tstq $26,%d($30)\n", reg_offset);
+      reg_offset += 8;
+    }
+
+  /* Now save any other used register that are required to be saved.  */
+  for (i = 0; i < 32; i++)
+    if (! fixed_regs[i] && ! call_used_regs[i] && regs_ever_live[i] && i != 26)
+      {
+	reg_mask |= 1 << i;
+	fprintf (file, "\tstq $%d,%d($30)\n", i, reg_offset);
+	reg_offset += 8;
+      }
+
+  /* Print the register mask and do floating-point saves.  */
+  if (reg_mask)
+    fprintf (file, "\t.mask 0x%x,%d\n", reg_mask,
+	     start_reg_offset - frame_size);
+
+  start_reg_offset = reg_offset;
+  reg_mask = 0;
+
+  for (i = 0; i < 32; i++)
+    if (! fixed_regs[i + 32] && ! call_used_regs[i + 32]
+	&& regs_ever_live[i + 32])
+      {
+	reg_mask |= 1 << i;
+	fprintf (file, "\tstt $f%d,%d($30)\n", i, reg_offset);
+	reg_offset += 8;
+      }
+
+  /* Print the floating-point mask, if we've saved any fp register.  */
+  if (reg_mask)
+    fprintf (file, "\t.fmask 0x%x,%d\n", reg_mask, start_reg_offset);
+
+  /* If we need a frame pointer, set it to the value of incoming stack
+     which we compute by adding back the frame size pointer.  Because we
+     can subtract one more than we can add, we have to special-case
+     frame sizes of 32K.  Note that there is no restriction that the frame
+     pointer be updated in one instruction.  */
+
+  if (frame_pointer_needed)
+    {
+      if (frame_size == 32768)
+	fprintf (file, "\tlda $15,16384($30)\n\tlda $15,16384($15)\n");
+      else if (frame_size > 32768)
+	fprintf (file, "\tadd $30,$28,$15\n");
+      else
+	fprintf (file, "\tlda $15,%d($30)\n", frame_size);
+    }
+}
+
+/* Write function epilogue.  */
+
+void
+output_epilog (file, size)
+     FILE *file;
+     int size;
+{
+  rtx insn = get_last_insn ();
+  HOST_WIDE_INT frame_size = ((size + current_function_outgoing_args_size
+			       + current_function_pretend_args_size
+			       + alpha_sa_size () + 15) & ~15);
+  int reg_offset = current_function_outgoing_args_size;
+  int reg_offset_from = STACK_POINTER_REGNUM;
+  int i;
+
+  /* If the last insn was a BARRIER, we don't have to write anything except
+     the .end pseudo-op.  */
+  if (GET_CODE (insn) == NOTE)
+    insn = prev_nonnote_insn (insn);
+  if (insn == 0 || GET_CODE (insn) != BARRIER)
+    {
+      /* If we have a frame pointer, we restore the registers from an
+	 offset from it, assuming that we can reach the offset.  If not,
+	 we have to compute the address using a scratch register.  This is
+	 messy, but should not be common.  We have to copy the frame
+	 pointer elsewhere here since we will be restoring it before we can
+	 use it to restore the stack pointer.  We use $25.  */
+
+      if (frame_pointer_needed)
+	{
+	  fprintf (file, "\tbis $15,$15,$25\n");
+
+	  if (frame_size < 32768)
+	    reg_offset -= frame_size, reg_offset_from = 25;
+	  else
+	    {
+	      HOST_WIDE_INT low
+		= (frame_size & 0xffff) - 2 * (frame_size & 0x8000);
+	      HOST_WIDE_INT tmp1 = frame_size - low;
+	      HOST_WIDE_INT high
+		= ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+	      HOST_WIDE_INT tmp2 = frame_size - (high << 16) - low;
+	      int extra = 0xe;
+	      int in_reg = 31;
+
+	      if (tmp2)
+		{
+		  extra = 0x4000;
+		  tmp1 -= 0x40000000;	
+		  high = ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+		}
+
+	      if (low != 0)
+		{
+		  fprintf (file, "\tlda $28,%d($%d)\n", low, in_reg);
+		  in_reg = 28;
+		}
+
+	      if (extra)
+		{
+		  fprintf (file, "\tldah $28,%d($%d)\n", extra, in_reg);
+		  in_reg = 28;
+		}
+
+	      fprintf (file, "\tldah $28,%d($%d)\n", high, in_reg);
+
+	      fprintf (file, "\taddq $25,$28,$28\n");
+
+	      reg_offset_from = 28;
+	    }
+	}
+
+      /* Restore all the registers, starting with the return address
+	 register.  */
+      if (regs_ever_live[26])
+	{
+	  fprintf (file, "\tldq $26,%d($%d)\n", reg_offset, reg_offset_from);
+	  reg_offset += 8;
+	}
+
+      /* Now restore any other used register that that we saved.  */
+      for (i = 0; i < 32; i++)
+	if (! fixed_regs[i] && ! call_used_regs[i] && regs_ever_live[i]
+	    && i != 26)
+	  {
+	    fprintf (file, "\tldq $%d,%d($%d)\n",
+		     i, reg_offset, reg_offset_from);
+	    reg_offset += 8;
+	  }
+
+      for (i = 0; i < 32; i++)
+	if (! fixed_regs[i + 32] && ! call_used_regs[i + 32]
+	    && regs_ever_live[i + 32])
+	  {
+	    fprintf (file, "\tldt $f%d,%d($%d)\n",
+		     i, reg_offset, reg_offset_from);
+	    reg_offset += 8;
+	  }
+
+      /* Restore the stack.  If we have a frame pointer, use it.  Otherwise,
+	 add the size back into the stack, handling the large frame size.  */
+
+      if (frame_pointer_needed)
+	fprintf (file, "\tbis $25,$25,$30\n");
+      else if (frame_size > 32767)
+	{
+	  HOST_WIDE_INT low
+	    = (frame_size & 0xffff) - 2 * (frame_size & 0x8000);
+	  HOST_WIDE_INT tmp1 = frame_size - low;
+	  HOST_WIDE_INT high
+	    = ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+	  HOST_WIDE_INT tmp2 = frame_size - (high << 16) - low;
+	  HOST_WIDE_INT extra = 0;
+	  int in_reg = 31;
+
+	  /* We haven't written code to handle frames > 4GB.  */
+#if HOST_BITS_PER_LONG_INT == 64
+	  if ((unsigned HOST_WIDE_INT) frame_size >> 32 != 0)
+	    abort ();
+#endif
+
+	  if (tmp2)
+	    {
+	      extra = 0x4000;
+	      tmp1 -= 0x40000000;
+	      high = ((tmp1 >> 16) & 0xffff) - 2 * ((tmp1 >> 16) & 0x8000);
+	    }
+
+	  if (low != 0)
+	    {
+	      fprintf (file, "\tlda $28,%d($%d)\n", low, in_reg);
+	      in_reg = 28;
+	    }
+
+	  if (extra)
+	    {
+	      fprintf (file, "\tldah $28,%d($%d)\n", extra, in_reg);
+	      in_reg = 28;
+	    }
+
+	  fprintf (file, "\tldah $28,%d($%d)\n", high, in_reg);
+
+	  fprintf (file, "\taddq $30,$28,$30\n");
+	}
+      else if (frame_size)
+	fprintf (file, "\tlda $30,%d($30)\n", frame_size);
+
+      /* Now return to the caller.  */
+      fprintf (file, "\tret $31,($26),1\n");
+    }
+
+  /* End the function.  */
+  fprintf (file, "\t.end %s\n", alpha_function_name);
+}