OpenCores
URL https://opencores.org/ocsvn/openrisc/openrisc/trunk

Subversion Repositories openrisc

[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [gcc/] [config/] [rl78/] [rl78.c] - Rev 761

Go to most recent revision | Compare with Previous | Blame | View Log

/* Subroutines used for code generation on Renesas RL78 processors.
   Copyright (C) 2011 Free Software Foundation, Inc.
   Contributed by Red Hat.
 
   This file is part of GCC.
 
   GCC is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.
 
   GCC is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.
 
   You should have received a copy of the GNU General Public License
   along with GCC; see the file COPYING3.  If not see
   <http://www.gnu.org/licenses/>.  */
 
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "tm.h"
#include "tree.h"
#include "rtl.h"
#include "regs.h"
#include "hard-reg-set.h"
#include "insn-config.h"
#include "conditions.h"
#include "output.h"
#include "insn-attr.h"
#include "flags.h"
#include "function.h"
#include "expr.h"
#include "optabs.h"
#include "libfuncs.h"
#include "recog.h"
#include "diagnostic-core.h"
#include "toplev.h"
#include "reload.h"
#include "df.h"
#include "ggc.h"
#include "tm_p.h"
#include "debug.h"
#include "target.h"
#include "target-def.h"
#include "langhooks.h"
#include "rl78-protos.h"
#include "tree-pass.h"

static inline bool is_interrupt_func (const_tree decl);
static inline bool is_brk_interrupt_func (const_tree decl);
static void rl78_reorg (void);

 
/* Debugging statements are tagged with DEBUG0 only so that they can
   be easily enabled individually, by replacing the '0' with '1' as
   needed.  */
#define DEBUG0 0
#define DEBUG1 1
 
/* REGISTER_NAMES has the names for individual 8-bit registers, but
   these have the names we need to use when referring to 16-bit
   register pairs.  */
static const char * const word_regnames[] =
{
  "ax", "AX", "bc", "BC", "de", "DE", "hl", "HL",
  "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15",
  "r16", "r17", "r18", "r19", "r20", "r21", "r22", "r23",
  "r24", "r25", "r26", "r27", "r28", "r29", "r30", "r31",
  "sp", "ap", "psw", "es", "cs"
};
 
struct GTY(()) machine_function
{
  /* If set, the rest of the fields have been computed.  */
  int computed;
  /* Which register pairs need to be pushed in the prologue.  */
  int need_to_push [FIRST_PSEUDO_REGISTER / 2];
 
  /* These fields describe the frame layout...  */
  /* arg pointer */
  /* 4 bytes for saved PC */
  int framesize_regs;
  /* frame pointer */
  int framesize_locals;
  int framesize_outgoing;
  /* stack pointer */
  int framesize;
 
  /* If set, recog is allowed to match against the "real" patterns.  */
  int real_insns_ok;
  /* If set, recog is allowed to match against the "virtual" patterns.  */
  int virt_insns_ok;
  /* Set if the current function needs to clean up any trampolines.  */
  int trampolines_used;
};
 
/* This is our init_machine_status, as set in
   rl78_option_override.  */
static struct machine_function *
rl78_init_machine_status (void)
{
  struct machine_function *m;
 
  m = ggc_alloc_cleared_machine_function ();
  m->virt_insns_ok = 1;
 
  return m;
}
 
/* Returns whether to run the devirtualization pass.  */
static bool
devirt_gate (void)
{
  return true;
}
 
/* Runs the devirtualization pass.  */
static unsigned int
devirt_pass (void)
{
  rl78_reorg ();
  return 0;
}
 
/* This pass converts virtual instructions using virtual registers, to
   real instructions using real registers.  Rather than run it as
   reorg, we reschedule it before vartrack to help with debugging.  */
static struct opt_pass rl78_devirt_pass =
{
  RTL_PASS,
  "devirt",
  devirt_gate,
  devirt_pass,
  NULL,
  NULL,
  212,
  TV_MACH_DEP,
  0, 0, 0,
  0,
  TODO_dump_func
};
 
static struct register_pass_info rl78_devirt_info =
{
  & rl78_devirt_pass,
  "vartrack",
  1,
  PASS_POS_INSERT_BEFORE
};
 
#undef  TARGET_ASM_FILE_START
#define TARGET_ASM_FILE_START rl78_asm_file_start
 
static void
rl78_asm_file_start (void)
{
  int i;
 
  for (i = 0; i < 8; i++)
    {
      fprintf (asm_out_file, "r%d\t=\t0x%x\n", 8 + i, 0xffef0 + i);
      fprintf (asm_out_file, "r%d\t=\t0x%x\n", 16 + i, 0xffee8 + i);
    }
 
  register_pass (& rl78_devirt_info);
}
 

#undef  TARGET_OPTION_OVERRIDE
#define TARGET_OPTION_OVERRIDE		rl78_option_override
 
static void
rl78_option_override (void)
{
  flag_omit_frame_pointer = 1;
  flag_no_function_cse = 1;
  flag_split_wide_types = 0;
 
  init_machine_status = rl78_init_machine_status;
}
 
/* Most registers are 8 bits.  Some are 16 bits because, for example,
   gcc doesn't like dealing with $FP as a register pair.  This table
   maps register numbers to size in bytes.  */
static const int register_sizes[] =
{
  1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 2, 1,
  1, 1, 1, 1, 1, 1, 1, 1,
  2, 2, 1, 1, 1
};
 
/* Predicates used in the MD patterns.  This one is true when virtual
   insns may be matched, which typically means before (or during) the
   devirt pass.  */
bool
rl78_virt_insns_ok (void)
{
  if (cfun)
    return cfun->machine->virt_insns_ok;
  return true;
}
 
/* Predicates used in the MD patterns.  This one is true when real
   insns may be matched, which typically means after (or during) the
   devirt pass.  */
bool
rl78_real_insns_ok (void)
{
  if (cfun)
    return cfun->machine->real_insns_ok;
  return false;
}
 
/* Implements HARD_REGNO_NREGS.  */
int
rl78_hard_regno_nregs (int regno, enum machine_mode mode)
{
  int rs = register_sizes[regno];
  if (rs < 1)
    rs = 1;
  return ((GET_MODE_SIZE (mode) + rs - 1) / rs);
}
 
/* Implements HARD_REGNO_MODE_OK.  */
int
rl78_hard_regno_mode_ok (int regno, enum machine_mode mode)
{
  int s = GET_MODE_SIZE (mode);
 
  if (s < 1)
    return 0;
  /* These are not to be used by gcc.  */
  if (regno == 23 || regno == ES_REG || regno == CS_REG)
    return 0;
  /* $fp can alway sbe accessed as a 16-bit value.  */
  if (regno == FP_REG && s == 2)
    return 1;
  if (regno < SP_REG)
    {
      /* Since a reg-reg move is really a reg-mem move, we must
	 enforce alignment.  */
      if (s > 1 && (regno % 2))
	return 0;
      return 1;
    }
  if (s == CC_REGNUM)
    return (mode == BImode);
  /* All other registers must be accessed in their natural sizes.  */
  if (s == register_sizes [regno])
    return 1;
  return 0;
}
 
/* Simplify_gen_subreg() doesn't handle memory references the way we
   need it to below, so we use this function for when we must get a
   valid subreg in a "natural" state.  */
static rtx
rl78_subreg (enum machine_mode mode, rtx r, enum machine_mode omode, int byte)
{
  if (GET_CODE (r) == MEM)
    return adjust_address (r, mode, byte);
  else
    return simplify_gen_subreg (mode, r, omode, byte);
}
 
/* Used by movsi.  Split SImode moves into two HImode moves, using
   appropriate patterns for the upper and lower halves of symbols.  */
void
rl78_expand_movsi (rtx *operands)
{
  rtx op00, op02, op10, op12;
 
  op00 = rl78_subreg (HImode, operands[0], SImode, 0);
  op02 = rl78_subreg (HImode, operands[0], SImode, 2);
  if (GET_CODE (operands[1]) == CONST
      || GET_CODE (operands[1]) == SYMBOL_REF)
    {
      op10 = gen_rtx_ZERO_EXTRACT (HImode, operands[1], GEN_INT (16), GEN_INT (0));
      op10 = gen_rtx_CONST (HImode, op10);
      op12 = gen_rtx_ZERO_EXTRACT (HImode, operands[1], GEN_INT (16), GEN_INT (16));
      op12 = gen_rtx_CONST (HImode, op12);
    }
  else
    {
      op10 = rl78_subreg (HImode, operands[1], SImode, 0);
      op12 = rl78_subreg (HImode, operands[1], SImode, 2);
    }
 
  if (rtx_equal_p (operands[0], operands[1]))
    ;
  else if (rtx_equal_p (op00, op12))
    {
      emit_move_insn (op02, op12);
      emit_move_insn (op00, op10);
    }
  else
    {
      emit_move_insn (op00, op10);
      emit_move_insn (op02, op12);
    }
}
 
/* Used by various two-operand expanders which cannot accept all
   operands in the "far" namespace.  Force some such operands into
   registers so that each pattern has at most one far operand.  */
int
rl78_force_nonfar_2 (rtx *operands, rtx (*gen)(rtx,rtx))
{
  int did = 0;
  rtx temp_reg = NULL;
 
  /* FIXME: in the future, be smarter about only doing this if the
     other operand is also far, assuming the devirtualizer can also
     handle that.  */
  if (rl78_far_p (operands[0]))
    {
      temp_reg = operands[0];
      operands[0] = gen_reg_rtx (GET_MODE (operands[0]));
      did = 1;
    }
  if (!did)
    return 0;
 
  emit_insn (gen (operands[0], operands[1]));
  if (temp_reg)
    emit_move_insn (temp_reg, operands[0]);
  return 1;
}
 
/* Likewise, but for three-operand expanders.  */
int
rl78_force_nonfar_3 (rtx *operands, rtx (*gen)(rtx,rtx,rtx))
{
  int did = 0;
  rtx temp_reg = NULL;
 
  /* FIXME: Likewise.  */
  if (rl78_far_p (operands[1]))
    {
      rtx temp_reg = gen_reg_rtx (GET_MODE (operands[1]));
      emit_move_insn (temp_reg, operands[1]);
      operands[1] = temp_reg;
      did = 1;
    }
  if (rl78_far_p (operands[0]))
    {
      temp_reg = operands[0];
      operands[0] = gen_reg_rtx (GET_MODE (operands[0]));
      did = 1;
    }
  if (!did)
    return 0;
 
  emit_insn (gen (operands[0], operands[1], operands[2]));
  if (temp_reg)
    emit_move_insn (temp_reg, operands[0]);
  return 1;
}
 
#undef  TARGET_CAN_ELIMINATE
#define TARGET_CAN_ELIMINATE		rl78_can_eliminate
 
static bool
rl78_can_eliminate (const int from ATTRIBUTE_UNUSED, const int to ATTRIBUTE_UNUSED)
{
  return true;
}
 
/* Returns nonzero if the given register needs to be saved by the
   current function.  */
static int
need_to_save (int regno)
{
  if (is_interrupt_func (cfun->decl))
    {
      if (regno < 8)
	return 1; /* don't know what devirt will need */
      if (regno > 23)
	return 0; /* don't need to save interrupt registers */
      if (current_function_is_leaf)
	{
	  return df_regs_ever_live_p (regno);
	}
      else
	return 1;
    }
  if (regno == FRAME_POINTER_REGNUM && frame_pointer_needed)
    return 1;
  if (fixed_regs[regno])
    return 0;
  if (crtl->calls_eh_return)
    return 1;
  if (df_regs_ever_live_p (regno)
      && !call_used_regs[regno])
    return 1;
  return 0;
}
 
/* We use this to wrap all emitted insns in the prologue.  */
static rtx
F (rtx x)
{
  RTX_FRAME_RELATED_P (x) = 1;
  return x;
}
 
/* Compute all the frame-related fields in our machine_function
   structure.  */
static void
rl78_compute_frame_info (void)
{
  int i;
 
  cfun->machine->computed = 1;
  cfun->machine->framesize_regs = 0;
  cfun->machine->framesize_locals = get_frame_size ();
  cfun->machine->framesize_outgoing = crtl->outgoing_args_size;
 
  for (i = 0; i < 16; i ++)
    if (need_to_save (i * 2) || need_to_save (i * 2 + 1))
      {
	cfun->machine->need_to_push [i] = 1;
	cfun->machine->framesize_regs += 2;
      }
    else
      cfun->machine->need_to_push [i] = 0;
 
  if ((cfun->machine->framesize_locals + cfun->machine->framesize_outgoing) & 1)
    cfun->machine->framesize_locals ++;
 
  cfun->machine->framesize = (cfun->machine->framesize_regs
			      + cfun->machine->framesize_locals
			      + cfun->machine->framesize_outgoing);
}

/* Returns true if the provided function has the specified attribute.  */
static inline bool
has_func_attr (const_tree decl, const char * func_attr)
{
  if (decl == NULL_TREE)
    decl = current_function_decl;
 
  return lookup_attribute (func_attr, DECL_ATTRIBUTES (decl)) != NULL_TREE;
}
 
/* Returns true if the provided function has the "interrupt" attribute.  */
static inline bool
is_interrupt_func (const_tree decl)
{
  return has_func_attr (decl, "interrupt") || has_func_attr (decl, "brk_interrupt");
}
 
/* Returns true if the provided function has the "brk_interrupt" attribute.  */
static inline bool
is_brk_interrupt_func (const_tree decl)
{
  return has_func_attr (decl, "brk_interrupt");
}
 
/* Check "interrupt" attributes.  */
static tree
rl78_handle_func_attribute (tree * node,
			  tree   name,
			  tree   args,
			  int    flags ATTRIBUTE_UNUSED,
			  bool * no_add_attrs)
{
  gcc_assert (DECL_P (* node));
  gcc_assert (args == NULL_TREE);
 
  if (TREE_CODE (* node) != FUNCTION_DECL)
    {
      warning (OPT_Wattributes, "%qE attribute only applies to functions",
	       name);
      * no_add_attrs = true;
    }
 
  /* FIXME: We ought to check that the interrupt and exception
     handler attributes have been applied to void functions.  */
  return NULL_TREE;
}
 
#undef  TARGET_ATTRIBUTE_TABLE
#define TARGET_ATTRIBUTE_TABLE		rl78_attribute_table
 
/* Table of RL78-specific attributes.  */
const struct attribute_spec rl78_attribute_table[] =
{
  /* Name, min_len, max_len, decl_req, type_req, fn_type_req, handler,
     affects_type_identity.  */
  { "interrupt",      0, 0, true, false, false, rl78_handle_func_attribute,
    false },
  { "brk_interrupt",  0, 0, true, false, false, rl78_handle_func_attribute,
    false },
  { NULL,             0, 0, false, false, false, NULL, false }
};
 
 

/* Break down an address RTX into its component base/index/addend
   portions and return TRUE if the address is of a valid form, else
   FALSE.  */
static bool
characterize_address (rtx x, rtx *base, rtx *index, rtx *addend)
{
  *base = NULL_RTX;
  *index = NULL_RTX;
  *addend = NULL_RTX;
 
  if (GET_CODE (x) == REG)
    {
      *base = x;
      return true;
    }
 
  /* We sometimes get these without the CONST wrapper */
  if (GET_CODE (x) == PLUS
      && GET_CODE (XEXP (x, 0)) == SYMBOL_REF
      && GET_CODE (XEXP (x, 1)) == CONST_INT)
    {
      *addend = x;
      return true;
    }
 
  if (GET_CODE (x) == PLUS)
    {
      *base = XEXP (x, 0);
      x = XEXP (x, 1);
 
      if (GET_CODE (*base) != REG
	  && GET_CODE (x) == REG)
	{
	  rtx tmp = *base;
	  *base = x;
	  x = tmp;
	}
 
      if (GET_CODE (*base) != REG)
	return false;
 
      if (GET_CODE (x) == ZERO_EXTEND
	  && GET_CODE (XEXP (x, 0)) == REG)
	{
	  *index = XEXP (x, 0);
	  return false;
	}
    }
 
  switch (GET_CODE (x))
    {
    case PLUS:
      if (GET_CODE (XEXP (x, 0)) == SYMBOL_REF
	  && GET_CODE (XEXP (x, 0)) == CONST_INT)
	{
	  *addend = x;
	  return true;
	}
      /* fall through */
    case MEM:
    case REG:
      return false;
 
    case CONST:
    case SYMBOL_REF:
    case CONST_INT:
      *addend = x;
      return true;
 
    default:
      return false;
    }
 
  return false;
}
 
/* Used by the Whb constraint.  Match addresses that use HL+B or HL+C
   addressing.  */
bool
rl78_hl_b_c_addr_p (rtx op)
{
  rtx hl, bc;
 
  if (GET_CODE (op) != PLUS)
    return false;
  hl = XEXP (op, 0);
  bc = XEXP (op, 1);
  if (GET_CODE (hl) == ZERO_EXTEND)
    {
      rtx tmp = hl;
      hl = bc;
      bc = tmp;
    }
  if (GET_CODE (hl) != REG)
    return false;
  if (GET_CODE (bc) != ZERO_EXTEND)
    return false;
  bc = XEXP (bc, 0);
  if (GET_CODE (bc) != REG)
    return false;
  if (REGNO (hl) != HL_REG)
    return false;
  if (REGNO (bc) != B_REG && REGNO (bc) != C_REG)
    return false;
 
  return true;
}
 
#define REG_IS(r, regno) (((r) == (regno)) || ((r) >= FIRST_PSEUDO_REGISTER && !(strict)))
 
/* Used in various constraints and predicates to match operands in the
   "far" address space.  */
int
rl78_far_p (rtx x)
{
  if (GET_CODE (x) != MEM)
    return 0;
#if DEBUG0
  fprintf(stderr, "\033[35mrl78_far_p: "); debug_rtx(x);
  fprintf(stderr, " = %d\033[0m\n", MEM_ADDR_SPACE (x) == ADDR_SPACE_FAR);
#endif
  return MEM_ADDR_SPACE (x) == ADDR_SPACE_FAR;
}
 
/* Return the appropriate mode for a named address pointer.  */
#undef TARGET_ADDR_SPACE_POINTER_MODE
#define TARGET_ADDR_SPACE_POINTER_MODE rl78_addr_space_pointer_mode
static enum machine_mode
rl78_addr_space_pointer_mode (addr_space_t addrspace)
{
  switch (addrspace)
    {
    case ADDR_SPACE_GENERIC:
      return HImode;
    case ADDR_SPACE_FAR:
      return SImode;
    default:
      gcc_unreachable ();
    }
}
 
/* Return the appropriate mode for a named address address.  */
#undef TARGET_ADDR_SPACE_ADDRESS_MODE
#define TARGET_ADDR_SPACE_ADDRESS_MODE rl78_addr_space_address_mode
static enum machine_mode
rl78_addr_space_address_mode (addr_space_t addrspace)
{
  switch (addrspace)
    {
    case ADDR_SPACE_GENERIC:
      return HImode;
    case ADDR_SPACE_FAR:
      return SImode;
    default:
      gcc_unreachable ();
    }
}
 
#undef  TARGET_LEGITIMATE_CONSTANT_P
#define TARGET_LEGITIMATE_CONSTANT_P		rl78_is_legitimate_constant
 
static bool
rl78_is_legitimate_constant (enum machine_mode mode ATTRIBUTE_UNUSED, rtx x ATTRIBUTE_UNUSED)
{
  return true;
}
 
#undef  TARGET_ADDR_SPACE_LEGITIMATE_ADDRESS_P
#define TARGET_ADDR_SPACE_LEGITIMATE_ADDRESS_P	rl78_as_legitimate_address
 
bool
rl78_as_legitimate_address (enum machine_mode mode ATTRIBUTE_UNUSED, rtx x,
			    bool strict ATTRIBUTE_UNUSED, addr_space_t as ATTRIBUTE_UNUSED)
{
  rtx base, index, addend;
 
  if (as == ADDR_SPACE_GENERIC
      && GET_MODE (x) == SImode)
    return false;
 
  if (! characterize_address (x, &base, &index, &addend))
    return false;
 
  if (base && index)
    {
      int ir = REGNO (index);
      int br = REGNO (base);
 
#define OK(test, debug) if (test) { /*fprintf(stderr, "%d: OK %s\n", __LINE__, debug);*/ return true; }
      OK (REG_IS (br, HL_REG) && REG_IS (ir, B_REG), "[hl+b]");
      OK (REG_IS (br, HL_REG) && REG_IS (ir, C_REG), "[hl+c]");
      return false;
    }
 
  if (strict && base && GET_CODE (base) == REG && REGNO (base) >= FIRST_PSEUDO_REGISTER)
    return false;
 
  return true;
}
 
/* Determine if one named address space is a subset of another.  */
#undef  TARGET_ADDR_SPACE_SUBSET_P
#define TARGET_ADDR_SPACE_SUBSET_P rl78_addr_space_subset_p
static bool
rl78_addr_space_subset_p (addr_space_t subset, addr_space_t superset)
{
  gcc_assert (subset == ADDR_SPACE_GENERIC || subset == ADDR_SPACE_FAR);
  gcc_assert (superset == ADDR_SPACE_GENERIC || superset == ADDR_SPACE_FAR);
 
  if (subset == superset)
    return true;
 
  else
    return (subset == ADDR_SPACE_GENERIC && superset == ADDR_SPACE_FAR);
}
 
#undef  TARGET_ADDR_SPACE_CONVERT
#define TARGET_ADDR_SPACE_CONVERT rl78_addr_space_convert
/* Convert from one address space to another.  */
static rtx
rl78_addr_space_convert (rtx op, tree from_type, tree to_type)
{
  addr_space_t from_as = TYPE_ADDR_SPACE (TREE_TYPE (from_type));
  addr_space_t to_as = TYPE_ADDR_SPACE (TREE_TYPE (to_type));
  rtx result;
 
  gcc_assert (from_as == ADDR_SPACE_GENERIC || from_as == ADDR_SPACE_FAR);
  gcc_assert (to_as == ADDR_SPACE_GENERIC || to_as == ADDR_SPACE_FAR);
 
  if (to_as == ADDR_SPACE_GENERIC && from_as == ADDR_SPACE_FAR)
    {
      /* This is unpredictable, as we're truncating off usable address
	 bits.  */
 
      result = gen_reg_rtx (HImode);
      emit_move_insn (result, simplify_subreg (HImode, op, SImode, 0));
      return result;
    }
  else if (to_as == ADDR_SPACE_FAR && from_as == ADDR_SPACE_GENERIC)
    {
      /* This always works.  */
      result = gen_reg_rtx (SImode);
      debug_rtx(result);
      debug_rtx(op);
      emit_move_insn (rl78_subreg (HImode, result, SImode, 0), op);
      emit_move_insn (rl78_subreg (HImode, result, SImode, 2), const0_rtx);
      return result;
    }
  else
    gcc_unreachable ();
}
 
/* Implements REGNO_MODE_CODE_OK_FOR_BASE_P.  */
bool
rl78_regno_mode_code_ok_for_base_p (int regno, enum machine_mode mode ATTRIBUTE_UNUSED,
				    addr_space_t address_space ATTRIBUTE_UNUSED,
				    int outer_code ATTRIBUTE_UNUSED, int index_code)
{
  if (regno < 24 && regno >= 16)
    return true;
  if (index_code == REG)
    return (regno == HL_REG);
  if (regno == C_REG || regno == B_REG || regno == E_REG || regno == L_REG)
    return true;
  return false;
}
 
/* Implements MODE_CODE_BASE_REG_CLASS.  */
enum reg_class
rl78_mode_code_base_reg_class (enum machine_mode mode ATTRIBUTE_UNUSED,
			       addr_space_t address_space ATTRIBUTE_UNUSED,
			       int outer_code ATTRIBUTE_UNUSED,
			       int index_code ATTRIBUTE_UNUSED)
{
  return V_REGS;
}
 
/* Implements INITIAL_ELIMINATION_OFFSET.  The frame layout is
   described in the machine_Function struct definition, above.  */
int
rl78_initial_elimination_offset (int from, int to)
{
  int rv = 0; /* as if arg to arg */
 
  rl78_compute_frame_info ();
 
  switch (to)
    {
    case STACK_POINTER_REGNUM:
      rv += cfun->machine->framesize_outgoing;
      rv += cfun->machine->framesize_locals;
      /* Fall through.  */
    case FRAME_POINTER_REGNUM:
      rv += cfun->machine->framesize_regs;
      rv += 4;
      break;
    default:
      gcc_unreachable ();
    }
 
  switch (from)
    {
    case FRAME_POINTER_REGNUM:
      rv -= 4;
      rv -= cfun->machine->framesize_regs;
    case ARG_POINTER_REGNUM:
      break;
    default:
      gcc_unreachable ();
    }
 
  return rv;
}
 
/* Expand the function prologue (from the prologue pattern).  */
void
rl78_expand_prologue (void)
{
  int i, fs;
  rtx sp = gen_rtx_REG (HImode, STACK_POINTER_REGNUM);
  int rb = 0;
 
  if (!cfun->machine->computed)
    rl78_compute_frame_info ();
 
  for (i = 0; i < 16; i++)
    if (cfun->machine->need_to_push [i])
      {
	int need_bank = i/4;
	if (need_bank != rb)
	  {
	    emit_insn (gen_sel_rb (GEN_INT (need_bank)));
	    rb = need_bank;
	  }
	F (emit_insn (gen_push (gen_rtx_REG (HImode, i*2))));
      }
  if (rb != 0)
    emit_insn (gen_sel_rb (GEN_INT (0)));
 
  if (frame_pointer_needed)
    F (emit_move_insn (gen_rtx_REG (HImode, FRAME_POINTER_REGNUM),
		       gen_rtx_REG (HImode, STACK_POINTER_REGNUM)));
 
  fs = cfun->machine->framesize_locals + cfun->machine->framesize_outgoing;
  while (fs > 0)
    {
      int fs_byte = (fs > 254) ? 254 : fs;
      F (emit_insn (gen_subhi3 (sp, sp, GEN_INT (fs_byte))));
      fs -= fs_byte;
    }
}
 
/* Expand the function epilogue (from the epilogue pattern).  */
void
rl78_expand_epilogue (void)
{
  int i, fs;
  rtx sp = gen_rtx_REG (HImode, STACK_POINTER_REGNUM);
  int rb = 0;
 
  if (frame_pointer_needed)
    {
      emit_move_insn (gen_rtx_REG (HImode, STACK_POINTER_REGNUM),
		      gen_rtx_REG (HImode, FRAME_POINTER_REGNUM));
    }
  else
    {
      fs = cfun->machine->framesize_locals + cfun->machine->framesize_outgoing;
      while (fs > 0)
	{
	  int fs_byte = (fs > 254) ? 254 : fs;
 
	  emit_insn (gen_addhi3 (sp, sp, GEN_INT (fs_byte)));
	  fs -= fs_byte;
	}
    }
 
  for (i = 15; i >= 0; i--)
    if (cfun->machine->need_to_push [i])
      {
	int need_bank = i / 4;
 
	if (need_bank != rb)
	  {
	    emit_insn (gen_sel_rb (GEN_INT (need_bank)));
	    rb = need_bank;
	  }
	emit_insn (gen_pop (gen_rtx_REG (HImode, i * 2)));
      }
 
  if (rb != 0)
    emit_insn (gen_sel_rb (GEN_INT (0)));
 
  if (cfun->machine->trampolines_used)
    emit_insn (gen_trampoline_uninit ());
 
  if (is_brk_interrupt_func (cfun->decl))
    emit_jump_insn (gen_brk_interrupt_return ());
  else if (is_interrupt_func (cfun->decl))
    emit_jump_insn (gen_interrupt_return ());
  else
    emit_jump_insn (gen_rl78_return ());
}
 
/* Likewise, for exception handlers.  */
void
rl78_expand_eh_epilogue (rtx x ATTRIBUTE_UNUSED)
{
  /* FIXME - replace this with an indirect jump with stack adjust.  */
  emit_jump_insn (gen_rl78_return ());
}
 
#undef  TARGET_ASM_FUNCTION_PROLOGUE
#define TARGET_ASM_FUNCTION_PROLOGUE	rl78_start_function
 
/* We don't use this to actually emit the function prologue.  We use
   this to insert a comment in the asm file describing the
   function.  */
static void
rl78_start_function (FILE *file, HOST_WIDE_INT hwi_local ATTRIBUTE_UNUSED)
{
  int i;
 
  if (cfun->machine->framesize == 0)
    return;
  fprintf (file, "\t; start of function\n");
 
  if (cfun->machine->framesize_regs)
    {
      fprintf (file, "\t; push %d:", cfun->machine->framesize_regs);
      for (i = 0; i < 16; i ++)
	if (cfun->machine->need_to_push[i])
	  fprintf (file, " %s", word_regnames[i*2]);
      fprintf(file, "\n");
    }
 
  if (frame_pointer_needed)
    fprintf (file, "\t; $fp points here (r22)\n");
 
  if (cfun->machine->framesize_locals)
    fprintf (file, "\t; locals: %d byte%s\n", cfun->machine->framesize_locals,
	     cfun->machine->framesize_locals == 1 ? "" : "s");
 
  if (cfun->machine->framesize_outgoing)
    fprintf (file, "\t; outgoing: %d byte%s\n", cfun->machine->framesize_outgoing,
	     cfun->machine->framesize_outgoing == 1 ? "" : "s");
}
 
/* Return an RTL describing where a function return value of type RET_TYPE
   is held.  */
 
#undef  TARGET_FUNCTION_VALUE
#define TARGET_FUNCTION_VALUE		rl78_function_value
 
static rtx
rl78_function_value (const_tree ret_type,
		     const_tree fn_decl_or_type ATTRIBUTE_UNUSED,
		     bool       outgoing ATTRIBUTE_UNUSED)
{
  enum machine_mode mode = TYPE_MODE (ret_type);
 
  return gen_rtx_REG (mode, 8);
}
 
#undef  TARGET_PROMOTE_FUNCTION_MODE
#define TARGET_PROMOTE_FUNCTION_MODE rl78_promote_function_mode
 
static enum machine_mode
rl78_promote_function_mode (const_tree type ATTRIBUTE_UNUSED,
			    enum machine_mode mode,
			    int *punsignedp ATTRIBUTE_UNUSED,
			    const_tree funtype ATTRIBUTE_UNUSED, int for_return ATTRIBUTE_UNUSED)
{
  return mode;
}
 
/* Return an RTL expression describing the register holding a function
   parameter of mode MODE and type TYPE or NULL_RTX if the parameter should
   be passed on the stack.  CUM describes the previous parameters to the
   function and NAMED is false if the parameter is part of a variable
   parameter list, or the last named parameter before the start of a
   variable parameter list.  */
 
#undef  TARGET_FUNCTION_ARG
#define TARGET_FUNCTION_ARG     	rl78_function_arg
 
static rtx
rl78_function_arg (cumulative_args_t cum_v ATTRIBUTE_UNUSED,
		   enum machine_mode mode ATTRIBUTE_UNUSED,
		   const_tree type ATTRIBUTE_UNUSED,
		   bool named ATTRIBUTE_UNUSED)
{
  return NULL_RTX;
}
 
#undef  TARGET_FUNCTION_ARG_ADVANCE
#define TARGET_FUNCTION_ARG_ADVANCE     rl78_function_arg_advance
 
static void
rl78_function_arg_advance (cumulative_args_t cum_v, enum machine_mode mode, const_tree type,
			   bool named ATTRIBUTE_UNUSED)
{
  int rounded_size;
  CUMULATIVE_ARGS * cum = get_cumulative_args (cum_v);
 
  rounded_size = ((mode == BLKmode)
		  ? int_size_in_bytes (type) : GET_MODE_SIZE (mode));
  if (rounded_size & 1)
    rounded_size ++;
  (*cum) += rounded_size;
}
 
#undef  TARGET_FUNCTION_ARG_BOUNDARY
#define	TARGET_FUNCTION_ARG_BOUNDARY rl78_function_arg_boundary
 
static unsigned int
rl78_function_arg_boundary (enum machine_mode mode ATTRIBUTE_UNUSED,
			    const_tree type ATTRIBUTE_UNUSED)
{
  return 16;
}
 
/* Supported modifier letters:
 
   A - address of a MEM
   S - SADDR form of a real register
   v - real register corresponding to a virtual register
   m - minus - negative of CONST_INT value.
   c - inverse of a conditional (NE vs EQ for example)
 
   h - bottom HI of an SI
   H - top HI of an SI
   q - bottom QI of an HI
   Q - top QI of an HI
   e - third QI of an SI (i.e. where the ES register gets values from)
 
*/
 
/* Implements the bulk of rl78_print_operand, below.  We do it this
   way because we need to test for a constant at the top level and
   insert the '#', but not test for it anywhere else as we recurse
   down into the operand.  */
static void
rl78_print_operand_1 (FILE * file, rtx op, int letter)
{
  int need_paren;
 
  switch (GET_CODE (op))
    {
    case MEM:
      if (letter == 'A')
	rl78_print_operand_1 (file, XEXP (op, 0), letter);
      else
	{
	  if (rl78_far_p (op))
	    fprintf(file, "es:");
	  if (letter == 'H')
	    {
	      op = adjust_address (op, HImode, 2);
	      letter = 0;
	    }
	  if (letter == 'h')
	    {
	      op = adjust_address (op, HImode, 0);
	      letter = 0;
	    }
	  if (letter == 'Q')
	    {
	      op = adjust_address (op, QImode, 1);
	      letter = 0;
	    }
	  if (letter == 'q')
	    {
	      op = adjust_address (op, QImode, 0);
	      letter = 0;
	    }
	  if (letter == 'e')
	    {
	      op = adjust_address (op, QImode, 2);
	      letter = 0;
	    }
	  if (CONSTANT_P (XEXP (op, 0)))
	    {
	      fprintf(file, "!");
	      rl78_print_operand_1 (file, XEXP (op, 0), letter);
	    }
	  else if (GET_CODE (XEXP (op, 0)) == PLUS
		   && GET_CODE (XEXP (XEXP (op, 0), 0)) == SYMBOL_REF)
	    {
	      fprintf(file, "!");
	      rl78_print_operand_1 (file, XEXP (op, 0), letter);
	    }
	  else if (GET_CODE (XEXP (op, 0)) == PLUS
		   && GET_CODE (XEXP (XEXP (op, 0), 0)) == REG
		   && REGNO (XEXP (XEXP (op, 0), 0)) == 2)
	    {
	      rl78_print_operand_1 (file, XEXP (XEXP (op, 0), 1), 'u');
	      fprintf(file, "[");
	      rl78_print_operand_1 (file, XEXP (XEXP (op, 0), 0), 0);
	      fprintf(file, "]");
	    }
	  else
	    {
	      fprintf(file, "[");
	      rl78_print_operand_1 (file, XEXP (op, 0), letter);
	      fprintf(file, "]");
	    }
	}
      break;
 
    case REG:
      if (letter == 'Q')
	fprintf (file, "%s", reg_names [REGNO (op) | 1]);
      else if (letter == 'H')
	fprintf (file, "%s", reg_names [REGNO (op) + 2]);
      else if (letter == 'q')
	fprintf (file, "%s", reg_names [REGNO (op) & ~1]);
      else if (letter == 'e')
	fprintf (file, "%s", reg_names [REGNO (op) + 2]);
      else if (letter == 'S')
	fprintf (file, "0x%x", 0xffef8 + REGNO (op));
      else if (GET_MODE (op) == HImode
	       && ! (REGNO (op) & ~0xfe))
	{
	  if (letter == 'v')
	    fprintf (file, "%s", word_regnames [REGNO (op) % 8]);
	  else
	    fprintf (file, "%s", word_regnames [REGNO (op)]);
	}
      else
	fprintf (file, "%s", reg_names [REGNO (op)]);
      break;
 
    case CONST_INT:
      if (letter == 'Q')
	fprintf (file, "%ld", INTVAL (op) >> 8);
      else if (letter == 'H')
	fprintf (file, "%ld", INTVAL (op) >> 16);
      else if (letter == 'q')
	fprintf (file, "%ld", INTVAL (op) & 0xff);
      else if (letter == 'h')
	fprintf (file, "%ld", INTVAL (op) & 0xffff);
      else if (letter == 'e')
	fprintf (file, "%ld", (INTVAL (op) >> 16) & 0xff);
      else if (letter == 'm')
	fprintf (file, "%ld", - INTVAL (op));
      else
	fprintf(file, "%ld", INTVAL (op));
      break;
 
    case CONST:
      rl78_print_operand_1 (file, XEXP (op, 0), letter);
      break;
 
    case ZERO_EXTRACT:
      {
	int bits = INTVAL (XEXP (op, 1));
	int ofs = INTVAL (XEXP (op, 2));
	if (bits == 16 && ofs == 0)
	  fprintf (file, "%%lo16(");
	else if (bits == 16 && ofs == 16)
	  fprintf (file, "%%hi16(");
	else if (bits == 8 && ofs == 16)
	  fprintf (file, "%%hi8(");
	else
	  gcc_unreachable ();
	rl78_print_operand_1 (file, XEXP (op, 0), 0);
	fprintf (file, ")");
      }
      break;
 
    case ZERO_EXTEND:
      if (GET_CODE (XEXP (op, 0)) == REG)
	fprintf (file, "%s", reg_names [REGNO (XEXP (op, 0))]);
      else
	print_rtl (file, op);
      break;
 
    case PLUS:
      need_paren = 0;
      if (letter == 'H')
	{
	  fprintf (file, "%%hi16(");
	  need_paren = 1;
	  letter = 0;
	}
      if (letter == 'h')
	{
	  fprintf (file, "%%lo16(");
	  need_paren = 1;
	  letter = 0;
	}
      if (letter == 'e')
	{
	  fprintf (file, "%%hi8(");
	  need_paren = 1;
	  letter = 0;
	}
      if (letter == 'q' || letter == 'Q')
	output_operand_lossage ("q/Q modifiers invalid for symbol references");
 
      if (GET_CODE (XEXP (op, 0)) == ZERO_EXTEND)
	{
	  rl78_print_operand_1 (file, XEXP (op, 1), letter);
	  fprintf (file, "+");
	  rl78_print_operand_1 (file, XEXP (op, 0), letter);
	}
      else
	{
	  rl78_print_operand_1 (file, XEXP (op, 0), letter);
	  fprintf (file, "+");
	  rl78_print_operand_1 (file, XEXP (op, 1), letter);
	}
      if (need_paren)
	fprintf (file, ")");
      break;
 
    case SYMBOL_REF:
      need_paren = 0;
      if (letter == 'H')
	{
	  fprintf (file, "%%hi16(");
	  need_paren = 1;
	  letter = 0;
	}
      if (letter == 'h')
	{
	  fprintf (file, "%%lo16(");
	  need_paren = 1;
	  letter = 0;
	}
      if (letter == 'e')
	{
	  fprintf (file, "%%hi8(");
	  need_paren = 1;
	  letter = 0;
	}
      if (letter == 'q' || letter == 'Q')
	output_operand_lossage ("q/Q modifiers invalid for symbol references");
 
      output_addr_const (file, op);
      if (need_paren)
	fprintf (file, ")");
      break;
 
    case CODE_LABEL:
    case LABEL_REF:
      output_asm_label (op);
      break;
 
    case LTU:
      fprintf (file, letter == 'c' ? "nc" : "c");
      break;
    case LEU:
      fprintf (file, letter == 'c' ? "h" : "nh");
      break;
    case GEU:
      fprintf (file, letter == 'c' ? "c" : "nc");
      break;
    case GTU:
      fprintf (file, letter == 'c' ? "nh" : "h");
      break;
    case EQ:
      fprintf (file, letter == 'c' ? "nz" : "z");
      break;
    case NE:
      fprintf (file, letter == 'c' ? "z" : "nz");
      break;
 
    default:
      fprintf (file, "(%s)", GET_RTX_NAME (GET_CODE (op)));
      break;
    }
}
 
#undef  TARGET_PRINT_OPERAND
#define TARGET_PRINT_OPERAND		rl78_print_operand
 
static void
rl78_print_operand (FILE * file, rtx op, int letter)
{
  if (CONSTANT_P (op) && letter != 'u')
    fprintf (file, "#");
  rl78_print_operand_1 (file, op, letter);
}
 
#undef  TARGET_TRAMPOLINE_INIT
#define TARGET_TRAMPOLINE_INIT rl78_trampoline_init
 
/* Note that the RL78's addressing makes it very difficult to do
   trampolines on the stack.  So, libgcc has a small pool of
   trampolines from which one is allocated to this task.  */
static void
rl78_trampoline_init (rtx m_tramp, tree fndecl, rtx static_chain)
{
  rtx mov_addr, thunk_addr;
  rtx function = XEXP (DECL_RTL (fndecl), 0);
 
  mov_addr = adjust_address (m_tramp, HImode, 0);
  thunk_addr = gen_reg_rtx (HImode);
 
  function = force_reg (HImode, function);
  static_chain = force_reg (HImode, static_chain);
 
  emit_insn (gen_trampoline_init (thunk_addr, function, static_chain));
  emit_move_insn (mov_addr, thunk_addr);
 
  cfun->machine->trampolines_used = 1;
}
 
#undef  TARGET_TRAMPOLINE_ADJUST_ADDRESS
#define TARGET_TRAMPOLINE_ADJUST_ADDRESS rl78_trampoline_adjust_address
 
static rtx
rl78_trampoline_adjust_address (rtx m_tramp)
{
  rtx x = gen_rtx_MEM (HImode, m_tramp);
  return x;
}

/* Expander for cbranchqi4 and cbranchhi4.  RL78 is missing some of
   the "normal" compares, specifically, it only has unsigned compares,
   so we must synthesize the missing ones.  */
void
rl78_expand_compare (rtx *operands)
{
  /* RL78 does not have signed comparisons.  We must modify the
     operands to be in the unsigned range, and emit an unsigned
     comparison.  */
 
  enum machine_mode mode;
  rtx high_bit;
  int i;
  RTX_CODE new_cond;
 
  switch (GET_CODE (operands[0]))
    {
    case GE:
      new_cond = GEU;
      break;
    case LE:
      new_cond = LEU;
      break;
    case GT:
      new_cond = GTU;
      break;
    case LT:
      new_cond = LTU;
      break;
    default:
      return;
    }
 
#if DEBUG0
  fprintf (stderr, "\033[38;5;129mrl78_expand_compare\n");
  debug_rtx (operands[0]);
  fprintf (stderr, "\033[0m");
#endif
 
  mode = GET_MODE (operands[1]);
  if (mode == VOIDmode)
    mode = GET_MODE (operands[2]);
  high_bit = GEN_INT (~0 << (GET_MODE_BITSIZE (mode) - 1));
 
  /* 0: conditional 1,2: operands */
  for (i = 1; i <= 2; i ++)
    {
      rtx r = operands[i];
 
      if (GET_CODE (r) == CONST_INT)
	r = GEN_INT (INTVAL (r) ^ INTVAL (high_bit));
      else
	{
	  r = gen_rtx_PLUS (mode, operands[i], high_bit);
	  r = copy_to_mode_reg (mode, r);
	}
      operands[i] = r;
    }
 
  operands[0] = gen_rtx_fmt_ee (new_cond, GET_MODE (operands[0]), operands[1], operands[2]);
 
#if DEBUG0
  fprintf (stderr, "\033[38;5;142mrl78_expand_compare\n");
  debug_rtx (operands[0]);
  fprintf (stderr, "\033[0m");
#endif
}
 

 
/* Define this to 1 if you are debugging the peephole optimizers.  */
#define DEBUG_PEEP 0
 
/* Predicate used to enable the peephole2 patterns in rl78-virt.md.
   The default "word" size is a byte so we can effectively use all the
   registers, but we want to do 16-bit moves whenever possible.  This
   function determines when such a move is an option.  */
bool
rl78_peep_movhi_p (rtx *operands)
{
  int i;
  rtx m, a;
 
  /* (set (op0) (op1))
     (set (op2) (op3)) */
 
#if DEBUG_PEEP
  fprintf (stderr, "\033[33m");
  debug_rtx(operands[0]);
  debug_rtx(operands[1]);
  debug_rtx(operands[2]);
  debug_rtx(operands[3]);
  fprintf (stderr, "\033[0m");
#endif
 
  if (rtx_equal_p (operands[0], operands[3]))
    {
#if DEBUG_PEEP
      fprintf (stderr, "no peep: overlapping\n");
#endif
      return false;
    }
 
  for (i = 0; i < 2; i ++)
    {
      if (GET_CODE (operands[i]) != GET_CODE (operands[i+2]))
	{
#if DEBUG_PEEP
	  fprintf (stderr, "no peep: different codes\n");
#endif
	  return false;
	}
      if (GET_MODE (operands[i]) != GET_MODE (operands[i+2]))
	{
#if DEBUG_PEEP
	  fprintf (stderr, "no peep: different modes\n");
#endif
	  return false;
	}
 
      switch (GET_CODE (operands[i]))
	{
	case REG:
	  /*   LSB                      MSB  */
	  if (REGNO (operands[i]) + 1 != REGNO (operands[i+2])
	      || GET_MODE (operands[i]) != QImode)
	    {
#if DEBUG_PEEP
	      fprintf (stderr, "no peep: wrong regnos %d %d %d\n",
		       REGNO (operands[i]), REGNO (operands[i+2]),
		       i);
#endif
	      return false;
	    }
	  if (! rl78_hard_regno_mode_ok (REGNO (operands[i]), HImode))
	    {
#if DEBUG_PEEP
	      fprintf (stderr, "no peep: reg %d not HI\n", REGNO (operands[i]));
#endif
	      return false;
	    }
	  break;
 
	case CONST_INT:
	  break;
 
	case MEM:
	  if (GET_MODE (operands[i]) != QImode)
	    return false;
	  if (MEM_ALIGN (operands[i]) < 16)
	    return false;
	  a = XEXP (operands[i], 0);
	  if (GET_CODE (a) == CONST)
	    a = XEXP (a, 0);
	  if (GET_CODE (a) == PLUS)
	    a = XEXP (a, 1);
	  if (GET_CODE (a) == CONST_INT
	      && INTVAL (a) & 1)
	    {
#if DEBUG_PEEP
	      fprintf (stderr, "no peep: misaligned mem %d\n", i);
	      debug_rtx (operands[i]);
#endif
	      return false;
	    }
	  m = adjust_address (operands[i], QImode, 1);
	  if (! rtx_equal_p (m, operands[i+2]))
	    {
#if DEBUG_PEEP
	      fprintf (stderr, "no peep: wrong mem %d\n", i);
	      debug_rtx(m);
	      debug_rtx (operands[i+2]);
#endif
	      return false;
	    }
	  break;
 
	default:
#if DEBUG_PEEP
	  fprintf (stderr, "no peep: wrong rtx %d\n", i);
#endif
	  return false;
	}
    }
#if DEBUG_PEEP
  fprintf (stderr, "\033[32mpeep!\033[0m\n");
#endif
  return true;
}
 
/* Likewise, when a peephole is activated, this function helps compute
   the new operands.  */
void
rl78_setup_peep_movhi (rtx *operands)
{
  int i;
 
  for (i = 0; i < 2; i ++)
    {
      switch (GET_CODE (operands[i]))
	{
	case REG:
	  operands[i+4] = gen_rtx_REG (HImode, REGNO (operands[i]));
	  break;
 
	case CONST_INT:
	  operands[i+4] = GEN_INT ((INTVAL (operands[i]) & 0xff) + ((char)INTVAL (operands[i+2])) * 256);
	  break;
 
	case MEM:
	  operands[i+4] = adjust_address (operands[i], HImode, 0);
	  break;
 
	default:
	  break;
	}
    }
}

/*
	How Devirtualization works in the RL78 GCC port
 
Background
 
The RL78 is an 8-bit port with some 16-bit operations.  It has 32
bytes of register space, in four banks, memory-mapped.  One bank is
the "selected" bank and holds the registers used for primary
operations.  Since the registers are memory mapped, often you can
still refer to the unselected banks via memory accesses.
 
Virtual Registers
 
The GCC port uses bank 0 as the "selected" registers (A, X, BC, etc)
and refers to the other banks via their memory addresses, although
they're treated as regular registers internally.  These "virtual"
registers are R8 through R23 (bank3 is reserved for asm-based
interrupt handlers).
 
There are four machine description files:
 
rl78.md        - common register-independent patterns and definitions
rl78-expand.md - expanders
rl78-virt.md   - patterns that match BEFORE devirtualization
rl78-real.md   - patterns that match AFTER devirtualization
 
At least through register allocation and reload, gcc is told that it
can do pretty much anything - but may only use the virtual registers.
GCC cannot properly create the varying addressing modes that the RL78
supports in an efficient way.
 
Sometime after reload, the RL78 backend "devirtualizes" the RTL.  It
uses the "valloc" attribute in rl78-virt.md for determining the rules
by which it will replace virtual registers with real registers (or
not) and how to make up addressing modes.  For example, insns tagged
with "ro1" have a single read-only parameter, which may need to be
moved from memory/constant/vreg to a suitable real register.  As part
of devirtualization, a flag is toggled, disabling the rl78-virt.md
patterns and enabling the rl78-real.md patterns.  The new patterns'
constraints are used to determine the real registers used.  NOTE:
patterns in rl78-virt.md essentially ignore the constrains and rely on
predicates, where the rl78-real.md ones essentially ignore the
predicates and rely on the constraints.
 
The devirtualization pass is scheduled via the pass manager (despite
being called "rl78_reorg") so it can be scheduled prior to var-track
(the idea is to let gdb know about the new registers).  Ideally, it
would be scheduled right after pro/epilogue generation, so the
post-reload optimizers could operate on the real registers, but when I
tried that there were some issues building the target libraries.
 
During devirtualization, a simple register move optimizer is run.  It
would be better to run a full CSE/propogation pass on it through, or
re-run regmove, but that has not yet been attempted.
 
 */
#define DEBUG_ALLOC 0
 
/* Rescans an insn to see if it's recognized again.  This is done
   carefully to ensure that all the constraint information is accurate
   for the newly matched insn.  */
static bool
insn_ok_now (rtx insn)
{
  INSN_CODE (insn) = -1;
  if (recog (PATTERN (insn), insn, 0) > -1)
    {
      extract_insn (insn);
      if (constrain_operands (1))
	{
#if DEBUG_ALLOC
	  fprintf (stderr, "\033[32m");
	  debug_rtx (insn);
	  fprintf (stderr, "\033[0m");
#endif
	  return true;
	}
    }
  else
    {
      fprintf (stderr, "\033[41;30m Unrecognized insn \033[0m\n");
      debug_rtx (insn);
      gcc_unreachable ();
    }
#if DEBUG_ALLOC
  fprintf (stderr, "\033[31m");
  debug_rtx (insn);
  fprintf (stderr, "\033[0m");
#endif
  return false;
}
 
#if DEBUG_ALLOC
#define WORKED fprintf (stderr, "\033[48;5;22m Worked at line %d \033[0m\n", __LINE__)
#define FAILEDSOFAR fprintf (stderr, "\033[48;5;52m FAILED at line %d \033[0m\n", __LINE__)
#define FAILED fprintf (stderr, "\033[48;5;52m FAILED at line %d \033[0m\n", __LINE__), gcc_unreachable()
#define MAYBE_OK(insn) if (insn_ok_now (insn)) { WORKED; return; } else { FAILEDSOFAR; }
#else
#define WORKED
#define FAILEDSOFAR
#define FAILED gcc_unreachable ()
#define MAYBE_OK(insn) if (insn_ok_now (insn)) return;
#endif
 
/* Registers into which we move the contents of virtual registers.  */
#define X gen_rtx_REG (QImode, 0)
#define A gen_rtx_REG (QImode, 1)
#define C gen_rtx_REG (QImode, 2)
#define B gen_rtx_REG (QImode, 3)
#define E gen_rtx_REG (QImode, 4)
#define D gen_rtx_REG (QImode, 5)
#define L gen_rtx_REG (QImode, 6)
#define H gen_rtx_REG (QImode, 7)
 
#define AX gen_rtx_REG (HImode, 0)
#define BC gen_rtx_REG (HImode, 2)
#define DE gen_rtx_REG (HImode, 4)
#define HL gen_rtx_REG (HImode, 6)
 
#define OP(x) (*recog_data.operand_loc[x])
 
/* Returns TRUE if R is a virtual register.  */
static bool
is_virtual_register (rtx r)
{
  return (GET_CODE (r) == REG
	  && REGNO (r) >= 8
	  && REGNO (r) < 24);
}
 
/* In all these alloc routines, we expect the following: the insn
   pattern is unshared, the insn was previously recognized and failed
   due to predicates or constraints, and the operand data is in
   recog_data.  */
 
static int virt_insn_was_frame;
 
/* Hook for all insns we emit.  Re-mark them as FRAME_RELATED if
   needed.  */
static rtx
EM2 (int line ATTRIBUTE_UNUSED, rtx r)
{
#if DEBUG_ALLOC
  fprintf (stderr, "\033[36m%d: ", line);
  debug_rtx(r);
  fprintf (stderr, "\033[0m");
#endif
  /*SCHED_GROUP_P (r) = 1;*/
  if (virt_insn_was_frame)
    RTX_FRAME_RELATED_P (r) = 1;
  return r;
}
 
#define EM(x) EM2 (__LINE__, x)
 
/* Return a suitable RTX for the low half of a __far address.  */
static rtx
rl78_lo16 (rtx addr)
{
  if (GET_CODE (addr) == SYMBOL_REF
      || GET_CODE (addr) == CONST)
    {
      rtx r = gen_rtx_ZERO_EXTRACT (HImode, addr, GEN_INT (16), GEN_INT (0));
      r = gen_rtx_CONST (HImode, r);
      return r;
    }
  return rl78_subreg (HImode, addr, SImode, 0);
}
 
/* Return a suitable RTX for the high half's lower byte of a __far address.  */
static rtx
rl78_hi8 (rtx addr)
{
  if (GET_CODE (addr) == SYMBOL_REF
      || GET_CODE (addr) == CONST)
    {
      rtx r = gen_rtx_ZERO_EXTRACT (QImode, addr, GEN_INT (8), GEN_INT (16));
      r = gen_rtx_CONST (QImode, r);
      return r;
    }
  return rl78_subreg (QImode, addr, SImode, 2);
}
 
/* Copy any register values into real registers and return an RTX for
   the same memory, now addressed by real registers.  Any needed insns
   are emitted before BEFORE.  */
static rtx
transcode_memory_rtx (rtx m, rtx newbase, rtx before)
{
  rtx base, index, addendr;
  int addend = 0;
 
  if (GET_CODE (m) != MEM)
    return m;
 
  if (GET_MODE (XEXP (m, 0)) == SImode)
    {
      rtx seg = rl78_hi8 (XEXP (m, 0));
#if DEBUG_ALLOC
      fprintf (stderr, "setting ES:\n");
      debug_rtx(seg);
#endif
      emit_insn_before (EM(gen_movqi (A, seg)), before);
      emit_insn_before (EM(gen_movqi_es (A)), before);
      m = change_address (m, GET_MODE (m), rl78_lo16 (XEXP (m, 0)));
    }
 
  characterize_address (XEXP (m, 0), &base, &index, &addendr);
  gcc_assert (index == NULL_RTX);
 
#if DEBUG_ALLOC
  fprintf (stderr, "\033[33m"); debug_rtx(m); fprintf (stderr, "\033[0m");
  debug_rtx (base);
#endif
  if (base == NULL_RTX)
    return m;
 
  if (addendr && GET_CODE (addendr) == CONST_INT)
    addend = INTVAL (addendr);
 
  if (REGNO (base) == SP_REG)
    {
      if (addend >= 0 && addend  <= 255)
	return m;
    }
 
  /* BASE should be a virtual register.  We copy it to NEWBASE.  If
     the addend is out of range for DE/HL, we use AX to compute the full
     address.  */
 
  if (addend < 0
      || (addend > 255 && REGNO (newbase) != 2)
      || (addendr && GET_CODE (addendr) != CONST_INT))
    {
      /* mov ax, vreg
	 add ax, #imm
	 mov hl, ax	*/
      EM (emit_insn_before (gen_movhi (AX, base), before));
      EM (emit_insn_before (gen_addhi3 (AX, AX, addendr), before));
      EM (emit_insn_before (gen_movhi (newbase, AX), before));
      base = newbase;
      addend = 0;
    }
  else
    {
      EM (emit_insn_before (gen_movhi (newbase, base), before));
      base = newbase;
    }
 
  if (addend)
    base = gen_rtx_PLUS (HImode, base, GEN_INT (addend));
 
#if DEBUG_ALLOC
  fprintf (stderr, "\033[33m");
  debug_rtx (m);
#endif
  m = change_address (m, GET_MODE (m), base);
#if DEBUG_ALLOC
  debug_rtx (m);
  fprintf (stderr, "\033[0m");
#endif
  return m;
}
 
/* Copy SRC to accumulator (A or AX), placing any generated insns
   before BEFORE.  Returns accumulator RTX.  */
 
static rtx
move_to_acc (int opno, rtx before)
{
  rtx src = OP(opno);
  enum machine_mode mode = GET_MODE (src);
 
  if (GET_CODE (src) == REG
      && REGNO (src) < 2)
    return src;
 
  if (mode == VOIDmode)
    mode = recog_data.operand_mode[opno];
 
  if (mode == QImode)
    {
      EM (emit_insn_before (gen_movqi (A, src), before));
      return A;
    }
  else
    {
      EM (emit_insn_before (gen_movhi (AX, src), before));
      return AX;
    }
}
 
/* Copy accumulator (A or AX) to DEST, placing any generated insns
   after AFTER.  Returns accumulator RTX.  */
 
static rtx
move_from_acc (rtx dest, rtx after)
{
  enum machine_mode mode = GET_MODE (dest);
 
  if (REG_P (dest) && REGNO (dest) < 2)
    return dest;
 
  if (mode == QImode)
    {
      EM (emit_insn_after (gen_movqi (dest, A), after));
      return A;
    }
  else
    {
      EM (emit_insn_after (gen_movhi (dest, AX), after));
      return AX;
    }
}
 
/* Copy accumulator (A or AX) to REGNO, placing any generated insns
   before BEFORE.  Returns reg RTX.  */
 
static rtx
move_acc_to_reg (rtx acc, int regno, rtx before)
{
  enum machine_mode mode = GET_MODE (acc);
  rtx reg;
 
  reg = gen_rtx_REG (mode, regno);
 
  if (mode == QImode)
    {
      EM (emit_insn_before (gen_movqi (reg, A), before));
      return reg;
    }
  else
    {
      EM (emit_insn_before (gen_movhi (reg, AX), before));
      return reg;
    }
}
 
/* Copy SRC to X, placing any generated insns before BEFORE.
   Returns X RTX.  */
 
static rtx
move_to_x (int opno, rtx before)
{
  rtx src = OP(opno);
  enum machine_mode mode = GET_MODE (src);
  rtx reg;
 
  if (mode == VOIDmode)
    mode = recog_data.operand_mode[opno];
  reg = (mode == QImode) ? X : AX;
 
  if (mode == QImode || ! is_virtual_register (OP (opno)))
    {
      OP(opno) = move_to_acc (opno, before);
      OP(opno) = move_acc_to_reg (OP(opno), X_REG, before);
      return reg;
    }
 
  if (mode == QImode)
    EM (emit_insn_before (gen_movqi (reg, src), before));
  else
    EM (emit_insn_before (gen_movhi (reg, src), before));
 
  return reg;
}
 
/* Copy OP(opno) to H or HL, placing any generated insns before BEFORE.
   Returns H/HL RTX.  */
 
static rtx
move_to_hl (int opno, rtx before)
{
  rtx src = OP (opno);
  enum machine_mode mode = GET_MODE (src);
  rtx reg;
 
  if (mode == VOIDmode)
    mode = recog_data.operand_mode[opno];
  reg = (mode == QImode) ? L : HL;
 
  if (mode == QImode || ! is_virtual_register (OP (opno)))
    {
      OP (opno) = move_to_acc (opno, before);
      OP (opno) = move_acc_to_reg (OP (opno), L_REG, before);
      return reg;
    }
 
  if (mode == QImode)
    EM (emit_insn_before (gen_movqi (reg, src), before));
  else
    EM (emit_insn_before (gen_movhi (reg, src), before));
 
  return reg;
}
 
/* Copy OP(opno) to E or DE, placing any generated insns before BEFORE.
   Returns E/DE RTX.  */
 
static rtx
move_to_de (int opno, rtx before)
{
  rtx src = OP (opno);
  enum machine_mode mode = GET_MODE (src);
  rtx reg;
 
  if (mode == VOIDmode)
    mode = recog_data.operand_mode[opno];
 
  reg = (mode == QImode) ? E : DE;
 
  if (mode == QImode || ! is_virtual_register (OP (opno)))
    {
      OP (opno) = move_to_acc (opno, before);
      OP (opno) = move_acc_to_reg (OP (opno), E_REG, before);
    }
  else
    {
      rtx move = mode == QImode ? gen_movqi (reg, src) : gen_movhi (reg, src);
 
      EM (emit_insn_before (move, before));
    }
 
  return reg;
}
 
/* Devirtualize an insn of the form (SET (op) (unop (op))).  */
static void
rl78_alloc_physical_registers_op1 (rtx insn)
{
  /* op[0] = func op[1] */
 
  /* We first try using A as the destination, then copying it
     back.  */
  if (rtx_equal_p (OP(0), OP(1)))
    {
      OP(0) =
      OP(1) = transcode_memory_rtx (OP(1), DE, insn);
    }
  else
    {
      OP(0) = transcode_memory_rtx (OP(0), BC, insn);
      OP(1) = transcode_memory_rtx (OP(1), HL, insn);
    }
 
  MAYBE_OK (insn);
 
  OP(0) = move_from_acc (OP(0), insn);
 
  MAYBE_OK (insn);
 
  /* Try copying the src to acc first, then.  This is for, for
     example, ZERO_EXTEND or NOT.  */
  OP(1) = move_to_acc (1, insn);
 
  MAYBE_OK (insn);
 
  FAILED;
}
 
/* Devirtualize an insn of the form (SET (op) (unop (op) (op))).  */
static void
rl78_alloc_physical_registers_op2 (rtx insn)
{
  /* op[0] = op[1] func op[2] */
  rtx prev = prev_nonnote_nondebug_insn (insn);
  rtx first;
  bool hl_used;
 
  if (rtx_equal_p (OP(0), OP(1)))
    {
      OP(0) =
      OP(1) = transcode_memory_rtx (OP(1), DE, insn);
      prev = next_nonnote_nondebug_insn (prev);
      OP(2) = transcode_memory_rtx (OP(2), HL, insn);
      prev = prev_nonnote_nondebug_insn (prev);
    }
  else if (rtx_equal_p (OP(0), OP(2)))
    {
      OP(1) = transcode_memory_rtx (OP(1), DE, insn);
      prev = next_nonnote_nondebug_insn (prev);
      OP(0) =
      OP(2) = transcode_memory_rtx (OP(2), HL, insn);
      prev = prev_nonnote_nondebug_insn (prev);
    }
  else
    {
      OP(0) = transcode_memory_rtx (OP(0), BC, insn);
      OP(1) = transcode_memory_rtx (OP(1), DE, insn);
      prev = next_nonnote_nondebug_insn (prev);
      OP(2) = transcode_memory_rtx (OP(2), HL, insn);
    }
 
  MAYBE_OK (insn);
 
  prev = prev_nonnote_nondebug_insn (insn);
  if (recog_data.constraints[1][0] == '%'
      && is_virtual_register (OP (1))
      && ! is_virtual_register (OP (2))
      && ! CONSTANT_P (OP (2)))
    {
      rtx tmp = OP (1);
      OP (1) = OP (2);
      OP (2) = tmp;
    }
 
  /* Make a note of wether (H)L is being used.  It matters
     because if OP(2) alsoneeds reloading, then we must take
     care not to corrupt HL.  */
  hl_used = reg_mentioned_p (L, OP (0)) || reg_mentioned_p (L, OP (1));
 
  OP(0) = move_from_acc (OP (0), insn);
  OP(1) = move_to_acc (1, insn);
 
  MAYBE_OK (insn);
 
  /* We have to copy op2 to HL, but that involves AX, which
     already has a live value.  Emit it before those insns.  */
 
  if (prev)
    first = next_nonnote_nondebug_insn (prev);
  else
    for (first = insn; prev_nonnote_nondebug_insn (first); first = prev_nonnote_nondebug_insn (first))
      ;
 
  OP (2) = hl_used ? move_to_de (2, first) : move_to_hl (2, first);
 
  MAYBE_OK (insn);
 
  FAILED;
}
 
/* Devirtualize an insn of the form (SET () (unop (op))).  */
 
static void
rl78_alloc_physical_registers_ro1 (rtx insn)
{
  /* (void) op[0] */
  OP(0) = transcode_memory_rtx (OP(0), BC, insn);
 
  MAYBE_OK (insn);
 
  OP(0) = move_to_acc (0, insn);
 
  MAYBE_OK (insn);
 
  FAILED;
}
 
/* Devirtualize a compare insn.  */
static void
rl78_alloc_physical_registers_cmp (rtx insn)
{
  /* op[1] cmp_op[0] op[2] */
  rtx prev = prev_nonnote_nondebug_insn (insn);
  rtx first;
 
  OP(1) = transcode_memory_rtx (OP(1), DE, insn);
  OP(2) = transcode_memory_rtx (OP(2), HL, insn);
 
  MAYBE_OK (insn);
 
  OP(1) = move_to_acc (1, insn);
 
  MAYBE_OK (insn);
 
  /* We have to copy op2 to HL, but that involves the acc, which
     already has a live value.  Emit it before those insns.  */
 
  if (prev)
    first = next_nonnote_nondebug_insn (prev);
  else
    for (first = insn; prev_nonnote_nondebug_insn (first); first = prev_nonnote_nondebug_insn (first))
      ;
  OP(2) = move_to_hl (2, first);
 
  MAYBE_OK (insn);
 
  FAILED;
}
 
/* Like op2, but AX = A op X.  */
static void
rl78_alloc_physical_registers_umul (rtx insn)
{
  /* op[0] = op[1] func op[2] */
  rtx prev = prev_nonnote_nondebug_insn (insn);
  rtx first;
 
  OP(0) = transcode_memory_rtx (OP(0), BC, insn);
  OP(1) = transcode_memory_rtx (OP(1), DE, insn);
  OP(2) = transcode_memory_rtx (OP(2), HL, insn);
 
  MAYBE_OK (insn);
 
  if (recog_data.constraints[1][0] == '%'
      && is_virtual_register (OP(1))
      && !is_virtual_register (OP(2))
      && !CONSTANT_P (OP(2)))
    {
      rtx tmp = OP(1);
      OP(1) = OP(2);
      OP(2) = tmp;
    }
 
  OP(0) = move_from_acc (OP(0), insn);
  OP(1) = move_to_acc (1, insn);
 
  MAYBE_OK (insn);
 
  /* We have to copy op2 to X, but that involves the acc, which
     already has a live value.  Emit it before those insns.  */
 
  if (prev)
    first = next_nonnote_nondebug_insn (prev);
  else
    for (first = insn; prev_nonnote_nondebug_insn (first); first = prev_nonnote_nondebug_insn (first))
      ;
  OP(2) = move_to_x (2, first);
 
  MAYBE_OK (insn);
 
  FAILED;
}
 
/* Scan all insns and devirtualize them.  */
static void
rl78_alloc_physical_registers (void)
{
  /* During most of the compile, gcc is dealing with virtual
     registers.  At this point, we need to assign physical registers
     to the vitual ones, and copy in/out as needed.  */
 
  rtx insn, curr;
  enum attr_valloc valloc_method;
 
  for (insn = get_insns (); insn; insn = curr)
    {
      int i;
 
      curr = next_nonnote_nondebug_insn (insn);
 
      if (INSN_P (insn)
	  && (GET_CODE (PATTERN (insn)) == SET
	      || GET_CODE (PATTERN (insn)) == CALL)
	  && INSN_CODE (insn) == -1)
	{
	  if (GET_CODE (SET_SRC (PATTERN (insn))) == ASM_OPERANDS)
	    continue;
	  i = recog (PATTERN (insn), insn, 0);
	  if (i == -1)
	    {
	      debug_rtx (insn);
	      gcc_unreachable ();
	    }
	  INSN_CODE (insn) = i;
	}
    }
 
  cfun->machine->virt_insns_ok = 0;
  cfun->machine->real_insns_ok = 1;
 
  for (insn = get_insns (); insn; insn = curr)
    {
      curr = insn ? next_nonnote_nondebug_insn (insn) : NULL;
 
      if (!INSN_P (insn))
	continue;
      if (GET_CODE (PATTERN (insn)) != SET
	  && GET_CODE (PATTERN (insn)) != CALL)
	  continue;
 
      if (GET_CODE (SET_SRC (PATTERN (insn))) == ASM_OPERANDS)
	continue;
 
      valloc_method = get_attr_valloc (insn);
 
      PATTERN (insn)= copy_rtx_if_shared (PATTERN (insn));
 
      if (insn_ok_now (insn))
	continue;
 
      INSN_CODE (insn) = -1;
 
      if (RTX_FRAME_RELATED_P (insn))
	virt_insn_was_frame = 1;
      else
	virt_insn_was_frame = 0;
 
      switch (valloc_method)
	{
	case VALLOC_OP1:
	  rl78_alloc_physical_registers_op1 (insn);
	  break;
	case VALLOC_OP2:
	  rl78_alloc_physical_registers_op2 (insn);
	  break;
	case VALLOC_RO1:
	  rl78_alloc_physical_registers_ro1 (insn);
	  break;
	case VALLOC_CMP:
	  rl78_alloc_physical_registers_cmp (insn);
	  break;
	case VALLOC_UMUL:
	  rl78_alloc_physical_registers_umul (insn);
	  break;
	case VALLOC_MACAX:
	  /* Macro that clobbers AX */
	  break;
	}
    }
#if DEBUG_ALLOC
  fprintf (stderr, "\033[0m");
#endif
}
 
/* Add REG_DEAD notes using DEAD[reg] for rtx S which is part of INSN.
   This function scans for uses of registers; the last use (i.e. first
   encounter when scanning backwards) triggers a REG_DEAD note if the
   reg was previously in DEAD[].  */
static void
rl78_note_reg_uses (char *dead, rtx s, rtx insn)
{
  const char *fmt;
  int i, r;
  enum rtx_code code;
 
  if (!s)
    return;
 
  code = GET_CODE (s);
 
  switch (code)
    {
      /* Compare registers by number.  */
    case REG:
      r = REGNO (s);
      if (dump_file)
	{
	  fprintf (dump_file, "note use reg %d size %d on insn %d\n",
		   r, GET_MODE_SIZE (GET_MODE (s)), INSN_UID (insn));
	  print_rtl_single (dump_file, s);
	}
      if (dead [r])
	add_reg_note (insn, REG_DEAD, gen_rtx_REG (GET_MODE (s), r));
      for (i = 0; i < GET_MODE_SIZE (GET_MODE (s)); i ++)
	dead [r + i] = 0;
      return;
 
      /* These codes have no constituent expressions
	 and are unique.  */
    case SCRATCH:
    case CC0:
    case PC:
      return;
 
    case CONST_INT:
    case CONST_VECTOR:
    case CONST_DOUBLE:
    case CONST_FIXED:
      /* These are kept unique for a given value.  */
      return;
 
    default:
      break;
    }
 
  fmt = GET_RTX_FORMAT (code);
 
  for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
    {
      if (fmt[i] == 'E')
	{
	  int j;
	  for (j = XVECLEN (s, i) - 1; j >= 0; j--)
	    rl78_note_reg_uses (dead, XVECEXP (s, i, j), insn);
	}
      else if (fmt[i] == 'e')
	rl78_note_reg_uses (dead, XEXP (s, i), insn);
    }
}
 
/* Like the previous function, but scan for SETs instead.  */
static void
rl78_note_reg_set (char *dead, rtx d, rtx insn)
{
  int r, i;
 
  if (GET_CODE (d) != REG)
    return;
 
  r = REGNO (d);
  if (dead [r])
    add_reg_note (insn, REG_UNUSED, gen_rtx_REG (GET_MODE (d), r));
  if (dump_file)
    fprintf (dump_file, "note set reg %d size %d\n", r, GET_MODE_SIZE (GET_MODE (d)));
  for (i = 0; i < GET_MODE_SIZE (GET_MODE (d)); i ++)
    dead [r + i] = 1;
}
 
/* This is a rather crude register death pass.  Death status is reset
   at every jump or call insn.  */
static void
rl78_calculate_death_notes (void)
{
  char dead[FIRST_PSEUDO_REGISTER];
  rtx insn, p, s, d;
  int i;
 
  memset (dead, 0, sizeof (dead));
 
  for (insn = get_last_insn ();
       insn;
       insn = prev_nonnote_nondebug_insn (insn))
    {
      if (dump_file)
	{
	  fprintf (dump_file, "\n--------------------------------------------------");
	  fprintf (dump_file, "\nDead:");
	  for (i = 0; i < FIRST_PSEUDO_REGISTER; i ++)
	    if (dead[i])
	      fprintf(dump_file, " %s", reg_names[i]);
	  fprintf (dump_file, "\n");
	  print_rtl_single (dump_file, insn);
	}
 
      switch (GET_CODE (insn))
	{
	case INSN:
	  p = PATTERN (insn);
	  switch (GET_CODE (p))
	    {
	    case SET:
	      s = SET_SRC (p);
	      d = SET_DEST (p);
	      rl78_note_reg_set (dead, d, insn);
	      rl78_note_reg_uses (dead, s, insn);
	      break;
 
	    case USE:
	      rl78_note_reg_uses (dead, p, insn);
	      break;
 
	    default:
	      break;
	    }
	  break;
 
	case JUMP_INSN:
	  if (INSN_CODE (insn) == CODE_FOR_rl78_return)
	    {
	      memset (dead, 1, sizeof (dead));
	      /* We expect a USE just prior to this, which will mark
		 the actual return registers.  The USE will have a
		 death note, but we aren't going to be modifying it
		 after this pass.  */
	      break;
	    }
	case CALL_INSN:
	  memset (dead, 0, sizeof (dead));
	  break;
 
	default:
	  break;
	}
      if (dump_file)
	print_rtl_single (dump_file, insn);
    }
}
 
/* Helper function to reset the origins in RP and the age in AGE for
   all registers.  */
static void
reset_origins (int *rp, int *age)
{
  int i;
  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
    {
      rp[i] = i;
      age[i] = 0;
    }
}
 
/* The idea behind this optimization is to look for cases where we
   move data from A to B to C, and instead move from A to B, and A to
   C.  If B is a virtual register or memory, this is a big win on its
   own.  If B turns out to be unneeded after this, it's a bigger win.
   For each register, we try to determine where it's value originally
   came from, if it's propogated purely through moves (and not
   computes).  The ORIGINS[] array has the regno for the "origin" of
   the value in the [regno] it's indexed by.  */
static void
rl78_propogate_register_origins (void)
{
  int origins[FIRST_PSEUDO_REGISTER];
  int age[FIRST_PSEUDO_REGISTER];
  int i;
  rtx insn, ninsn = NULL_RTX;
  rtx pat;
 
  reset_origins (origins, age);
 
  for (insn = get_insns (); insn; insn = ninsn)
    {
      ninsn = next_nonnote_nondebug_insn (insn);
 
      if (dump_file)
	{
	  fprintf (dump_file, "\n");
	  fprintf (dump_file, "Origins:");
	  for (i = 0; i < FIRST_PSEUDO_REGISTER; i ++)
	    if (origins[i] != i)
	      fprintf (dump_file, " r%d=r%d", i, origins[i]);
	  fprintf (dump_file, "\n");
	  print_rtl_single (dump_file, insn);
	}
 
      switch (GET_CODE (insn))
	{
	case CODE_LABEL:
	case BARRIER:
	case CALL_INSN:
	case JUMP_INSN:
	  reset_origins (origins, age);
	  break;
 
	default:
	  break;
 
	case INSN:
	  pat = PATTERN (insn);
 
	  if (GET_CODE (pat) == PARALLEL)
	    {
	      rtx clobber = XVECEXP (pat, 0, 1);
	      pat = XVECEXP (pat, 0, 0);
	      if (GET_CODE (clobber) == CLOBBER)
		{
		  int cr = REGNO (XEXP (clobber, 0));
		  int mb = GET_MODE_SIZE (GET_MODE (XEXP (clobber, 0)));
		  if (dump_file)
		    fprintf (dump_file, "reset origins of %d regs at %d\n", mb, cr);
		  for (i = 0; i < mb; i++)
		    {
		      origins[cr + i] = cr + i;
		      age[cr + i] = 0;
		    }
		}
	      else
		break;
	    }
 
	  if (GET_CODE (pat) == SET)
	    {
	      rtx src = SET_SRC (pat);
	      rtx dest = SET_DEST (pat);
	      int mb = GET_MODE_SIZE (GET_MODE (dest));
 
	      if (GET_CODE (dest) == REG)
		{
		  int dr = REGNO (dest);
 
		  if (GET_CODE (src) == REG)
		    {
		      int sr = REGNO (src);
		      int same = 1;
		      int best_age, best_reg;
 
		      /* See if the copy is not needed.  */
		      for (i = 0; i < mb; i ++)
			if (origins[dr + i] != origins[sr + i])
			  same = 0;
		      if (same)
			{
			  if (dump_file)
			    fprintf (dump_file, "deleting because dest already has correct value\n");
			  delete_insn (insn);
			  break;
			}
 
		      if (dr < 8 || sr >= 8)
			{
			  int ar;
 
			  best_age = -1;
			  best_reg = -1;
			  /* See if the copy can be made from another
			     bank 0 register instead, instead of the
			     virtual src register.  */
			  for (ar = 0; ar < 8; ar += mb)
			    {
			      same = 1;
			      for (i = 0; i < mb; i ++)
				if (origins[ar + i] != origins[sr + i])
				  same = 0;
 
			      /* The chip has some reg-reg move limitations.  */
			      if (mb == 1 && dr > 3)
				same = 0;
 
			      if (same)
				{
				  if (best_age == -1 || best_age > age[sr + i])
				    {
				      best_age = age[sr + i];
				      best_reg = sr;
				    }
				}
			    }
 
			  if (best_reg != -1)
			    {
			      /* FIXME: copy debug info too.  */
			      SET_SRC (pat) = gen_rtx_REG (GET_MODE (src), best_reg);
			      sr = best_reg;
			    }
			}
 
		      for (i = 0; i < mb; i++)
			{
			  origins[dr + i] = origins[sr + i];
			  age[dr + i] = age[sr + i] + 1;
			}
		    }
		  else
		    {
		      /* The destination is computed, its origin is itself.  */
		      if (dump_file)
			fprintf (dump_file, "resetting origin of r%d for %d byte%s\n",
				 dr, mb, mb == 1 ? "" : "s");
		      for (i = 0; i < mb; i ++)
			{
			  origins[dr + i] = dr + i;
			  age[dr + i] = 0;
			}
		    }
 
		  /* Any registers marked with that reg as an origin are reset.  */
		  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
		    if (origins[i] >= dr && origins[i] < dr + mb)
		      {
			origins[i] = i;
			age[i] = 0;
		      }
		}
 
	      /* Special case - our ADDSI3 macro uses AX */
	      if (get_attr_valloc (insn) == VALLOC_MACAX)
		{
		  if (dump_file)
		    fprintf (dump_file, "Resetting origin of AX for macro.\n");
		  for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
		    if (i <= 1 || origins[i] <= 1)
		      {
			origins[i] = i;
			age[i] = 0;
		      }
		}
 
	      if (GET_CODE (src) == ASHIFT
		  || GET_CODE (src) == ASHIFTRT
		  || GET_CODE (src) == LSHIFTRT)
		{
		  rtx count = XEXP (src, 1);
		  if (GET_CODE (count) == REG)
		    {
		      /* Special case - our pattern clobbers the count register.  */
		      int r = REGNO (count);
		      if (dump_file)
			fprintf (dump_file, "Resetting origin of r%d for shift.\n", r);
		      for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
			if (i == r || origins[i] == r)
			  {
			    origins[i] = i;
			    age[i] = 0;
			  }
		    }
		}
	    }
	}
    }
}
 
/* Remove any SETs where the destination is unneeded.  */
static void
rl78_remove_unused_sets (void)
{
  rtx insn, ninsn = NULL_RTX;
  rtx dest;
 
  for (insn = get_insns (); insn; insn = ninsn)
    {
      ninsn = next_nonnote_nondebug_insn (insn);
 
      if ((insn = single_set (insn)) == NULL_RTX)
	continue;
 
      dest = SET_DEST (insn);
 
      if (REGNO (dest) > 23)
	continue;
 
      if (find_regno_note (insn, REG_UNUSED, REGNO (dest)))
	delete_insn (insn);
    }
}
 
#undef  xTARGET_MACHINE_DEPENDENT_REORG
#define xTARGET_MACHINE_DEPENDENT_REORG  rl78_reorg
 
/* This is the top of the devritualization pass.  */
static void
rl78_reorg (void)
{
  rl78_alloc_physical_registers ();
 
  if (dump_file)
    {
      fprintf (dump_file, "\n================DEVIRT:=AFTER=ALLOC=PHYSICAL=REGISTERS================\n");
      print_rtl_with_bb (dump_file, get_insns ());
    }
 
  rl78_propogate_register_origins ();
  rl78_calculate_death_notes ();
 
  if (dump_file)
    {
      fprintf (dump_file, "\n================DEVIRT:=AFTER=PROPOGATION=============================\n");
      print_rtl_with_bb (dump_file, get_insns ());
      fprintf (dump_file, "\n======================================================================\n");
    }
 
  rl78_remove_unused_sets ();
 
  /* The code after devirtualizing has changed so much that at this point
     we might as well just rescan everything.  Note that
     df_rescan_all_insns is not going to help here because it does not
     touch the artificial uses and defs.  */
  df_finish_pass (true);
  if (optimize > 1)
    df_live_add_problem ();
  df_scan_alloc (NULL);
  df_scan_blocks ();
 
  if (optimize)
    df_analyze ();
}
 
#undef TARGET_RETURN_IN_MEMORY
#define TARGET_RETURN_IN_MEMORY rl78_return_in_memory
 
static bool
rl78_return_in_memory (const_tree type, const_tree fntype ATTRIBUTE_UNUSED)
{
  const HOST_WIDE_INT size = int_size_in_bytes (type);
  return (size == -1 || size > 8);
}
 

struct gcc_target targetm = TARGET_INITIALIZER;
 
#include "gt-rl78.h"
 

Go to most recent revision | Compare with Previous | Blame | View Log

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.