1 |
709 |
jeremybenn |
/* Subroutines used for code generation on picoChip processors.
|
2 |
|
|
Copyright (C) 2001, 2008, 2009, 2010, 2011 Free Software Foundation, Inc.
|
3 |
|
|
Contributed by Picochip Ltd. (http://www.picochip.com)
|
4 |
|
|
Maintained by Daniel Towner (daniel.towner@picochip.com) and
|
5 |
|
|
Hariharan Sandanagobalane (hariharan@picochip.com)
|
6 |
|
|
|
7 |
|
|
This file is part of GCC.
|
8 |
|
|
|
9 |
|
|
GCC is free software; you can redistribute it and/or modify
|
10 |
|
|
it under the terms of the GNU General Public License as published by
|
11 |
|
|
the Free Software Foundation; either version 3, or (at your option)
|
12 |
|
|
any later version.
|
13 |
|
|
|
14 |
|
|
GCC is distributed in the hope that it will be useful,
|
15 |
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
16 |
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
17 |
|
|
GNU General Public License for more details.
|
18 |
|
|
|
19 |
|
|
You should have received a copy of the GNU General Public License
|
20 |
|
|
along with GCC; see the file COPYING3. If not, see
|
21 |
|
|
<http://www.gnu.org/licenses/>. */
|
22 |
|
|
|
23 |
|
|
#include "config.h"
|
24 |
|
|
#include "system.h"
|
25 |
|
|
#include "coretypes.h"
|
26 |
|
|
#include "tm.h"
|
27 |
|
|
#include "rtl.h"
|
28 |
|
|
#include "regs.h"
|
29 |
|
|
#include "hard-reg-set.h"
|
30 |
|
|
#include "insn-config.h"
|
31 |
|
|
#include "conditions.h"
|
32 |
|
|
#include "insn-attr.h"
|
33 |
|
|
#include "flags.h"
|
34 |
|
|
#include "recog.h"
|
35 |
|
|
#include "obstack.h"
|
36 |
|
|
#include "tree.h"
|
37 |
|
|
#include "expr.h"
|
38 |
|
|
#include "optabs.h"
|
39 |
|
|
#include "except.h"
|
40 |
|
|
#include "function.h"
|
41 |
|
|
#include "output.h"
|
42 |
|
|
#include "basic-block.h"
|
43 |
|
|
#include "integrate.h"
|
44 |
|
|
#include "diagnostic-core.h"
|
45 |
|
|
#include "ggc.h"
|
46 |
|
|
#include "hashtab.h"
|
47 |
|
|
#include "tm_p.h"
|
48 |
|
|
#include "target.h"
|
49 |
|
|
#include "target-def.h"
|
50 |
|
|
#include "langhooks.h"
|
51 |
|
|
#include "reload.h"
|
52 |
|
|
#include "params.h"
|
53 |
|
|
|
54 |
|
|
#include "picochip-protos.h"
|
55 |
|
|
|
56 |
|
|
#include "insn-attr.h" /* For DFA state_t. */
|
57 |
|
|
#include "insn-config.h" /* Required by recog.h */
|
58 |
|
|
#include "insn-codes.h" /* For CODE_FOR_? */
|
59 |
|
|
#include "optabs.h" /* For GEN_FCN */
|
60 |
|
|
#include "basic-block.h" /* UPDATE_LIFE_GLOBAL* for picochip_reorg. */
|
61 |
|
|
#include "timevar.h" /* For TV_SCHED2, in picochip_reorg. */
|
62 |
|
|
#include "libfuncs.h" /* For memcpy_libfuncs, etc. */
|
63 |
|
|
#include "df.h" /* For df_regs_ever_live_df_regs_ever_live_pp, etc. */
|
64 |
|
|
|
65 |
|
|
|
66 |
|
|
/* Target AE ISA information. */
|
67 |
|
|
enum picochip_dfa_type picochip_schedule_type;
|
68 |
|
|
|
69 |
|
|
bool picochip_has_mul_unit = false;
|
70 |
|
|
bool picochip_has_mac_unit = false;
|
71 |
|
|
|
72 |
|
|
/* targetm hook function prototypes. */
|
73 |
|
|
|
74 |
|
|
void picochip_asm_file_start (void);
|
75 |
|
|
void picochip_asm_file_end (void);
|
76 |
|
|
|
77 |
|
|
void picochip_init_libfuncs (void);
|
78 |
|
|
void picochip_reorg (void);
|
79 |
|
|
|
80 |
|
|
int picochip_arg_partial_bytes (cumulative_args_t p_cum,
|
81 |
|
|
enum machine_mode mode,
|
82 |
|
|
tree type, bool named);
|
83 |
|
|
rtx picochip_function_arg (cumulative_args_t p_cum,
|
84 |
|
|
enum machine_mode mode,
|
85 |
|
|
const_tree type, bool named);
|
86 |
|
|
rtx picochip_incoming_function_arg (cumulative_args_t p_cum,
|
87 |
|
|
enum machine_mode mode,
|
88 |
|
|
const_tree type, bool named);
|
89 |
|
|
void picochip_arg_advance (cumulative_args_t p_cum, enum machine_mode mode,
|
90 |
|
|
const_tree type, bool named);
|
91 |
|
|
unsigned int picochip_function_arg_boundary (enum machine_mode mode,
|
92 |
|
|
const_tree type);
|
93 |
|
|
|
94 |
|
|
int picochip_sched_lookahead (void);
|
95 |
|
|
int picochip_sched_issue_rate (void);
|
96 |
|
|
int picochip_sched_adjust_cost (rtx insn, rtx link,
|
97 |
|
|
rtx dep_insn, int cost);
|
98 |
|
|
int picochip_sched_reorder (FILE * file, int verbose, rtx * ready,
|
99 |
|
|
int *n_readyp, int clock);
|
100 |
|
|
|
101 |
|
|
void picochip_init_builtins (void);
|
102 |
|
|
rtx picochip_expand_builtin (tree, rtx, rtx, enum machine_mode, int);
|
103 |
|
|
|
104 |
|
|
bool picochip_rtx_costs (rtx x, int code, int outer_code, int opno,
|
105 |
|
|
int* total, bool speed);
|
106 |
|
|
bool picochip_return_in_memory(const_tree type,
|
107 |
|
|
const_tree fntype ATTRIBUTE_UNUSED);
|
108 |
|
|
bool picochip_legitimate_address_p (enum machine_mode, rtx, bool);
|
109 |
|
|
rtx picochip_legitimize_address (rtx x, rtx oldx ATTRIBUTE_UNUSED,
|
110 |
|
|
enum machine_mode mode);
|
111 |
|
|
int picochip_legitimize_reload_address (rtx *x, enum machine_mode mode,
|
112 |
|
|
int opnum, int type, int ind_levels);
|
113 |
|
|
|
114 |
|
|
rtx picochip_struct_value_rtx(tree fntype ATTRIBUTE_UNUSED, int incoming ATTRIBUTE_UNUSED);
|
115 |
|
|
rtx picochip_function_value (const_tree valtype, const_tree func ATTRIBUTE_UNUSED,
|
116 |
|
|
bool outgoing ATTRIBUTE_UNUSED);
|
117 |
|
|
static reg_class_t
|
118 |
|
|
picochip_secondary_reload (bool in_p,
|
119 |
|
|
rtx x ATTRIBUTE_UNUSED,
|
120 |
|
|
reg_class_t cla ATTRIBUTE_UNUSED,
|
121 |
|
|
enum machine_mode mode,
|
122 |
|
|
secondary_reload_info *sri);
|
123 |
|
|
void
|
124 |
|
|
picochip_asm_named_section (const char *name,
|
125 |
|
|
unsigned int flags ATTRIBUTE_UNUSED,
|
126 |
|
|
tree decl ATTRIBUTE_UNUSED);
|
127 |
|
|
|
128 |
|
|
static rtx picochip_static_chain (const_tree, bool);
|
129 |
|
|
|
130 |
|
|
static void picochip_option_override (void);
|
131 |
|
|
|
132 |
|
|
/* Lookup table mapping a register number to the earliest containing
|
133 |
|
|
class. Used by REGNO_REG_CLASS. */
|
134 |
|
|
const enum reg_class picochip_regno_reg_class[FIRST_PSEUDO_REGISTER] =
|
135 |
|
|
{
|
136 |
|
|
TWIN_REGS, TWIN_REGS, TWIN_REGS, TWIN_REGS,
|
137 |
|
|
TWIN_REGS, TWIN_REGS, TWIN_REGS, TWIN_REGS,
|
138 |
|
|
TWIN_REGS, TWIN_REGS, TWIN_REGS, TWIN_REGS,
|
139 |
|
|
GR_REGS, FRAME_REGS, PTR_REGS, CONST_REGS,
|
140 |
|
|
ACC_REGS, CC_REGS, GR_REGS, GR_REGS
|
141 |
|
|
};
|
142 |
|
|
|
143 |
|
|
/* picoChip register names. */
|
144 |
|
|
const char *picochip_regnames[] = REGISTER_NAMES;
|
145 |
|
|
|
146 |
|
|
/* Define the maximum number of registers which may be used to pass
|
147 |
|
|
* parameters to functions. */
|
148 |
|
|
#define MAX_CALL_PARAMETER_REGS 6
|
149 |
|
|
|
150 |
|
|
|
151 |
|
|
/* Target scheduling information. */
|
152 |
|
|
|
153 |
|
|
/* This flag indicates whether the next instruction to be output is a
|
154 |
|
|
VLIW continuation instruction. It is used to communicate between
|
155 |
|
|
final_prescan_insn and asm_output_opcode. */
|
156 |
|
|
static int picochip_vliw_continuation = 0;
|
157 |
|
|
|
158 |
|
|
/* This variable is used to communicate the current instruction
|
159 |
|
|
between final_prescan_insn and functions such as asm_output_opcode,
|
160 |
|
|
and picochip_get_vliw_alu_id (which are otherwise unable to determine the
|
161 |
|
|
current instruction. */
|
162 |
|
|
static rtx picochip_current_prescan_insn;
|
163 |
|
|
|
164 |
|
|
static bool picochip_is_delay_slot_pending = 0;
|
165 |
|
|
|
166 |
|
|
/* When final_prescan_insn is called, it computes information about
|
167 |
|
|
the current VLIW packet, and stores it in this structure. When
|
168 |
|
|
instructions are output, this state is used to make sure that the
|
169 |
|
|
instructions are output in the correct way (e.g., which ALU to use,
|
170 |
|
|
whether a macro branch was ever previously a real branch, etc.). */
|
171 |
|
|
struct vliw_state
|
172 |
|
|
{
|
173 |
|
|
int contains_pico_alu_insn;
|
174 |
|
|
int contains_non_cc_alu_insn;
|
175 |
|
|
int num_alu_insns_so_far;
|
176 |
|
|
|
177 |
|
|
/* Record how many instructions are contained in the packet. */
|
178 |
|
|
int num_insns_in_packet;
|
179 |
|
|
|
180 |
|
|
/* There was a case for this to be more than 1 */
|
181 |
|
|
int num_cfi_labels_deferred;
|
182 |
|
|
char cfi_label_name[2][256]; /* Used to record the name of a CFI label
|
183 |
|
|
emitted inside a VLIW packet. */
|
184 |
|
|
char lm_label_name[256]; /* Used to record the name of an LM label. */
|
185 |
|
|
};
|
186 |
|
|
|
187 |
|
|
struct vliw_state picochip_current_vliw_state;
|
188 |
|
|
|
189 |
|
|
/* Save/restore recog_data. */
|
190 |
|
|
static int picochip_saved_which_alternative;
|
191 |
|
|
static struct recog_data picochip_saved_recog_data;
|
192 |
|
|
|
193 |
|
|
/* Determine which ALU to use for the instruction in
|
194 |
|
|
picochip_current_prescan_insn. */
|
195 |
|
|
static char picochip_get_vliw_alu_id (void);
|
196 |
|
|
|
197 |
|
|
/* Initialize the GCC target structure. */
|
198 |
|
|
|
199 |
|
|
#undef TARGET_ASM_FUNCTION_PROLOGUE
|
200 |
|
|
#define TARGET_ASM_FUNCTION_PROLOGUE picochip_function_prologue
|
201 |
|
|
|
202 |
|
|
#undef TARGET_ASM_FUNCTION_EPILOGUE
|
203 |
|
|
#define TARGET_ASM_FUNCTION_EPILOGUE picochip_function_epilogue
|
204 |
|
|
|
205 |
|
|
#undef TARGET_ASM_INTERNAL_LABEL
|
206 |
|
|
#define TARGET_ASM_INTERNAL_LABEL picochip_output_internal_label
|
207 |
|
|
|
208 |
|
|
#undef TARGET_ASM_GLOBALIZE_LABEL
|
209 |
|
|
#define TARGET_ASM_GLOBALIZE_LABEL picochip_output_global
|
210 |
|
|
|
211 |
|
|
#undef TARGET_ASM_BYTE_OP
|
212 |
|
|
#define TARGET_ASM_BYTE_OP ".initByte "
|
213 |
|
|
#undef TARGET_ASM_ALIGNED_HI_OP
|
214 |
|
|
#define TARGET_ASM_ALIGNED_HI_OP ".initWord "
|
215 |
|
|
#undef TARGET_ASM_UNALIGNED_HI_OP
|
216 |
|
|
#define TARGET_ASM_UNALIGNED_HI_OP ".unalignedInitWord "
|
217 |
|
|
#undef TARGET_ASM_ALIGNED_SI_OP
|
218 |
|
|
#define TARGET_ASM_ALIGNED_SI_OP ".initLong "
|
219 |
|
|
#undef TARGET_ASM_UNALIGNED_SI_OP
|
220 |
|
|
#define TARGET_ASM_UNALIGNED_SI_OP ".unalignedInitLong "
|
221 |
|
|
|
222 |
|
|
#undef TARGET_INIT_BUILTINS
|
223 |
|
|
#define TARGET_INIT_BUILTINS picochip_init_builtins
|
224 |
|
|
|
225 |
|
|
#undef TARGET_EXPAND_BUILTIN
|
226 |
|
|
#define TARGET_EXPAND_BUILTIN picochip_expand_builtin
|
227 |
|
|
|
228 |
|
|
#undef TARGET_RTX_COSTS
|
229 |
|
|
#define TARGET_RTX_COSTS picochip_rtx_costs
|
230 |
|
|
|
231 |
|
|
#undef TARGET_SCHED_ISSUE_RATE
|
232 |
|
|
#define TARGET_SCHED_ISSUE_RATE picochip_sched_issue_rate
|
233 |
|
|
|
234 |
|
|
#undef TARGET_SCHED_REORDER
|
235 |
|
|
#define TARGET_SCHED_REORDER picochip_sched_reorder
|
236 |
|
|
|
237 |
|
|
#undef TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD
|
238 |
|
|
#define TARGET_SCHED_FIRST_CYCLE_MULTIPASS_DFA_LOOKAHEAD \
|
239 |
|
|
picochip_sched_lookahead
|
240 |
|
|
|
241 |
|
|
#undef TARGET_SCHED_ADJUST_COST
|
242 |
|
|
#define TARGET_SCHED_ADJUST_COST picochip_sched_adjust_cost
|
243 |
|
|
|
244 |
|
|
#undef TARGET_ASM_NAMED_SECTION
|
245 |
|
|
#define TARGET_ASM_NAMED_SECTION picochip_asm_named_section
|
246 |
|
|
|
247 |
|
|
#undef TARGET_HAVE_SWITCHABLE_BSS_SECTIONS
|
248 |
|
|
#define TARGET_HAVE_SWITCHABLE_BSS_SECTIONS 1
|
249 |
|
|
|
250 |
|
|
#undef TARGET_INIT_LIBFUNCS
|
251 |
|
|
#define TARGET_INIT_LIBFUNCS picochip_init_libfuncs
|
252 |
|
|
|
253 |
|
|
#undef TARGET_ASM_FILE_START
|
254 |
|
|
#define TARGET_ASM_FILE_START picochip_asm_file_start
|
255 |
|
|
|
256 |
|
|
#undef TARGET_ASM_FILE_END
|
257 |
|
|
#define TARGET_ASM_FILE_END picochip_asm_file_end
|
258 |
|
|
|
259 |
|
|
#undef TARGET_MACHINE_DEPENDENT_REORG
|
260 |
|
|
#define TARGET_MACHINE_DEPENDENT_REORG picochip_reorg
|
261 |
|
|
|
262 |
|
|
#undef TARGET_ARG_PARTIAL_BYTES
|
263 |
|
|
#define TARGET_ARG_PARTIAL_BYTES picochip_arg_partial_bytes
|
264 |
|
|
|
265 |
|
|
#undef TARGET_FUNCTION_ARG
|
266 |
|
|
#define TARGET_FUNCTION_ARG picochip_function_arg
|
267 |
|
|
|
268 |
|
|
#undef TARGET_FUNCTION_INCOMING_ARG
|
269 |
|
|
#define TARGET_FUNCTION_INCOMING_ARG picochip_incoming_function_arg
|
270 |
|
|
|
271 |
|
|
#undef TARGET_FUNCTION_ARG_ADVANCE
|
272 |
|
|
#define TARGET_FUNCTION_ARG_ADVANCE picochip_arg_advance
|
273 |
|
|
|
274 |
|
|
#undef TARGET_FUNCTION_ARG_BOUNDARY
|
275 |
|
|
#define TARGET_FUNCTION_ARG_BOUNDARY picochip_function_arg_boundary
|
276 |
|
|
|
277 |
|
|
#undef TARGET_PROMOTE_FUNCTION_MODE
|
278 |
|
|
#define TARGET_PROMOTE_FUNCTION_MODE default_promote_function_mode_always_promote
|
279 |
|
|
#undef TARGET_PROMOTE_PROTOTYPES
|
280 |
|
|
#define TARGET_PROMOTE_PROTOTYPES hook_bool_const_tree_true
|
281 |
|
|
|
282 |
|
|
/* Target support for Anchored Addresses optimization */
|
283 |
|
|
#undef TARGET_MIN_ANCHOR_OFFSET
|
284 |
|
|
#define TARGET_MIN_ANCHOR_OFFSET 0
|
285 |
|
|
#undef TARGET_MAX_ANCHOR_OFFSET
|
286 |
|
|
#define TARGET_MAX_ANCHOR_OFFSET 7
|
287 |
|
|
#undef TARGET_ASM_OUTPUT_ANCHOR
|
288 |
|
|
#define TARGET_ASM_OUTPUT_ANCHOR picochip_asm_output_anchor
|
289 |
|
|
|
290 |
|
|
#undef TARGET_FUNCTION_VALUE
|
291 |
|
|
#define TARGET_FUNCTION_VALUE picochip_function_value
|
292 |
|
|
/*
|
293 |
|
|
#undef TARGET_LIBGCC_CMP_RETURN_MODE
|
294 |
|
|
#define TARGET_LIBGCC_CMP_RETURN_MODE picochip_libgcc_cmp_return_mode
|
295 |
|
|
*/
|
296 |
|
|
|
297 |
|
|
#undef TARGET_LEGITIMATE_ADDRESS_P
|
298 |
|
|
#define TARGET_LEGITIMATE_ADDRESS_P picochip_legitimate_address_p
|
299 |
|
|
|
300 |
|
|
#undef TARGET_LEGITIMIZE_ADDRESS
|
301 |
|
|
#define TARGET_LEGITIMIZE_ADDRESS picochip_legitimize_address
|
302 |
|
|
|
303 |
|
|
/* Loading and storing QImode values to and from memory
|
304 |
|
|
usually requires a scratch register. */
|
305 |
|
|
#undef TARGET_SECONDARY_RELOAD
|
306 |
|
|
#define TARGET_SECONDARY_RELOAD picochip_secondary_reload
|
307 |
|
|
#undef DONT_USE_BUILTIN_SETJMP
|
308 |
|
|
#define DONT_USE_BUILTIN_SETJMP 1
|
309 |
|
|
|
310 |
|
|
/* How Large Values are Returned */
|
311 |
|
|
|
312 |
|
|
#undef TARGET_RETURN_IN_MEMORY
|
313 |
|
|
#define TARGET_RETURN_IN_MEMORY picochip_return_in_memory
|
314 |
|
|
|
315 |
|
|
#undef TARGET_STATIC_CHAIN
|
316 |
|
|
#define TARGET_STATIC_CHAIN picochip_static_chain
|
317 |
|
|
|
318 |
|
|
#undef TARGET_OPTION_OVERRIDE
|
319 |
|
|
#define TARGET_OPTION_OVERRIDE picochip_option_override
|
320 |
|
|
|
321 |
|
|
#undef TARGET_OVERRIDE_OPTIONS_AFTER_CHANGE
|
322 |
|
|
#define TARGET_OVERRIDE_OPTIONS_AFTER_CHANGE picochip_option_override
|
323 |
|
|
|
324 |
|
|
/* The 2nd scheduling pass option is switched off, and a machine
|
325 |
|
|
dependent reorganisation ensures that it is run later on, after the
|
326 |
|
|
second jump optimisation. */
|
327 |
|
|
#undef TARGET_DELAY_SCHED2
|
328 |
|
|
#define TARGET_DELAY_SCHED2 true
|
329 |
|
|
|
330 |
|
|
/* Variable tracking should be run after all optimizations which
|
331 |
|
|
change order of insns. It also needs a valid CFG. */
|
332 |
|
|
#undef TARGET_DELAY_VARTRACK
|
333 |
|
|
#define TARGET_DELAY_VARTRACK true
|
334 |
|
|
|
335 |
|
|
struct gcc_target targetm = TARGET_INITIALIZER;
|
336 |
|
|
|
337 |
|
|
|
338 |
|
|
/* Only return a value in memory if it is greater than 4 bytes.
|
339 |
|
|
int_size_in_bytes returns -1 for variable size objects, which go in
|
340 |
|
|
memory always. The cast to unsigned makes -1 > 8. */
|
341 |
|
|
|
342 |
|
|
bool
|
343 |
|
|
picochip_return_in_memory(const_tree type, const_tree fntype ATTRIBUTE_UNUSED)
|
344 |
|
|
{
|
345 |
|
|
return ((unsigned HOST_WIDE_INT) int_size_in_bytes (type) > 4);
|
346 |
|
|
}
|
347 |
|
|
|
348 |
|
|
/* Allow some options to be overriden. */
|
349 |
|
|
|
350 |
|
|
static void
|
351 |
|
|
picochip_option_override (void)
|
352 |
|
|
{
|
353 |
|
|
/* If we are optimizing for stack, dont let inliner to inline functions
|
354 |
|
|
that could potentially increase stack size.*/
|
355 |
|
|
if (flag_conserve_stack)
|
356 |
|
|
{
|
357 |
|
|
maybe_set_param_value (PARAM_LARGE_STACK_FRAME, 0,
|
358 |
|
|
global_options.x_param_values,
|
359 |
|
|
global_options_set.x_param_values);
|
360 |
|
|
maybe_set_param_value (PARAM_STACK_FRAME_GROWTH, 0,
|
361 |
|
|
global_options.x_param_values,
|
362 |
|
|
global_options_set.x_param_values);
|
363 |
|
|
}
|
364 |
|
|
|
365 |
|
|
/* Turn off the elimination of unused types. The elaborator
|
366 |
|
|
generates various interesting types to represent constants,
|
367 |
|
|
generics, and so on, and it is useful to retain this information
|
368 |
|
|
in the debug output. The increased size of the debug information
|
369 |
|
|
is not really an issue for us. */
|
370 |
|
|
flag_eliminate_unused_debug_types = 0;
|
371 |
|
|
|
372 |
|
|
/* Even if the user specifies a -fno-omit-frame-pointer on the
|
373 |
|
|
command line, we still want to go ahead and omit frame pointer
|
374 |
|
|
usages, since we dont really have a frame pointer register.
|
375 |
|
|
So, all accesses to FP need to be converted to accesses off
|
376 |
|
|
stack pointer.*/
|
377 |
|
|
flag_omit_frame_pointer = 1;
|
378 |
|
|
|
379 |
|
|
/* Turning on anchored addresses by default. This is an optimization
|
380 |
|
|
that could decrease the code size by placing anchors in data and
|
381 |
|
|
accessing offsets from the anchor for file local data variables.*/
|
382 |
|
|
if (optimize >= 1)
|
383 |
|
|
flag_section_anchors = 1;
|
384 |
|
|
|
385 |
|
|
/* The second scheduling pass runs within picochip_reorg, to avoid
|
386 |
|
|
having the second jump optimisation trash the instruction modes
|
387 |
|
|
(e.g., instructions are changed to TImode to mark the beginning
|
388 |
|
|
of cycles). Two types of DFA scheduling are possible: space and
|
389 |
|
|
speed. In both cases, instructions are reordered to avoid stalls
|
390 |
|
|
(e.g., memory loads stall for one cycle). Speed scheduling will
|
391 |
|
|
also enable VLIW instruction packing. VLIW instructions use more
|
392 |
|
|
code space, so VLIW scheduling is disabled when scheduling for
|
393 |
|
|
size. */
|
394 |
|
|
if (flag_schedule_insns_after_reload)
|
395 |
|
|
{
|
396 |
|
|
if (optimize_size)
|
397 |
|
|
picochip_schedule_type = DFA_TYPE_SPACE;
|
398 |
|
|
else
|
399 |
|
|
{
|
400 |
|
|
picochip_schedule_type = DFA_TYPE_SPEED;
|
401 |
|
|
flag_delayed_branch = 0;
|
402 |
|
|
}
|
403 |
|
|
}
|
404 |
|
|
else
|
405 |
|
|
picochip_schedule_type = DFA_TYPE_NONE;
|
406 |
|
|
|
407 |
|
|
/* Ensure that the debug level is always at least -g2. The flow
|
408 |
|
|
analyser works at its best if it always has debug
|
409 |
|
|
information. DWARF is non-intrusive, so it makes no difference to
|
410 |
|
|
code quality if debug is always enabled. */
|
411 |
|
|
if (debug_info_level < DINFO_LEVEL_NORMAL)
|
412 |
|
|
{
|
413 |
|
|
debug_info_level = DINFO_LEVEL_NORMAL;
|
414 |
|
|
write_symbols = DWARF2_DEBUG;
|
415 |
|
|
}
|
416 |
|
|
|
417 |
|
|
/* Options of the form -mae=mac, and so on will be substituted by
|
418 |
|
|
the compiler driver for the appropriate byte access and multiply
|
419 |
|
|
unit ISA options. Any unrecognised AE types will end up being
|
420 |
|
|
passed to the compiler, which should reject them as invalid. */
|
421 |
|
|
if (picochip_ae_type_string != NULL)
|
422 |
|
|
error ("invalid AE type specified (%s)", picochip_ae_type_string);
|
423 |
|
|
|
424 |
|
|
/* Override any specific capabilities of the instruction set. These
|
425 |
|
|
take precedence over any capabilities inferred from the AE type,
|
426 |
|
|
regardless of where the options appear on the command line. */
|
427 |
|
|
if (picochip_mul_type_string == NULL)
|
428 |
|
|
{
|
429 |
|
|
/* Default to MEM-type multiply, for historical compatibility. */
|
430 |
|
|
picochip_has_mac_unit = false;
|
431 |
|
|
picochip_has_mul_unit = true;
|
432 |
|
|
}
|
433 |
|
|
else
|
434 |
|
|
{
|
435 |
|
|
picochip_has_mac_unit = false;
|
436 |
|
|
picochip_has_mul_unit = false;
|
437 |
|
|
|
438 |
|
|
if (strcmp (picochip_mul_type_string, "mul") == 0)
|
439 |
|
|
picochip_has_mul_unit = true;
|
440 |
|
|
else if (strcmp (picochip_mul_type_string, "mac") == 0)
|
441 |
|
|
picochip_has_mac_unit = true;
|
442 |
|
|
else if (strcmp (picochip_mul_type_string, "none") == 0)
|
443 |
|
|
{ /* Do nothing. Unit types already set to false. */ }
|
444 |
|
|
else
|
445 |
|
|
error ("invalid mul type specified (%s) - expected mac, mul or none",
|
446 |
|
|
picochip_mul_type_string);
|
447 |
|
|
}
|
448 |
|
|
}
|
449 |
|
|
|
450 |
|
|
|
451 |
|
|
/* Initialise the library functions to handle arithmetic on some of
|
452 |
|
|
the larger modes. */
|
453 |
|
|
void
|
454 |
|
|
picochip_init_libfuncs (void)
|
455 |
|
|
{
|
456 |
|
|
/* 64-bit shifts */
|
457 |
|
|
set_optab_libfunc (ashr_optab, DImode, "__ashrdi3");
|
458 |
|
|
set_optab_libfunc (ashl_optab, DImode, "__ashldi3");
|
459 |
|
|
set_optab_libfunc (lshr_optab, DImode, "__lshrdi3");
|
460 |
|
|
|
461 |
|
|
/* 64-bit signed multiplication. */
|
462 |
|
|
set_optab_libfunc (smul_optab, DImode, "__muldi3");
|
463 |
|
|
|
464 |
|
|
/* Signed division */
|
465 |
|
|
set_optab_libfunc (sdiv_optab, HImode, "__divhi3");
|
466 |
|
|
set_optab_libfunc (sdiv_optab, DImode, "__divdi3");
|
467 |
|
|
|
468 |
|
|
/* Signed modulus */
|
469 |
|
|
set_optab_libfunc (smod_optab, HImode, "__modhi3");
|
470 |
|
|
set_optab_libfunc (smod_optab, DImode, "__moddi3");
|
471 |
|
|
|
472 |
|
|
/* 32-bit count leading Zeros*/
|
473 |
|
|
set_optab_libfunc (clz_optab, SImode, "_clzsi2");
|
474 |
|
|
|
475 |
|
|
/* 64-bit comparison */
|
476 |
|
|
set_optab_libfunc (ucmp_optab, DImode, "__ucmpdi2");
|
477 |
|
|
set_optab_libfunc (cmp_optab, DImode, "__cmpdi2");
|
478 |
|
|
|
479 |
|
|
/* 64-bit addition and subtraction*/
|
480 |
|
|
set_optab_libfunc (add_optab, DImode, "_adddi3");
|
481 |
|
|
set_optab_libfunc (sub_optab, DImode, "_subdi3");
|
482 |
|
|
}
|
483 |
|
|
|
484 |
|
|
/* Memcpy function */
|
485 |
|
|
int
|
486 |
|
|
picochip_expand_movmemhi (rtx *operands)
|
487 |
|
|
{
|
488 |
|
|
rtx src_addr_reg, dst_addr_reg, count_reg, src_mem, dst_mem, tmp_reg;
|
489 |
|
|
rtx start_label;
|
490 |
|
|
int align, size;
|
491 |
|
|
src_addr_reg = gen_reg_rtx(HImode);
|
492 |
|
|
dst_addr_reg = gen_reg_rtx(HImode);
|
493 |
|
|
count_reg = gen_reg_rtx(HImode);
|
494 |
|
|
emit_insn (gen_movhi (count_reg, operands[2]));
|
495 |
|
|
emit_insn (gen_movqi (src_addr_reg, XEXP(operands[1], 0)));
|
496 |
|
|
emit_insn (gen_movqi (dst_addr_reg, XEXP(operands[0], 0)));
|
497 |
|
|
gcc_assert (GET_CODE(count_reg) == REG);
|
498 |
|
|
start_label = gen_label_rtx ();
|
499 |
|
|
emit_label (start_label);
|
500 |
|
|
|
501 |
|
|
/* We can specialise the code for different alignments */
|
502 |
|
|
align = INTVAL(operands[3]);
|
503 |
|
|
size = INTVAL(operands[2]);
|
504 |
|
|
gcc_assert(align >= 0 && size >= 0);
|
505 |
|
|
if (size != 0)
|
506 |
|
|
{
|
507 |
|
|
if (size % 4 == 0 && align % 4 == 0)
|
508 |
|
|
{
|
509 |
|
|
src_mem = gen_rtx_MEM(SImode, src_addr_reg);
|
510 |
|
|
dst_mem = gen_rtx_MEM(SImode, dst_addr_reg);
|
511 |
|
|
tmp_reg = gen_reg_rtx(SImode);
|
512 |
|
|
emit_insn (gen_movsi (tmp_reg, src_mem));
|
513 |
|
|
emit_insn (gen_movsi (dst_mem, tmp_reg));
|
514 |
|
|
emit_insn (gen_addhi3 (dst_addr_reg, dst_addr_reg, GEN_INT(4)));
|
515 |
|
|
emit_insn (gen_addhi3 (src_addr_reg, src_addr_reg, GEN_INT(4)));
|
516 |
|
|
emit_insn (gen_addhi3 (count_reg, count_reg, GEN_INT(-4)));
|
517 |
|
|
/* The sub instruction above generates cc, but we cannot just emit the branch.*/
|
518 |
|
|
emit_cmp_and_jump_insns (count_reg, const0_rtx, GT, 0, HImode, 0, start_label);
|
519 |
|
|
}
|
520 |
|
|
else if (size % 2 == 0 && align % 2 == 0)
|
521 |
|
|
{
|
522 |
|
|
src_mem = gen_rtx_MEM(HImode, src_addr_reg);
|
523 |
|
|
dst_mem = gen_rtx_MEM(HImode, dst_addr_reg);
|
524 |
|
|
tmp_reg = gen_reg_rtx(HImode);
|
525 |
|
|
emit_insn (gen_movhi (tmp_reg, src_mem));
|
526 |
|
|
emit_insn (gen_movhi (dst_mem, tmp_reg));
|
527 |
|
|
emit_insn (gen_addhi3 (dst_addr_reg, dst_addr_reg, const2_rtx));
|
528 |
|
|
emit_insn (gen_addhi3 (src_addr_reg, src_addr_reg, const2_rtx));
|
529 |
|
|
emit_insn (gen_addhi3 (count_reg, count_reg, GEN_INT(-2)));
|
530 |
|
|
/* The sub instruction above generates cc, but we cannot just emit the branch.*/
|
531 |
|
|
emit_cmp_and_jump_insns (count_reg, const0_rtx, GT, 0, HImode, 0, start_label);
|
532 |
|
|
}
|
533 |
|
|
else
|
534 |
|
|
{
|
535 |
|
|
src_mem = gen_rtx_MEM(QImode, src_addr_reg);
|
536 |
|
|
dst_mem = gen_rtx_MEM(QImode, dst_addr_reg);
|
537 |
|
|
tmp_reg = gen_reg_rtx(QImode);
|
538 |
|
|
emit_insn (gen_movqi (tmp_reg, src_mem));
|
539 |
|
|
emit_insn (gen_movqi (dst_mem, tmp_reg));
|
540 |
|
|
emit_insn (gen_addhi3 (dst_addr_reg, dst_addr_reg, const1_rtx));
|
541 |
|
|
emit_insn (gen_addhi3 (src_addr_reg, src_addr_reg, const1_rtx));
|
542 |
|
|
emit_insn (gen_addhi3 (count_reg, count_reg, GEN_INT(-1)));
|
543 |
|
|
/* The sub instruction above generates cc, but we cannot just emit the branch.*/
|
544 |
|
|
emit_cmp_and_jump_insns (count_reg, const0_rtx, GT, 0, HImode, 0, start_label);
|
545 |
|
|
}
|
546 |
|
|
}
|
547 |
|
|
return 1;
|
548 |
|
|
}
|
549 |
|
|
|
550 |
|
|
|
551 |
|
|
/* Return the register class for letter C. */
|
552 |
|
|
enum reg_class
|
553 |
|
|
picochip_reg_class_from_letter (unsigned c)
|
554 |
|
|
{
|
555 |
|
|
switch (c)
|
556 |
|
|
{
|
557 |
|
|
case 'k':
|
558 |
|
|
return FRAME_REGS;
|
559 |
|
|
case 'f':
|
560 |
|
|
return PTR_REGS;
|
561 |
|
|
case 't':
|
562 |
|
|
return TWIN_REGS;
|
563 |
|
|
case 'r':
|
564 |
|
|
return GR_REGS;
|
565 |
|
|
default:
|
566 |
|
|
return NO_REGS;
|
567 |
|
|
}
|
568 |
|
|
}
|
569 |
|
|
|
570 |
|
|
static const int
|
571 |
|
|
pico_leaf_reg_alloc_order[] = LEAF_REG_ALLOC_ORDER;
|
572 |
|
|
static const int
|
573 |
|
|
pico_nonleaf_reg_alloc_order[] = REG_ALLOC_ORDER;
|
574 |
|
|
|
575 |
|
|
void
|
576 |
|
|
picochip_order_regs_for_local_alloc (void)
|
577 |
|
|
{
|
578 |
|
|
/* We change the order for leaf functions alone. We put r12 at
|
579 |
|
|
the end since using it will prevent us to combine stw/ldws to
|
580 |
|
|
stl/ldl and it gives no benefit. In non-leaf functions, we
|
581 |
|
|
would anyway saveup/restore r12, so it makes sense to use it.*/
|
582 |
|
|
|
583 |
|
|
if (leaf_function_p())
|
584 |
|
|
{
|
585 |
|
|
memcpy ((char *)reg_alloc_order, (const char *) pico_leaf_reg_alloc_order,
|
586 |
|
|
FIRST_PSEUDO_REGISTER * sizeof (int));
|
587 |
|
|
}
|
588 |
|
|
else
|
589 |
|
|
{
|
590 |
|
|
memcpy ((char *)reg_alloc_order, (const char *) pico_nonleaf_reg_alloc_order,
|
591 |
|
|
FIRST_PSEUDO_REGISTER * sizeof (int));
|
592 |
|
|
}
|
593 |
|
|
}
|
594 |
|
|
|
595 |
|
|
/* Check that VALUE (an INT_CST) is ok as a constant of type C. */
|
596 |
|
|
int
|
597 |
|
|
picochip_const_ok_for_letter_p (unsigned HOST_WIDE_INT value, unsigned c)
|
598 |
|
|
{
|
599 |
|
|
|
600 |
|
|
switch (c)
|
601 |
|
|
{
|
602 |
|
|
case 'I': /* 4 bits signed. */
|
603 |
|
|
return value + 8 < 16;
|
604 |
|
|
case 'J': /* 4 bits unsigned. */
|
605 |
|
|
return value < 16;
|
606 |
|
|
case 'K': /* 8 bits signed. */
|
607 |
|
|
return value + 128 < 256;
|
608 |
|
|
case 'M': /* 4-bit magnitude. */
|
609 |
|
|
return abs (value) < 16;
|
610 |
|
|
case 'N': /* 10 bits signed. */
|
611 |
|
|
return value + 512 > 1024;
|
612 |
|
|
case 'O': /* 16 bits signed. */
|
613 |
|
|
return value + 32768 < 65536;
|
614 |
|
|
default: /* Unknown letter. */
|
615 |
|
|
return 0;
|
616 |
|
|
}
|
617 |
|
|
}
|
618 |
|
|
|
619 |
|
|
/* Stack utility functions. */
|
620 |
|
|
rtx
|
621 |
|
|
picochip_return_addr_rtx(int count, rtx frameaddr ATTRIBUTE_UNUSED)
|
622 |
|
|
{
|
623 |
|
|
if (count==0)
|
624 |
|
|
return gen_rtx_REG (Pmode, LINK_REGNUM);
|
625 |
|
|
else
|
626 |
|
|
return NULL_RTX;
|
627 |
|
|
}
|
628 |
|
|
|
629 |
|
|
|
630 |
|
|
/* Emit a set of parallel register expressions used to store
|
631 |
|
|
blockmode values to pass to functions. */
|
632 |
|
|
static rtx
|
633 |
|
|
picochip_emit_register_parallel (int size_in_units, int offset)
|
634 |
|
|
{
|
635 |
|
|
int num_regs = 0;
|
636 |
|
|
rtx result;
|
637 |
|
|
rtx vector[MAX_CALL_PARAMETER_REGS];
|
638 |
|
|
int base_reg = 0;
|
639 |
|
|
int i = 0;
|
640 |
|
|
|
641 |
|
|
/* Compute the base register, and number of required registers. */
|
642 |
|
|
base_reg = offset / 2;
|
643 |
|
|
num_regs = size_in_units / 2;
|
644 |
|
|
if (size_in_units % 2 == 1)
|
645 |
|
|
num_regs++;
|
646 |
|
|
|
647 |
|
|
/* Emit a register for each part of the block mode value to be
|
648 |
|
|
passed in a register. */
|
649 |
|
|
for (i = 0; i < num_regs; i++)
|
650 |
|
|
vector[i] = gen_rtx_EXPR_LIST (VOIDmode,
|
651 |
|
|
gen_rtx_REG (HImode, base_reg + i),
|
652 |
|
|
GEN_INT (i * 2));
|
653 |
|
|
result = gen_rtx_PARALLEL (BLKmode, gen_rtvec_v (num_regs, vector));
|
654 |
|
|
|
655 |
|
|
return result;
|
656 |
|
|
|
657 |
|
|
}
|
658 |
|
|
|
659 |
|
|
/* Emit an instruction to allocate a suitable amount of space on the
|
660 |
|
|
stack, by decrementing the stack pointer. */
|
661 |
|
|
static void
|
662 |
|
|
picochip_emit_stack_allocate (int adjustment)
|
663 |
|
|
{
|
664 |
|
|
rtx insn;
|
665 |
|
|
rtx stack_pointer_reg = gen_rtx_REG (Pmode, STACK_POINTER_REGNUM);
|
666 |
|
|
|
667 |
|
|
/* Use an addition of a negative value. */
|
668 |
|
|
insn = emit_insn (gen_addhi3 (stack_pointer_reg, stack_pointer_reg,
|
669 |
|
|
GEN_INT (-adjustment)));
|
670 |
|
|
|
671 |
|
|
/* Make the instruction frame related. Also add an expression note,
|
672 |
|
|
so that the correct Dwarf information is generated (see documention
|
673 |
|
|
for RTX_FRAME_RELATED_P for more details). */
|
674 |
|
|
RTX_FRAME_RELATED_P (insn) = 1;
|
675 |
|
|
add_reg_note (insn, REG_FRAME_RELATED_EXPR,
|
676 |
|
|
gen_rtx_SET (VOIDmode, stack_pointer_reg,
|
677 |
|
|
gen_rtx_PLUS (Pmode, stack_pointer_reg,
|
678 |
|
|
GEN_INT (-adjustment))));
|
679 |
|
|
|
680 |
|
|
}
|
681 |
|
|
|
682 |
|
|
/* Emit an instruction to save a register of the given mode. The
|
683 |
|
|
offset at which to save the register is given relative to the stack
|
684 |
|
|
pointer. */
|
685 |
|
|
static void
|
686 |
|
|
picochip_emit_save_register (rtx reg, int offset)
|
687 |
|
|
{
|
688 |
|
|
rtx stack_pointer, address, mem, insn;
|
689 |
|
|
|
690 |
|
|
stack_pointer = gen_rtx_REG (Pmode, STACK_POINTER_REGNUM);
|
691 |
|
|
|
692 |
|
|
address = gen_rtx_PLUS (Pmode, stack_pointer, GEN_INT (offset));
|
693 |
|
|
|
694 |
|
|
mem = gen_rtx_MEM (GET_MODE (reg), address);
|
695 |
|
|
|
696 |
|
|
insn = emit_move_insn (mem, reg);
|
697 |
|
|
RTX_FRAME_RELATED_P (insn) = 1;
|
698 |
|
|
|
699 |
|
|
/* For modes other than HImode, create a note explaining that
|
700 |
|
|
multiple registers have been saved. This allows the correct DWARF
|
701 |
|
|
call frame information to be generated. */
|
702 |
|
|
switch (GET_MODE (reg))
|
703 |
|
|
{
|
704 |
|
|
case HImode:
|
705 |
|
|
/* The RTL is sufficient to explain HImode register saves. */
|
706 |
|
|
break;
|
707 |
|
|
|
708 |
|
|
case SImode:
|
709 |
|
|
/* SImode must be broken down into parallel HImode register saves. */
|
710 |
|
|
{
|
711 |
|
|
rtvec p;
|
712 |
|
|
p = rtvec_alloc (2);
|
713 |
|
|
|
714 |
|
|
RTVEC_ELT (p, 0) =
|
715 |
|
|
gen_rtx_SET (HImode,
|
716 |
|
|
gen_rtx_MEM (HImode,
|
717 |
|
|
gen_rtx_PLUS (Pmode, stack_pointer,
|
718 |
|
|
GEN_INT (offset))),
|
719 |
|
|
gen_rtx_REG (HImode, REGNO (reg)));
|
720 |
|
|
RTX_FRAME_RELATED_P (RTVEC_ELT (p, 0)) = 1;
|
721 |
|
|
|
722 |
|
|
RTVEC_ELT (p, 1) =
|
723 |
|
|
gen_rtx_SET (HImode, gen_rtx_MEM (HImode,
|
724 |
|
|
gen_rtx_PLUS (Pmode,
|
725 |
|
|
stack_pointer,
|
726 |
|
|
GEN_INT (offset +
|
727 |
|
|
2))),
|
728 |
|
|
gen_rtx_REG (HImode, REGNO (reg) + 1));
|
729 |
|
|
RTX_FRAME_RELATED_P (RTVEC_ELT (p, 1)) = 1;
|
730 |
|
|
|
731 |
|
|
add_reg_note (insn, REG_FRAME_RELATED_EXPR,
|
732 |
|
|
gen_rtx_PARALLEL (VOIDmode, p));
|
733 |
|
|
|
734 |
|
|
}
|
735 |
|
|
break;
|
736 |
|
|
|
737 |
|
|
default:
|
738 |
|
|
internal_error
|
739 |
|
|
("unexpected mode %s encountered in picochip_emit_save_register",
|
740 |
|
|
GET_MODE_NAME (GET_MODE (reg)));
|
741 |
|
|
}
|
742 |
|
|
|
743 |
|
|
}
|
744 |
|
|
|
745 |
|
|
/* Emit an instruction to restore a register of the given mode. The
|
746 |
|
|
offset from which to restore the register is given relative to the
|
747 |
|
|
stack pointer. */
|
748 |
|
|
static void
|
749 |
|
|
picochip_emit_restore_register (rtx reg, int offset)
|
750 |
|
|
{
|
751 |
|
|
rtx stack_pointer, address, mem;
|
752 |
|
|
|
753 |
|
|
stack_pointer = gen_rtx_REG (Pmode, STACK_POINTER_REGNUM);
|
754 |
|
|
|
755 |
|
|
address = gen_rtx_PLUS (Pmode, stack_pointer, GEN_INT (offset));
|
756 |
|
|
|
757 |
|
|
mem = gen_rtx_MEM (GET_MODE (reg), address);
|
758 |
|
|
|
759 |
|
|
emit_move_insn (reg, mem);
|
760 |
|
|
|
761 |
|
|
}
|
762 |
|
|
|
763 |
|
|
/* Check that the given byte offset is aligned to the given number of
|
764 |
|
|
bits. */
|
765 |
|
|
static int
|
766 |
|
|
picochip_is_aligned (int byte_offset, int bit_alignment)
|
767 |
|
|
{
|
768 |
|
|
int byte_alignment = bit_alignment / BITS_PER_UNIT;
|
769 |
|
|
return (byte_offset % byte_alignment) == 0;
|
770 |
|
|
}
|
771 |
|
|
|
772 |
|
|
/*****************************************************************************
|
773 |
|
|
* Stack layout.
|
774 |
|
|
*
|
775 |
|
|
* The following section contains code which controls how the stack is
|
776 |
|
|
* laid out.
|
777 |
|
|
*
|
778 |
|
|
* The stack is laid out as follows (high addresses first):
|
779 |
|
|
*
|
780 |
|
|
* Incoming arguments
|
781 |
|
|
* Pretend arguments (ARG PTR)
|
782 |
|
|
* Special registers
|
783 |
|
|
* General registers
|
784 |
|
|
* Frame (FP)
|
785 |
|
|
* Outgoing arguments (SP)
|
786 |
|
|
*
|
787 |
|
|
* The (constant) offsets of the different areas must be calculated
|
788 |
|
|
* relative to the stack area immediately below, and aligned
|
789 |
|
|
* appropriately. For example, the frame offset is computed by
|
790 |
|
|
* determining the offset of the special register area, adding the
|
791 |
|
|
* size of the special register area, and then aligning the resulting
|
792 |
|
|
* offset correctly. In turn, the special register offset is computed
|
793 |
|
|
* from the general register offset, and so on. This enables the
|
794 |
|
|
* different offsets to change size and alignment, without requiring
|
795 |
|
|
* the code for other offset calculations to be rewritten.
|
796 |
|
|
*
|
797 |
|
|
* The argument pointer, and the frame pointer are eliminated wherever
|
798 |
|
|
* possible, by replacing them with a constant offset from the stack
|
799 |
|
|
* pointer. In the rare cases where constant offsets from the stack
|
800 |
|
|
* pointer cannot be computed, another register will be allocated to
|
801 |
|
|
* serve as the argument pointer, or the frame pointer.
|
802 |
|
|
*
|
803 |
|
|
* The save registers are stored at small offsets from the caller, to
|
804 |
|
|
* enable the more efficient SP-based ISA instructions to be used.
|
805 |
|
|
*
|
806 |
|
|
****************************************************************************/
|
807 |
|
|
|
808 |
|
|
/* Compute the size of an argument in units. */
|
809 |
|
|
static int
|
810 |
|
|
picochip_compute_arg_size (const_tree type, enum machine_mode mode)
|
811 |
|
|
{
|
812 |
|
|
int type_size_in_units = 0;
|
813 |
|
|
|
814 |
|
|
if (type)
|
815 |
|
|
type_size_in_units = tree_low_cst (TYPE_SIZE_UNIT (type), 1);
|
816 |
|
|
else
|
817 |
|
|
type_size_in_units = GET_MODE_SIZE (mode);
|
818 |
|
|
|
819 |
|
|
return type_size_in_units;
|
820 |
|
|
|
821 |
|
|
}
|
822 |
|
|
|
823 |
|
|
/* Determine where the next outgoing arg should be placed. */
|
824 |
|
|
rtx
|
825 |
|
|
picochip_function_arg (cumulative_args_t cum_v, enum machine_mode mode,
|
826 |
|
|
const_tree type, bool named ATTRIBUTE_UNUSED)
|
827 |
|
|
{
|
828 |
|
|
CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
|
829 |
|
|
int reg = 0;
|
830 |
|
|
int type_align_in_units = 0;
|
831 |
|
|
int type_size_in_units;
|
832 |
|
|
int new_offset = 0;
|
833 |
|
|
int offset_overflow = 0;
|
834 |
|
|
|
835 |
|
|
/* VOIDmode is passed when computing the second argument to a `call'
|
836 |
|
|
pattern. This can be ignored. */
|
837 |
|
|
if (mode == VOIDmode)
|
838 |
|
|
return 0;
|
839 |
|
|
|
840 |
|
|
/* Compute the alignment and size of the parameter. */
|
841 |
|
|
type_align_in_units =
|
842 |
|
|
picochip_function_arg_boundary (mode, type) / BITS_PER_UNIT;
|
843 |
|
|
type_size_in_units = picochip_compute_arg_size (type, mode);
|
844 |
|
|
|
845 |
|
|
/* Compute the correct offset (i.e., ensure that the offset meets
|
846 |
|
|
the alignment requirements). */
|
847 |
|
|
offset_overflow = *cum % type_align_in_units;
|
848 |
|
|
if (offset_overflow == 0)
|
849 |
|
|
new_offset = *cum;
|
850 |
|
|
else
|
851 |
|
|
new_offset = (*cum - offset_overflow) + type_align_in_units;
|
852 |
|
|
|
853 |
|
|
if (TARGET_DEBUG)
|
854 |
|
|
{
|
855 |
|
|
printf ("Function arg:\n");
|
856 |
|
|
printf (" Type valid: %s\n", (type ? "yes" : "no"));
|
857 |
|
|
printf (" Cumulative Value: %d\n", *cum);
|
858 |
|
|
printf (" Mode: %s\n", GET_MODE_NAME (mode));
|
859 |
|
|
printf (" Type size: %i units\n", type_size_in_units);
|
860 |
|
|
printf (" Alignment: %i units\n", type_align_in_units);
|
861 |
|
|
printf (" New offset: %i\n", new_offset);
|
862 |
|
|
printf ("\n");
|
863 |
|
|
}
|
864 |
|
|
|
865 |
|
|
/* If the new offset is outside the register space, return. */
|
866 |
|
|
if (new_offset >= MAX_CALL_PARAMETER_REGS * 2)
|
867 |
|
|
return 0;
|
868 |
|
|
|
869 |
|
|
/* If the end of the argument is outside the register space, then
|
870 |
|
|
the argument must overlap the register space. Return the first
|
871 |
|
|
available register. */
|
872 |
|
|
if ((new_offset + type_size_in_units) > (MAX_CALL_PARAMETER_REGS * 2))
|
873 |
|
|
return gen_rtx_REG (HImode, new_offset / 2);
|
874 |
|
|
|
875 |
|
|
/* Create a register of the required mode to hold the parameter. */
|
876 |
|
|
reg = new_offset / 2;
|
877 |
|
|
switch (mode)
|
878 |
|
|
{
|
879 |
|
|
case QImode:
|
880 |
|
|
case HImode:
|
881 |
|
|
case SImode:
|
882 |
|
|
case SFmode:
|
883 |
|
|
case DImode:
|
884 |
|
|
case DFmode:
|
885 |
|
|
case SDmode:
|
886 |
|
|
case DDmode:
|
887 |
|
|
case CHImode:
|
888 |
|
|
case CSImode:
|
889 |
|
|
case SCmode:
|
890 |
|
|
case CQImode:
|
891 |
|
|
return gen_rtx_REG (mode, reg);
|
892 |
|
|
|
893 |
|
|
case BLKmode:
|
894 |
|
|
{
|
895 |
|
|
/* Empty blockmode values can be passed as arguments (e.g.,
|
896 |
|
|
* empty structs). These require no registers
|
897 |
|
|
* whatsoever. Non-empty blockmode values are passed in a set
|
898 |
|
|
* of parallel registers. */
|
899 |
|
|
if (type_size_in_units == 0)
|
900 |
|
|
return 0;
|
901 |
|
|
else
|
902 |
|
|
return picochip_emit_register_parallel (type_size_in_units, new_offset);
|
903 |
|
|
}
|
904 |
|
|
|
905 |
|
|
default:
|
906 |
|
|
warning
|
907 |
|
|
(0, "defaulting to stack for %s register creation",
|
908 |
|
|
GET_MODE_NAME (mode));
|
909 |
|
|
break;
|
910 |
|
|
}
|
911 |
|
|
|
912 |
|
|
return 0;
|
913 |
|
|
|
914 |
|
|
}
|
915 |
|
|
|
916 |
|
|
/* Determine where the next incoming function argument will
|
917 |
|
|
appear. Normally, this works in exactly the same way as
|
918 |
|
|
picochip_function_arg, except when the function in question is a
|
919 |
|
|
varadic function. In this case, the incoming arguments all appear
|
920 |
|
|
to be passed on the stack (actually, some of the arguments are
|
921 |
|
|
passed in registers, which are then pushed onto the stack by the
|
922 |
|
|
function prologue). */
|
923 |
|
|
rtx
|
924 |
|
|
picochip_incoming_function_arg (cumulative_args_t cum,
|
925 |
|
|
enum machine_mode mode,
|
926 |
|
|
const_tree type, bool named)
|
927 |
|
|
{
|
928 |
|
|
|
929 |
|
|
if (cfun->stdarg)
|
930 |
|
|
return 0;
|
931 |
|
|
else
|
932 |
|
|
return picochip_function_arg (cum, mode, type, named);
|
933 |
|
|
|
934 |
|
|
}
|
935 |
|
|
|
936 |
|
|
/* Gives the alignment boundary, in bits, of an argument with the
|
937 |
|
|
specified mode. */
|
938 |
|
|
unsigned int
|
939 |
|
|
picochip_function_arg_boundary (enum machine_mode mode,
|
940 |
|
|
const_tree type ATTRIBUTE_UNUSED)
|
941 |
|
|
{
|
942 |
|
|
int align;
|
943 |
|
|
|
944 |
|
|
if (mode == BLKmode)
|
945 |
|
|
align = STACK_BOUNDARY;
|
946 |
|
|
else
|
947 |
|
|
align = GET_MODE_ALIGNMENT (mode);
|
948 |
|
|
|
949 |
|
|
if (align < PARM_BOUNDARY)
|
950 |
|
|
align = PARM_BOUNDARY;
|
951 |
|
|
|
952 |
|
|
return align;
|
953 |
|
|
|
954 |
|
|
}
|
955 |
|
|
|
956 |
|
|
/* Compute partial registers. */
|
957 |
|
|
int
|
958 |
|
|
picochip_arg_partial_bytes (cumulative_args_t p_cum, enum machine_mode mode,
|
959 |
|
|
tree type, bool named ATTRIBUTE_UNUSED)
|
960 |
|
|
{
|
961 |
|
|
int type_align_in_units = 0;
|
962 |
|
|
int type_size_in_units;
|
963 |
|
|
int new_offset = 0;
|
964 |
|
|
int offset_overflow = 0;
|
965 |
|
|
|
966 |
|
|
unsigned cum = *get_cumulative_args (p_cum);
|
967 |
|
|
|
968 |
|
|
/* VOIDmode is passed when computing the second argument to a `call'
|
969 |
|
|
pattern. This can be ignored. */
|
970 |
|
|
if (mode == VOIDmode)
|
971 |
|
|
return 0;
|
972 |
|
|
|
973 |
|
|
/* Compute the alignment and size of the parameter. */
|
974 |
|
|
type_align_in_units =
|
975 |
|
|
picochip_function_arg_boundary (mode, type) / BITS_PER_UNIT;
|
976 |
|
|
type_size_in_units = picochip_compute_arg_size (type, mode);
|
977 |
|
|
|
978 |
|
|
/* Compute the correct offset (i.e., ensure that the offset meets
|
979 |
|
|
the alignment requirements). */
|
980 |
|
|
offset_overflow = cum % type_align_in_units;
|
981 |
|
|
if (offset_overflow == 0)
|
982 |
|
|
new_offset = cum;
|
983 |
|
|
else
|
984 |
|
|
new_offset = (cum - offset_overflow) + type_align_in_units;
|
985 |
|
|
|
986 |
|
|
if (TARGET_DEBUG)
|
987 |
|
|
{
|
988 |
|
|
printf ("Partial function arg nregs:\n");
|
989 |
|
|
printf (" Type valid: %s\n", (type ? "yes" : "no"));
|
990 |
|
|
printf (" Cumulative Value: %d\n", cum);
|
991 |
|
|
printf (" Mode: %s\n", GET_MODE_NAME (mode));
|
992 |
|
|
printf (" Type size: %i units\n", type_size_in_units);
|
993 |
|
|
printf (" Alignment: %i units\n", type_align_in_units);
|
994 |
|
|
printf (" New offset: %i\n", new_offset);
|
995 |
|
|
printf ("\n");
|
996 |
|
|
}
|
997 |
|
|
|
998 |
|
|
/* If the new offset is outside the register space, return. */
|
999 |
|
|
if (new_offset >= (MAX_CALL_PARAMETER_REGS * 2))
|
1000 |
|
|
return 0;
|
1001 |
|
|
|
1002 |
|
|
/* If the end of the argument is outside the register space, then
|
1003 |
|
|
the argument must overlap the register space. Return the number
|
1004 |
|
|
of bytes which are passed in registers. */
|
1005 |
|
|
if ((new_offset + type_size_in_units) > (MAX_CALL_PARAMETER_REGS * 2))
|
1006 |
|
|
return ((MAX_CALL_PARAMETER_REGS * 2) - new_offset);
|
1007 |
|
|
|
1008 |
|
|
return 0;
|
1009 |
|
|
|
1010 |
|
|
}
|
1011 |
|
|
|
1012 |
|
|
/* Advance the cumulative args counter CUM. */
|
1013 |
|
|
void
|
1014 |
|
|
picochip_arg_advance (cumulative_args_t cum_v, enum machine_mode mode,
|
1015 |
|
|
const_tree type, bool named ATTRIBUTE_UNUSED)
|
1016 |
|
|
{
|
1017 |
|
|
CUMULATIVE_ARGS *cum = get_cumulative_args (cum_v);
|
1018 |
|
|
int type_align_in_units = 0;
|
1019 |
|
|
int type_size_in_units;
|
1020 |
|
|
int new_offset = 0;
|
1021 |
|
|
int offset_overflow = 0;
|
1022 |
|
|
|
1023 |
|
|
/* VOIDmode is passed when computing the second argument to a `call'
|
1024 |
|
|
pattern. This can be ignored. */
|
1025 |
|
|
if (mode == VOIDmode)
|
1026 |
|
|
return;
|
1027 |
|
|
|
1028 |
|
|
/* Compute the alignment and size of the parameter. */
|
1029 |
|
|
type_align_in_units =
|
1030 |
|
|
picochip_function_arg_boundary (mode, type) / BITS_PER_UNIT;
|
1031 |
|
|
type_size_in_units = picochip_compute_arg_size (type, mode);
|
1032 |
|
|
|
1033 |
|
|
/* Compute the correct offset (i.e., ensure that the offset meets
|
1034 |
|
|
the alignment requirements). */
|
1035 |
|
|
offset_overflow = *cum % type_align_in_units;
|
1036 |
|
|
if (offset_overflow == 0)
|
1037 |
|
|
new_offset = *cum;
|
1038 |
|
|
else
|
1039 |
|
|
new_offset = (*cum - offset_overflow) + type_align_in_units;
|
1040 |
|
|
|
1041 |
|
|
/* Advance past the last argument. */
|
1042 |
|
|
new_offset += type_size_in_units;
|
1043 |
|
|
|
1044 |
|
|
*cum = new_offset;
|
1045 |
|
|
}
|
1046 |
|
|
|
1047 |
|
|
/* Determine whether a register needs saving/restoring. It does if it
|
1048 |
|
|
is live in a function, and isn't a call-used register. */
|
1049 |
|
|
static int
|
1050 |
|
|
picochip_reg_needs_saving (int reg_num)
|
1051 |
|
|
{
|
1052 |
|
|
return df_regs_ever_live_p(reg_num) && !call_used_regs[reg_num];
|
1053 |
|
|
}
|
1054 |
|
|
|
1055 |
|
|
/* Compute and return offset of the main frame. */
|
1056 |
|
|
static int
|
1057 |
|
|
picochip_frame_byte_offset (void)
|
1058 |
|
|
{
|
1059 |
|
|
gcc_assert(picochip_is_aligned
|
1060 |
|
|
(crtl->outgoing_args_size, BITS_PER_WORD));
|
1061 |
|
|
|
1062 |
|
|
return crtl->outgoing_args_size;
|
1063 |
|
|
}
|
1064 |
|
|
|
1065 |
|
|
/* Return the size of the main frame. */
|
1066 |
|
|
static int
|
1067 |
|
|
picochip_frame_size_in_bytes (void)
|
1068 |
|
|
{
|
1069 |
|
|
int frame_size = get_frame_size();
|
1070 |
|
|
int stack_align = STACK_BOUNDARY/BITS_PER_UNIT;
|
1071 |
|
|
if (!picochip_is_aligned (frame_size, STACK_BOUNDARY))
|
1072 |
|
|
frame_size = frame_size + (stack_align - frame_size%stack_align);
|
1073 |
|
|
gcc_assert(picochip_is_aligned (frame_size, STACK_BOUNDARY));
|
1074 |
|
|
return frame_size;
|
1075 |
|
|
}
|
1076 |
|
|
|
1077 |
|
|
/* Compute and return the size (in bytes) of the register save/restore
|
1078 |
|
|
area for the current function. This only includes the general
|
1079 |
|
|
purpose registers - the special purpose stack pointer and link
|
1080 |
|
|
registers are not included in this area. */
|
1081 |
|
|
static int
|
1082 |
|
|
picochip_save_area_size_in_bytes (void)
|
1083 |
|
|
{
|
1084 |
|
|
int num_regs_to_save = 0;
|
1085 |
|
|
int i = 0;
|
1086 |
|
|
|
1087 |
|
|
/* Read through all the registers, determining which need to be saved. */
|
1088 |
|
|
for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
|
1089 |
|
|
{
|
1090 |
|
|
if (picochip_reg_needs_saving (i))
|
1091 |
|
|
num_regs_to_save += 1;
|
1092 |
|
|
}
|
1093 |
|
|
|
1094 |
|
|
return num_regs_to_save * UNITS_PER_WORD;
|
1095 |
|
|
|
1096 |
|
|
}
|
1097 |
|
|
|
1098 |
|
|
/* Compute and return offset of the save area base. */
|
1099 |
|
|
static int
|
1100 |
|
|
picochip_save_area_byte_offset (void)
|
1101 |
|
|
{
|
1102 |
|
|
int base_offset = (picochip_frame_byte_offset () +
|
1103 |
|
|
picochip_frame_size_in_bytes ());
|
1104 |
|
|
|
1105 |
|
|
gcc_assert(picochip_is_aligned (base_offset, BITS_PER_WORD));
|
1106 |
|
|
|
1107 |
|
|
return base_offset;
|
1108 |
|
|
|
1109 |
|
|
}
|
1110 |
|
|
|
1111 |
|
|
/* Compute and return offset of the special register save area. This
|
1112 |
|
|
area can be found immediately above the normal save area. It must
|
1113 |
|
|
be aligned, to allow the registers to be saved and restored as a
|
1114 |
|
|
pair. */
|
1115 |
|
|
static int
|
1116 |
|
|
picochip_special_save_area_byte_offset (void)
|
1117 |
|
|
{
|
1118 |
|
|
int byte_alignment = STACK_BOUNDARY / BITS_PER_UNIT;
|
1119 |
|
|
int offset = (picochip_save_area_byte_offset () +
|
1120 |
|
|
picochip_save_area_size_in_bytes ());
|
1121 |
|
|
|
1122 |
|
|
if ((offset % byte_alignment) != 0)
|
1123 |
|
|
offset = ((offset / byte_alignment) + 1) * byte_alignment;
|
1124 |
|
|
|
1125 |
|
|
return offset;
|
1126 |
|
|
|
1127 |
|
|
}
|
1128 |
|
|
|
1129 |
|
|
/* Determine whether the LNK/SP register save/restores can be eliminated. */
|
1130 |
|
|
static int
|
1131 |
|
|
picochip_can_eliminate_link_sp_save (void)
|
1132 |
|
|
{
|
1133 |
|
|
/* This deserves some reasoning. The df_regs_ever_live_p call keeps
|
1134 |
|
|
changing during optimizations phases. So, this function returns different
|
1135 |
|
|
values when called from initial_elimination_offset and then again when it
|
1136 |
|
|
is called from prologue/epilogue generation. This means that argument
|
1137 |
|
|
accesses become wrong. This wouldnt happen only if we were not using the
|
1138 |
|
|
stack at all. The following conditions ensures that.*/
|
1139 |
|
|
|
1140 |
|
|
return (current_function_is_leaf &&
|
1141 |
|
|
!df_regs_ever_live_p(LINK_REGNUM) &&
|
1142 |
|
|
!df_regs_ever_live_p(STACK_POINTER_REGNUM) &&
|
1143 |
|
|
(picochip_special_save_area_byte_offset() == 0) &&
|
1144 |
|
|
(crtl->args.size == 0) &&
|
1145 |
|
|
(crtl->args.pretend_args_size == 0));
|
1146 |
|
|
}
|
1147 |
|
|
|
1148 |
|
|
/* Compute the size of the special reg save area (SP and LNK). If the
|
1149 |
|
|
SP/LNK registers don't need to be saved, this area can shrink to
|
1150 |
|
|
nothing. */
|
1151 |
|
|
static int
|
1152 |
|
|
picochip_special_save_area_size_in_bytes (void)
|
1153 |
|
|
{
|
1154 |
|
|
|
1155 |
|
|
|
1156 |
|
|
if (picochip_can_eliminate_link_sp_save ())
|
1157 |
|
|
return 0;
|
1158 |
|
|
else
|
1159 |
|
|
return 2 * UNITS_PER_WORD;
|
1160 |
|
|
}
|
1161 |
|
|
|
1162 |
|
|
/* Return the number of pretend arguments. If this function is
|
1163 |
|
|
varadic, all the incoming arguments are effectively passed on the
|
1164 |
|
|
stack. If this function has real pretend arguments (caused by a
|
1165 |
|
|
value being passed partially on the stack and partially in
|
1166 |
|
|
registers), then return the number of registers used. */
|
1167 |
|
|
static int
|
1168 |
|
|
picochip_pretend_arg_area_size (void)
|
1169 |
|
|
{
|
1170 |
|
|
|
1171 |
|
|
if (crtl->args.pretend_args_size != 0)
|
1172 |
|
|
{
|
1173 |
|
|
gcc_assert(crtl->args.pretend_args_size % 4 == 0);
|
1174 |
|
|
|
1175 |
|
|
return crtl->args.pretend_args_size;
|
1176 |
|
|
}
|
1177 |
|
|
else if (cfun->stdarg)
|
1178 |
|
|
return 12;
|
1179 |
|
|
else
|
1180 |
|
|
return 0;
|
1181 |
|
|
|
1182 |
|
|
}
|
1183 |
|
|
|
1184 |
|
|
/* Compute and return the offset of the pretend arguments. The pretend
|
1185 |
|
|
arguments are contiguous with the incoming arguments, and must be
|
1186 |
|
|
correctly aligned. */
|
1187 |
|
|
static int
|
1188 |
|
|
picochip_pretend_arg_area_byte_offset (void)
|
1189 |
|
|
{
|
1190 |
|
|
int base_offset = 0;
|
1191 |
|
|
|
1192 |
|
|
base_offset = (picochip_special_save_area_byte_offset () +
|
1193 |
|
|
picochip_special_save_area_size_in_bytes ());
|
1194 |
|
|
|
1195 |
|
|
gcc_assert(picochip_is_aligned (base_offset, STACK_BOUNDARY));
|
1196 |
|
|
gcc_assert(picochip_is_aligned
|
1197 |
|
|
(base_offset + picochip_pretend_arg_area_size (), STACK_BOUNDARY));
|
1198 |
|
|
|
1199 |
|
|
return base_offset;
|
1200 |
|
|
|
1201 |
|
|
}
|
1202 |
|
|
|
1203 |
|
|
/* Compute and return the offset of the incoming arguments. If a
|
1204 |
|
|
static chain is in use, this will be passed just before the other
|
1205 |
|
|
arguments. This means that the pretend argument mechanism, used in
|
1206 |
|
|
variadic functions, doesn't work properly. Thus, static chains work
|
1207 |
|
|
on their own, as do variadic functions, but not the combination of
|
1208 |
|
|
the two. This isn't really a problem. */
|
1209 |
|
|
static int
|
1210 |
|
|
picochip_arg_area_byte_offset (void)
|
1211 |
|
|
{
|
1212 |
|
|
int base_offset = (picochip_pretend_arg_area_byte_offset () +
|
1213 |
|
|
picochip_pretend_arg_area_size ());
|
1214 |
|
|
|
1215 |
|
|
/* Add an extra 4 bytes - only an extra 16-bits are required, but
|
1216 |
|
|
the alignment on a 32-bit boundary must be maintained. */
|
1217 |
|
|
if (cfun->static_chain_decl != NULL)
|
1218 |
|
|
{
|
1219 |
|
|
gcc_assert (!cfun->stdarg);
|
1220 |
|
|
base_offset += 4;
|
1221 |
|
|
}
|
1222 |
|
|
|
1223 |
|
|
gcc_assert(picochip_is_aligned (base_offset, STACK_BOUNDARY));
|
1224 |
|
|
|
1225 |
|
|
return base_offset;
|
1226 |
|
|
|
1227 |
|
|
}
|
1228 |
|
|
|
1229 |
|
|
int
|
1230 |
|
|
picochip_regno_nregs (int regno ATTRIBUTE_UNUSED, int mode)
|
1231 |
|
|
{
|
1232 |
|
|
|
1233 |
|
|
/* Special case - only one register needed. */
|
1234 |
|
|
if (GET_MODE_CLASS (mode) == MODE_CC)
|
1235 |
|
|
return 1;
|
1236 |
|
|
|
1237 |
|
|
/* We actually do not allocate acc0 ever. But, it seems like we need to
|
1238 |
|
|
make it look like a allocatable register for the dataflow checks to work
|
1239 |
|
|
properly. Note that hard_regno_mode_ok will always return 0 for acc0*/
|
1240 |
|
|
|
1241 |
|
|
if (regno == 16)
|
1242 |
|
|
return 1;
|
1243 |
|
|
|
1244 |
|
|
/* General case - compute how much space in terms of units. */
|
1245 |
|
|
return ((GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD);
|
1246 |
|
|
|
1247 |
|
|
}
|
1248 |
|
|
|
1249 |
|
|
int
|
1250 |
|
|
picochip_class_max_nregs (int reg_class, int mode)
|
1251 |
|
|
{
|
1252 |
|
|
int size = ((GET_MODE_SIZE (mode) + UNITS_PER_WORD - 1) / UNITS_PER_WORD);
|
1253 |
|
|
|
1254 |
|
|
if (reg_class == ACC_REGS)
|
1255 |
|
|
return 1;
|
1256 |
|
|
|
1257 |
|
|
if (GET_MODE_CLASS (mode) == MODE_CC)
|
1258 |
|
|
return 1;
|
1259 |
|
|
else
|
1260 |
|
|
return size;
|
1261 |
|
|
|
1262 |
|
|
}
|
1263 |
|
|
|
1264 |
|
|
/* Eliminate a register that addresses the stack (e.g., frame pointer,
|
1265 |
|
|
argument pointer) by replacing it with a constant offset from the
|
1266 |
|
|
main stack register. */
|
1267 |
|
|
int
|
1268 |
|
|
initial_elimination_offset (int from, int to)
|
1269 |
|
|
{
|
1270 |
|
|
int offset_from_sp = 0;
|
1271 |
|
|
|
1272 |
|
|
if (FRAME_POINTER_REGNUM == from && STACK_POINTER_REGNUM == to)
|
1273 |
|
|
offset_from_sp = picochip_frame_byte_offset ();
|
1274 |
|
|
else if (ARG_POINTER_REGNUM == from && STACK_POINTER_REGNUM == to)
|
1275 |
|
|
offset_from_sp = picochip_pretend_arg_area_byte_offset ();
|
1276 |
|
|
else
|
1277 |
|
|
gcc_unreachable();
|
1278 |
|
|
|
1279 |
|
|
return offset_from_sp;
|
1280 |
|
|
|
1281 |
|
|
}
|
1282 |
|
|
|
1283 |
|
|
/* Compute and return the size of the incoming argument area. */
|
1284 |
|
|
static int
|
1285 |
|
|
picochip_arg_area_size_in_bytes (void)
|
1286 |
|
|
{
|
1287 |
|
|
return crtl->args.size;
|
1288 |
|
|
}
|
1289 |
|
|
|
1290 |
|
|
/* Determine whether the given register is valid. When the strict mode
|
1291 |
|
|
is used, only hard registers are valid, otherwise any register is
|
1292 |
|
|
valid. */
|
1293 |
|
|
static int
|
1294 |
|
|
picochip_legitimate_address_register (rtx x, unsigned strict)
|
1295 |
|
|
{
|
1296 |
|
|
|
1297 |
|
|
/* Sanity check - non-registers shouldn't make it here, but... */
|
1298 |
|
|
if (REG != GET_CODE (x))
|
1299 |
|
|
return 0;
|
1300 |
|
|
|
1301 |
|
|
if (strict)
|
1302 |
|
|
return REGNO (x) < FIRST_NONHARD_REGISTER;
|
1303 |
|
|
else
|
1304 |
|
|
return 1;
|
1305 |
|
|
|
1306 |
|
|
}
|
1307 |
|
|
|
1308 |
|
|
/* Determine whether the given constant is in the range required for
|
1309 |
|
|
the given base register. */
|
1310 |
|
|
static int
|
1311 |
|
|
picochip_const_ok_for_base (enum machine_mode mode, int regno, int offset)
|
1312 |
|
|
{
|
1313 |
|
|
HOST_WIDE_INT corrected_offset;
|
1314 |
|
|
|
1315 |
|
|
if (GET_MODE_SIZE (mode) != 0)
|
1316 |
|
|
{
|
1317 |
|
|
if (GET_MODE_SIZE(mode) <= 4)
|
1318 |
|
|
{
|
1319 |
|
|
/* We used to allow incorrect offsets if strict is 0. But, this would
|
1320 |
|
|
then rely on reload doing the right thing. We have had problems
|
1321 |
|
|
there before, and on > 4.3 compiler, there are no benefits. */
|
1322 |
|
|
if (offset % GET_MODE_SIZE (mode) != 0)
|
1323 |
|
|
return 0;
|
1324 |
|
|
corrected_offset = offset / GET_MODE_SIZE (mode);
|
1325 |
|
|
}
|
1326 |
|
|
else
|
1327 |
|
|
{
|
1328 |
|
|
if (offset % 4 != 0)
|
1329 |
|
|
return 0;
|
1330 |
|
|
corrected_offset = offset / 4;
|
1331 |
|
|
}
|
1332 |
|
|
}
|
1333 |
|
|
else
|
1334 |
|
|
{
|
1335 |
|
|
/* Default to the byte offset as supplied. */
|
1336 |
|
|
corrected_offset = offset;
|
1337 |
|
|
}
|
1338 |
|
|
|
1339 |
|
|
/* The offset from the base register can be different depending upon
|
1340 |
|
|
the base register. The stack/frame/argument pointer offsets can
|
1341 |
|
|
all be greater than a simple register-based offset. Note that the
|
1342 |
|
|
frame/argument pointer registers are actually eliminations of the
|
1343 |
|
|
stack pointer, so a value which is valid for an offset to, for
|
1344 |
|
|
example, the frame pointer, might be invalid for the stack
|
1345 |
|
|
pointer once the elimination has occurred. However, there is no
|
1346 |
|
|
need to handle this special case here, as the stack offset is
|
1347 |
|
|
always checked after elimination anyway, and the generated code
|
1348 |
|
|
seems to have identical performance. */
|
1349 |
|
|
if (regno == STACK_POINTER_REGNUM ||
|
1350 |
|
|
regno == FRAME_POINTER_REGNUM || regno == ARG_POINTER_REGNUM)
|
1351 |
|
|
return picochip_const_ok_for_letter_p (corrected_offset, 'K');
|
1352 |
|
|
else
|
1353 |
|
|
return picochip_const_ok_for_letter_p (corrected_offset, 'J');
|
1354 |
|
|
|
1355 |
|
|
}
|
1356 |
|
|
|
1357 |
|
|
/* Determine whether a given rtx is a legitimate address for machine_mode
|
1358 |
|
|
MODE. STRICT is non-zero if we're being strict - any pseudo that
|
1359 |
|
|
is not a hard register must be a memory reference. */
|
1360 |
|
|
bool
|
1361 |
|
|
picochip_legitimate_address_p (enum machine_mode mode, rtx x, bool strict)
|
1362 |
|
|
{
|
1363 |
|
|
int valid = 0;
|
1364 |
|
|
|
1365 |
|
|
switch (GET_CODE (x))
|
1366 |
|
|
{
|
1367 |
|
|
case REG:
|
1368 |
|
|
valid = picochip_legitimate_address_register (x, strict);
|
1369 |
|
|
break;
|
1370 |
|
|
|
1371 |
|
|
case PLUS:
|
1372 |
|
|
{
|
1373 |
|
|
rtx base = XEXP (x, 0);
|
1374 |
|
|
rtx offset = XEXP (x, 1);
|
1375 |
|
|
if (strict && !REGNO_OK_FOR_BASE_P (REGNO(base)))
|
1376 |
|
|
{
|
1377 |
|
|
valid = 0;
|
1378 |
|
|
break;
|
1379 |
|
|
}
|
1380 |
|
|
|
1381 |
|
|
valid = (REG == GET_CODE (base) &&
|
1382 |
|
|
picochip_legitimate_address_register (base, strict) &&
|
1383 |
|
|
CONST_INT == GET_CODE (offset) &&
|
1384 |
|
|
picochip_const_ok_for_base (mode, REGNO (base),
|
1385 |
|
|
INTVAL (offset)));
|
1386 |
|
|
break;
|
1387 |
|
|
}
|
1388 |
|
|
|
1389 |
|
|
case SYMBOL_REF:
|
1390 |
|
|
/* The user can select whether a symbol can be used as a memory
|
1391 |
|
|
address. Typically, this will decrease execution time (no
|
1392 |
|
|
register load is required first), but will increase code size
|
1393 |
|
|
(because the symbol will be used several times, rather than
|
1394 |
|
|
loaded once into a register.*/
|
1395 |
|
|
valid = TARGET_SYMBOL_AS_ADDRESS;
|
1396 |
|
|
break;
|
1397 |
|
|
|
1398 |
|
|
case CONST:
|
1399 |
|
|
{
|
1400 |
|
|
/* A constant memory address must be a (plus (symbol_ref)
|
1401 |
|
|
(const_int)), and is only allowed when the symbols are
|
1402 |
|
|
permitted addresses. */
|
1403 |
|
|
rtx inner = XEXP (x, 0);
|
1404 |
|
|
|
1405 |
|
|
valid = (TARGET_SYMBOL_AS_ADDRESS &&
|
1406 |
|
|
PLUS == GET_CODE (inner) &&
|
1407 |
|
|
SYMBOL_REF == GET_CODE (XEXP (inner, 0)) &&
|
1408 |
|
|
CONST_INT == GET_CODE (XEXP (inner, 1)));
|
1409 |
|
|
|
1410 |
|
|
break;
|
1411 |
|
|
|
1412 |
|
|
}
|
1413 |
|
|
|
1414 |
|
|
default:
|
1415 |
|
|
valid = 0;
|
1416 |
|
|
}
|
1417 |
|
|
|
1418 |
|
|
return valid;
|
1419 |
|
|
|
1420 |
|
|
}
|
1421 |
|
|
|
1422 |
|
|
/* For all memory operations, picochip allows a uconst4 offset value. It
|
1423 |
|
|
is hence beneficial to turn an
|
1424 |
|
|
addr = <reg + long_const>
|
1425 |
|
|
ld/st addr
|
1426 |
|
|
|
1427 |
|
|
into
|
1428 |
|
|
|
1429 |
|
|
X = reg + long_const & FFF0
|
1430 |
|
|
diff = long_const - (long_const & FFF0)
|
1431 |
|
|
ld/st <X + diff>
|
1432 |
|
|
|
1433 |
|
|
X can be reused in subsequent memory operations.
|
1434 |
|
|
*/
|
1435 |
|
|
rtx
|
1436 |
|
|
picochip_legitimize_address (rtx x, rtx oldx ATTRIBUTE_UNUSED,
|
1437 |
|
|
enum machine_mode mode)
|
1438 |
|
|
{
|
1439 |
|
|
unsigned mask_val;
|
1440 |
|
|
|
1441 |
|
|
if (!optimize)
|
1442 |
|
|
return x;
|
1443 |
|
|
|
1444 |
|
|
/* Depending on mode, the offsets allowed are either 16/32/64.*/
|
1445 |
|
|
switch (mode)
|
1446 |
|
|
{
|
1447 |
|
|
case QImode:
|
1448 |
|
|
mask_val = 0xFFF0;
|
1449 |
|
|
break;
|
1450 |
|
|
case HImode:
|
1451 |
|
|
mask_val = 0xFFE0;
|
1452 |
|
|
break;
|
1453 |
|
|
case SImode:
|
1454 |
|
|
mask_val = 0xFFC0;
|
1455 |
|
|
break;
|
1456 |
|
|
default:
|
1457 |
|
|
return x;
|
1458 |
|
|
}
|
1459 |
|
|
|
1460 |
|
|
if (GET_CODE (x) == PLUS
|
1461 |
|
|
&& GET_CODE (XEXP (x, 0)) == REG
|
1462 |
|
|
&& GET_CODE (XEXP (x, 1)) == CONST_INT)
|
1463 |
|
|
{
|
1464 |
|
|
int high_val, low_val, offset;
|
1465 |
|
|
offset = INTVAL (XEXP (x, 1));
|
1466 |
|
|
/* Ignore cases with negative offsets. */
|
1467 |
|
|
if (offset < 0)
|
1468 |
|
|
return x;
|
1469 |
|
|
high_val = offset & mask_val;
|
1470 |
|
|
low_val = offset - high_val;
|
1471 |
|
|
if (high_val != 0)
|
1472 |
|
|
{
|
1473 |
|
|
rtx temp_reg = force_reg (Pmode, gen_rtx_PLUS (Pmode, XEXP (x, 0), GEN_INT(high_val)));
|
1474 |
|
|
x = gen_rtx_PLUS (Pmode, temp_reg, GEN_INT(low_val));
|
1475 |
|
|
return x;
|
1476 |
|
|
}
|
1477 |
|
|
}
|
1478 |
|
|
return x;
|
1479 |
|
|
}
|
1480 |
|
|
|
1481 |
|
|
/* For all memory operations, picochip allows a uconst4 offset value. It
|
1482 |
|
|
is hence beneficial to turn an
|
1483 |
|
|
addr = <reg + long_const>
|
1484 |
|
|
ld/st addr
|
1485 |
|
|
|
1486 |
|
|
into
|
1487 |
|
|
|
1488 |
|
|
X = reg + long_const & FFF0
|
1489 |
|
|
diff = long_const - (long_const & FFF0)
|
1490 |
|
|
ld/st <X + diff>
|
1491 |
|
|
|
1492 |
|
|
X can be reused in subsequent memory operations.
|
1493 |
|
|
*/
|
1494 |
|
|
int
|
1495 |
|
|
picochip_legitimize_reload_address (rtx *x,
|
1496 |
|
|
enum machine_mode mode,
|
1497 |
|
|
int opnum, int type,
|
1498 |
|
|
int ind_levels ATTRIBUTE_UNUSED)
|
1499 |
|
|
{
|
1500 |
|
|
unsigned mask_val;
|
1501 |
|
|
|
1502 |
|
|
if (picochip_symbol_offset(*x))
|
1503 |
|
|
{
|
1504 |
|
|
*x = gen_rtx_CONST(mode, *x);
|
1505 |
|
|
return 0;
|
1506 |
|
|
}
|
1507 |
|
|
if (!optimize)
|
1508 |
|
|
return 0;
|
1509 |
|
|
|
1510 |
|
|
/* We should recognise addresses that we created.*/
|
1511 |
|
|
if (GET_CODE (*x) == PLUS
|
1512 |
|
|
&& GET_CODE (XEXP (*x, 0)) == PLUS
|
1513 |
|
|
&& GET_CODE (XEXP (XEXP (*x, 0), 0)) == REG
|
1514 |
|
|
&& GET_CODE (XEXP (XEXP (*x, 0), 1)) == CONST_INT
|
1515 |
|
|
&& GET_CODE (XEXP (*x, 1)) == CONST_INT)
|
1516 |
|
|
{
|
1517 |
|
|
push_reload (XEXP (*x, 0), NULL_RTX, &XEXP (*x, 0), NULL,
|
1518 |
|
|
BASE_REG_CLASS, GET_MODE (*x), VOIDmode, 0, 0,
|
1519 |
|
|
opnum, (enum reload_type)type);
|
1520 |
|
|
return 1;
|
1521 |
|
|
}
|
1522 |
|
|
|
1523 |
|
|
/* Depending on mode, the offsets allowed are either 16/32/64. */
|
1524 |
|
|
switch (mode)
|
1525 |
|
|
{
|
1526 |
|
|
case QImode:
|
1527 |
|
|
mask_val = 0xFFF0;
|
1528 |
|
|
break;
|
1529 |
|
|
case HImode:
|
1530 |
|
|
mask_val = 0xFFE0;
|
1531 |
|
|
break;
|
1532 |
|
|
case SImode:
|
1533 |
|
|
mask_val = 0xFFC0;
|
1534 |
|
|
break;
|
1535 |
|
|
default:
|
1536 |
|
|
return 0;
|
1537 |
|
|
}
|
1538 |
|
|
|
1539 |
|
|
if (GET_CODE (*x) == PLUS
|
1540 |
|
|
&& GET_CODE (XEXP (*x, 0)) == REG
|
1541 |
|
|
&& GET_CODE (XEXP (*x, 1)) == CONST_INT)
|
1542 |
|
|
{
|
1543 |
|
|
int high_val, low_val, offset;
|
1544 |
|
|
offset = INTVAL (XEXP (*x, 1));
|
1545 |
|
|
/* Ignore cases with negative offsets. */
|
1546 |
|
|
if (offset < 0)
|
1547 |
|
|
return 0;
|
1548 |
|
|
high_val = offset & mask_val;
|
1549 |
|
|
low_val = offset - high_val;
|
1550 |
|
|
if (high_val != 0)
|
1551 |
|
|
{
|
1552 |
|
|
rtx temp_reg = gen_rtx_PLUS (Pmode, XEXP (*x, 0), GEN_INT(high_val));
|
1553 |
|
|
*x = gen_rtx_PLUS (Pmode, temp_reg, GEN_INT(low_val));
|
1554 |
|
|
push_reload (XEXP (*x, 0), NULL_RTX, &XEXP (*x, 0), NULL,
|
1555 |
|
|
BASE_REG_CLASS, GET_MODE (*x), VOIDmode, 0, 0,
|
1556 |
|
|
opnum, (enum reload_type)type);
|
1557 |
|
|
return 1;
|
1558 |
|
|
}
|
1559 |
|
|
}
|
1560 |
|
|
|
1561 |
|
|
return 0;
|
1562 |
|
|
}
|
1563 |
|
|
|
1564 |
|
|
/* Detect an rtx which matches (plus (symbol_ref) (const_int)). */
|
1565 |
|
|
int
|
1566 |
|
|
picochip_symbol_offset (rtx operand)
|
1567 |
|
|
{
|
1568 |
|
|
|
1569 |
|
|
return (PLUS == GET_CODE (operand) &&
|
1570 |
|
|
SYMBOL_REF == GET_CODE (XEXP (operand, 0)) &&
|
1571 |
|
|
CONST_INT == GET_CODE (XEXP (operand, 1)));
|
1572 |
|
|
|
1573 |
|
|
}
|
1574 |
|
|
|
1575 |
|
|
/* Assembly output. */
|
1576 |
|
|
|
1577 |
|
|
/* The format here should match the format used in the output of
|
1578 |
|
|
symbol_ref's elsewhere in this file. */
|
1579 |
|
|
void
|
1580 |
|
|
picochip_output_label (FILE * stream, const char name[])
|
1581 |
|
|
{
|
1582 |
|
|
int is_cfi_label = (strncmp (name, "picoMark_LCFI", 13) == 0);
|
1583 |
|
|
|
1584 |
|
|
/* If VLIW scheduling is in use, any Call Frame Information labels
|
1585 |
|
|
generated inside a packet must have their output deferred until
|
1586 |
|
|
the end of the packet. */
|
1587 |
|
|
if (picochip_schedule_type == DFA_TYPE_SPEED &&
|
1588 |
|
|
is_cfi_label && picochip_vliw_continuation)
|
1589 |
|
|
{
|
1590 |
|
|
if (picochip_current_vliw_state.num_cfi_labels_deferred == 2)
|
1591 |
|
|
{
|
1592 |
|
|
internal_error ("LCFI labels have already been deferred");
|
1593 |
|
|
}
|
1594 |
|
|
strcpy (picochip_current_vliw_state.cfi_label_name[
|
1595 |
|
|
picochip_current_vliw_state.num_cfi_labels_deferred], name);
|
1596 |
|
|
picochip_current_vliw_state.num_cfi_labels_deferred++;
|
1597 |
|
|
}
|
1598 |
|
|
else
|
1599 |
|
|
{
|
1600 |
|
|
assemble_name (stream, name);
|
1601 |
|
|
|
1602 |
|
|
if (strncmp (name, "picoMark_", 9) == 0)
|
1603 |
|
|
fprintf (stream, "=\n");
|
1604 |
|
|
else
|
1605 |
|
|
fprintf (stream, ":\n");
|
1606 |
|
|
|
1607 |
|
|
}
|
1608 |
|
|
|
1609 |
|
|
}
|
1610 |
|
|
|
1611 |
|
|
/* The format here should match the format used in the output of
|
1612 |
|
|
symbol_ref's elsewhere in this file. */
|
1613 |
|
|
void
|
1614 |
|
|
picochip_output_labelref (FILE * stream, const char name[])
|
1615 |
|
|
{
|
1616 |
|
|
fprintf (stream, "_%s", name);
|
1617 |
|
|
}
|
1618 |
|
|
|
1619 |
|
|
void
|
1620 |
|
|
picochip_weaken_label (FILE * stream, const char name[])
|
1621 |
|
|
{
|
1622 |
|
|
fprintf (stream, ".weak ");
|
1623 |
|
|
assemble_name (stream, name);
|
1624 |
|
|
fprintf (stream, "\n");
|
1625 |
|
|
}
|
1626 |
|
|
|
1627 |
|
|
/* Return true if the given label (or label prefix) denotes a marker
|
1628 |
|
|
label which should be emitted in the form LABEL= */
|
1629 |
|
|
static int
|
1630 |
|
|
picochip_is_marker_prefix (const char *prefix)
|
1631 |
|
|
{
|
1632 |
|
|
return (strcmp (prefix, "L") != 0 && strcmp (prefix, "LC") != 0
|
1633 |
|
|
&& strcmp (prefix, "LP") != 0);
|
1634 |
|
|
}
|
1635 |
|
|
|
1636 |
|
|
void
|
1637 |
|
|
picochip_output_internal_label (FILE * stream, const char *prefix,
|
1638 |
|
|
unsigned long num)
|
1639 |
|
|
{
|
1640 |
|
|
|
1641 |
|
|
/* Emit different types of label, based upon their prefix. They
|
1642 |
|
|
are handled differently to allow the assembler to ensure that
|
1643 |
|
|
branch target labels are properly aligned, while other labels
|
1644 |
|
|
will only serve as code markers, not branch targets. Aligning
|
1645 |
|
|
labels unnecessarily can result in much code wastage. */
|
1646 |
|
|
if (picochip_is_marker_prefix (prefix))
|
1647 |
|
|
{
|
1648 |
|
|
/* Special label marker. If it appears in the middle of a VLIW
|
1649 |
|
|
packet, defer it until the end of the packet. There has
|
1650 |
|
|
never been a need to handle more than one lm label at a time. */
|
1651 |
|
|
if (picochip_schedule_type == DFA_TYPE_SPEED &&
|
1652 |
|
|
(strcmp (prefix, "LM")) == 0 && picochip_vliw_continuation)
|
1653 |
|
|
{
|
1654 |
|
|
if (strlen (picochip_current_vliw_state.lm_label_name) != 0)
|
1655 |
|
|
internal_error ("LM label has already been deferred");
|
1656 |
|
|
|
1657 |
|
|
sprintf (picochip_current_vliw_state.lm_label_name,
|
1658 |
|
|
"picoMark_%s%ld", prefix, num);
|
1659 |
|
|
}
|
1660 |
|
|
else if (picochip_schedule_type == DFA_TYPE_SPEED &&
|
1661 |
|
|
(strcmp (prefix, "LCFI")) == 0 && picochip_vliw_continuation)
|
1662 |
|
|
{
|
1663 |
|
|
if (picochip_current_vliw_state.num_cfi_labels_deferred == 2)
|
1664 |
|
|
{
|
1665 |
|
|
internal_error ("LCFI labels have already been deferred.");
|
1666 |
|
|
}
|
1667 |
|
|
sprintf(picochip_current_vliw_state.cfi_label_name[
|
1668 |
|
|
picochip_current_vliw_state.num_cfi_labels_deferred],
|
1669 |
|
|
"picoMark_%s%ld", prefix, num);
|
1670 |
|
|
picochip_current_vliw_state.num_cfi_labels_deferred++;
|
1671 |
|
|
}
|
1672 |
|
|
else
|
1673 |
|
|
{
|
1674 |
|
|
/* Marker label. */
|
1675 |
|
|
fprintf (stream, "_picoMark_%s%ld=\n", prefix, num);
|
1676 |
|
|
}
|
1677 |
|
|
|
1678 |
|
|
}
|
1679 |
|
|
else
|
1680 |
|
|
{
|
1681 |
|
|
/* Normal label. */
|
1682 |
|
|
fprintf (stream, "_%s%ld:\n", prefix, num);
|
1683 |
|
|
}
|
1684 |
|
|
|
1685 |
|
|
}
|
1686 |
|
|
|
1687 |
|
|
void
|
1688 |
|
|
picochip_generate_internal_label (char *str, const char *prefix, long num)
|
1689 |
|
|
{
|
1690 |
|
|
/* Two types of internal label can be generated: branch target
|
1691 |
|
|
labels and code marker labels. Branch target labels must always
|
1692 |
|
|
be aligned (since code will execute at these
|
1693 |
|
|
points). Differentiate between the two by prepending markers with
|
1694 |
|
|
a unique prefix, which can later be used in output_label to
|
1695 |
|
|
figure out which label syntax to use. */
|
1696 |
|
|
if (picochip_is_marker_prefix (prefix))
|
1697 |
|
|
sprintf (str, "picoMark_%s%ld", prefix, num);
|
1698 |
|
|
else
|
1699 |
|
|
sprintf (str, "%s%ld", prefix, num);
|
1700 |
|
|
|
1701 |
|
|
}
|
1702 |
|
|
|
1703 |
|
|
void
|
1704 |
|
|
picochip_asm_output_anchor (rtx symbol)
|
1705 |
|
|
{
|
1706 |
|
|
fprintf (asm_out_file, ".offsetData _%s, ",XSTR (symbol, 0));
|
1707 |
|
|
fprintf (asm_out_file, "+ " HOST_WIDE_INT_PRINT_DEC"\n",SYMBOL_REF_BLOCK_OFFSET(symbol));
|
1708 |
|
|
}
|
1709 |
|
|
|
1710 |
|
|
void
|
1711 |
|
|
picochip_output_aligned_common (FILE * stream, const char *name,
|
1712 |
|
|
unsigned size, unsigned alignment)
|
1713 |
|
|
{
|
1714 |
|
|
|
1715 |
|
|
fprintf (stream, ".commonData ");
|
1716 |
|
|
assemble_name (stream, name);
|
1717 |
|
|
fprintf (stream, ", %u, %u\n", size, alignment / 8);
|
1718 |
|
|
picochip_output_global (stream, name);
|
1719 |
|
|
|
1720 |
|
|
}
|
1721 |
|
|
|
1722 |
|
|
void
|
1723 |
|
|
picochip_output_aligned_local (FILE * stream, const char *name,
|
1724 |
|
|
unsigned size, unsigned alignment)
|
1725 |
|
|
{
|
1726 |
|
|
|
1727 |
|
|
fprintf (stream, ".commonData ");
|
1728 |
|
|
assemble_name (stream, name);
|
1729 |
|
|
fprintf (stream, ", %u, %u\n", size, alignment / 8);
|
1730 |
|
|
|
1731 |
|
|
}
|
1732 |
|
|
|
1733 |
|
|
void
|
1734 |
|
|
picochip_output_global (FILE * stream, const char *name)
|
1735 |
|
|
{
|
1736 |
|
|
fprintf (stream, ".global ");
|
1737 |
|
|
assemble_name (stream, name);
|
1738 |
|
|
fprintf (stream, "\n");
|
1739 |
|
|
}
|
1740 |
|
|
|
1741 |
|
|
/* Output an assembly language string. Output as a sequence of decimal
|
1742 |
|
|
numbers, followed by the literal string to make it obvious what the
|
1743 |
|
|
numbers represent. */
|
1744 |
|
|
void
|
1745 |
|
|
picochip_output_ascii (FILE * file, const char *str, int length)
|
1746 |
|
|
{
|
1747 |
|
|
int i = 0;
|
1748 |
|
|
|
1749 |
|
|
fprintf (file, ".ascii ");
|
1750 |
|
|
|
1751 |
|
|
for (i = 0; i < length; ++i)
|
1752 |
|
|
{
|
1753 |
|
|
fprintf (file, "16#%x# ", (char) (str[i]));
|
1754 |
|
|
}
|
1755 |
|
|
|
1756 |
|
|
fprintf (file, " ; ");
|
1757 |
|
|
|
1758 |
|
|
for (i = 0; i < length; ++i)
|
1759 |
|
|
{
|
1760 |
|
|
char c = str[i];
|
1761 |
|
|
|
1762 |
|
|
switch (c)
|
1763 |
|
|
{
|
1764 |
|
|
case '\n':
|
1765 |
|
|
fprintf (file, "\\n");
|
1766 |
|
|
break;
|
1767 |
|
|
case '\t':
|
1768 |
|
|
fprintf (file, "\\t");
|
1769 |
|
|
break;
|
1770 |
|
|
case '\0':
|
1771 |
|
|
fprintf (file, "\\0");
|
1772 |
|
|
break;
|
1773 |
|
|
default:
|
1774 |
|
|
fprintf (file, "%c", c);
|
1775 |
|
|
}
|
1776 |
|
|
|
1777 |
|
|
}
|
1778 |
|
|
|
1779 |
|
|
fprintf (file, "\n");
|
1780 |
|
|
|
1781 |
|
|
}
|
1782 |
|
|
|
1783 |
|
|
/* Output the beginning of an ASM file. */
|
1784 |
|
|
void
|
1785 |
|
|
picochip_asm_file_start (void)
|
1786 |
|
|
{
|
1787 |
|
|
default_file_start ();
|
1788 |
|
|
|
1789 |
|
|
fprintf (asm_out_file, "// picoChip ASM file\n");
|
1790 |
|
|
fprintf (asm_out_file, "//.file \"%s\"\n", main_input_filename);
|
1791 |
|
|
|
1792 |
|
|
fprintf (asm_out_file, "// Has byte access: %s\n",
|
1793 |
|
|
(TARGET_HAS_BYTE_ACCESS ? "Yes" : "No"));
|
1794 |
|
|
|
1795 |
|
|
if (TARGET_HAS_MUL_UNIT)
|
1796 |
|
|
fprintf (asm_out_file, "// Has multiply: Yes (Multiply unit)\n");
|
1797 |
|
|
else if (TARGET_HAS_MAC_UNIT)
|
1798 |
|
|
fprintf (asm_out_file, "// Has multiply: Yes (Mac unit)\n");
|
1799 |
|
|
else
|
1800 |
|
|
fprintf (asm_out_file, "// Has multiply: No\n");
|
1801 |
|
|
}
|
1802 |
|
|
|
1803 |
|
|
/* Output the end of an ASM file. */
|
1804 |
|
|
void
|
1805 |
|
|
picochip_asm_file_end (void)
|
1806 |
|
|
{
|
1807 |
|
|
/* Include a segment end to make it easy for PERL scripts to grab
|
1808 |
|
|
segments. This is now done by assembler*/
|
1809 |
|
|
|
1810 |
|
|
fprintf (asm_out_file, "// End of picoChip ASM file\n");
|
1811 |
|
|
|
1812 |
|
|
}
|
1813 |
|
|
|
1814 |
|
|
/* Output frame debug information to the given stream. */
|
1815 |
|
|
static void
|
1816 |
|
|
picochip_output_frame_debug (FILE * file)
|
1817 |
|
|
{
|
1818 |
|
|
int i = 0;
|
1819 |
|
|
|
1820 |
|
|
if (current_function_is_leaf)
|
1821 |
|
|
fprintf (file, "\t\t// Leaf function\n");
|
1822 |
|
|
else
|
1823 |
|
|
fprintf (file, "\t\t// Non-leaf function\n");
|
1824 |
|
|
|
1825 |
|
|
if (picochip_can_eliminate_link_sp_save ())
|
1826 |
|
|
fprintf (file, "\t\t// Link/fp save/restore can be eliminated\n");
|
1827 |
|
|
|
1828 |
|
|
if (cfun->static_chain_decl != NULL)
|
1829 |
|
|
fprintf (file, "\t\t// Static chain in use\n");
|
1830 |
|
|
|
1831 |
|
|
fprintf (file, "\t\t// Incoming argument size: %d bytes\n",
|
1832 |
|
|
picochip_arg_area_size_in_bytes ());
|
1833 |
|
|
fprintf (file, "\t\t// Incoming arg offset: %d\n",
|
1834 |
|
|
picochip_arg_area_byte_offset ());
|
1835 |
|
|
fprintf (file, "\t\t// Pretend arg size: %d\n",
|
1836 |
|
|
picochip_pretend_arg_area_size ());
|
1837 |
|
|
fprintf (file, "\t\t// Pretend arg offset (ARGP): %d\n",
|
1838 |
|
|
picochip_pretend_arg_area_byte_offset ());
|
1839 |
|
|
fprintf (file, "\t\t// Special reg area size: %d bytes\n",
|
1840 |
|
|
picochip_special_save_area_size_in_bytes ());
|
1841 |
|
|
fprintf (file, "\t\t// Special reg area offset: %d\n",
|
1842 |
|
|
picochip_special_save_area_byte_offset ());
|
1843 |
|
|
|
1844 |
|
|
/* Output which registers are saved. */
|
1845 |
|
|
fprintf (file, "\t\t// Saved regs: ");
|
1846 |
|
|
for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
|
1847 |
|
|
{
|
1848 |
|
|
if (picochip_reg_needs_saving (i))
|
1849 |
|
|
fprintf (file, "%s ", picochip_regnames[i]);
|
1850 |
|
|
}
|
1851 |
|
|
fprintf (file, "\t\t\n");
|
1852 |
|
|
|
1853 |
|
|
fprintf (file, "\t\t// Save area size: %d bytes\n",
|
1854 |
|
|
picochip_save_area_size_in_bytes ());
|
1855 |
|
|
fprintf (file, "\t\t// Save area offset: %d\n",
|
1856 |
|
|
picochip_save_area_byte_offset ());
|
1857 |
|
|
|
1858 |
|
|
fprintf (file, "\t\t// Frame size: %ld bytes\n", get_frame_size ());
|
1859 |
|
|
fprintf (file, "\t\t// Frame offset (FP): %d\n",
|
1860 |
|
|
picochip_frame_byte_offset ());
|
1861 |
|
|
|
1862 |
|
|
fprintf (file, "\t\t// Outgoing argument area size: %d bytes\n",
|
1863 |
|
|
crtl->outgoing_args_size);
|
1864 |
|
|
|
1865 |
|
|
}
|
1866 |
|
|
|
1867 |
|
|
/* Output picoChip function prologue. This contains human-readable
|
1868 |
|
|
information about the function. */
|
1869 |
|
|
void
|
1870 |
|
|
picochip_function_prologue (FILE * file, HOST_WIDE_INT size ATTRIBUTE_UNUSED)
|
1871 |
|
|
{
|
1872 |
|
|
/* Get the function's name, as described by its RTL. This may be
|
1873 |
|
|
different from the DECL_NAME name used in the source file. The
|
1874 |
|
|
real declaration name must be used, to ensure that the prologue
|
1875 |
|
|
emits the right information for the linker. */
|
1876 |
|
|
rtx x;
|
1877 |
|
|
const char *fnname;
|
1878 |
|
|
x = DECL_RTL (current_function_decl);
|
1879 |
|
|
gcc_assert (MEM_P (x));
|
1880 |
|
|
x = XEXP (x, 0);
|
1881 |
|
|
gcc_assert (GET_CODE (x) == SYMBOL_REF);
|
1882 |
|
|
fnname = XSTR (x, 0);
|
1883 |
|
|
|
1884 |
|
|
/* Note that the name of the function is given in the &_%s
|
1885 |
|
|
form. This matches the name of the function as used in labels,
|
1886 |
|
|
and function calls, and enables processCallGraph to match
|
1887 |
|
|
function calls to the name of the function, as defined here. */
|
1888 |
|
|
fprintf (file, "// picoChip Function Prologue : &_%s = %d bytes\n",
|
1889 |
|
|
fnname, picochip_arg_area_byte_offset ());
|
1890 |
|
|
|
1891 |
|
|
picochip_output_frame_debug (file);
|
1892 |
|
|
fprintf (file, "\n");
|
1893 |
|
|
|
1894 |
|
|
}
|
1895 |
|
|
|
1896 |
|
|
/* Output picoChip function epilogue. */
|
1897 |
|
|
void
|
1898 |
|
|
picochip_function_epilogue (FILE * file, HOST_WIDE_INT size ATTRIBUTE_UNUSED)
|
1899 |
|
|
{
|
1900 |
|
|
|
1901 |
|
|
rtx x;
|
1902 |
|
|
const char *fnname;
|
1903 |
|
|
x = DECL_RTL (current_function_decl);
|
1904 |
|
|
gcc_assert (MEM_P (x));
|
1905 |
|
|
x = XEXP (x, 0);
|
1906 |
|
|
gcc_assert (GET_CODE (x) == SYMBOL_REF);
|
1907 |
|
|
fnname = XSTR (x, 0);
|
1908 |
|
|
fprintf (file, "\n// picoChip Function Epilogue : %s\n\n",
|
1909 |
|
|
fnname);
|
1910 |
|
|
}
|
1911 |
|
|
|
1912 |
|
|
/* Manipulate the asm output. Some machines only execute the code when
|
1913 |
|
|
there is actually a chance of needing it (e.g., FRV doesn't execute
|
1914 |
|
|
it if the scheduling pass wasn't used). We always execute it,
|
1915 |
|
|
simple to ensure that it is exercised more often, and bugs are more
|
1916 |
|
|
likely to be found.
|
1917 |
|
|
|
1918 |
|
|
This function's prime reason for existence is to insert the VLIW
|
1919 |
|
|
separators where appropriate. The separators must be inserted
|
1920 |
|
|
before any comments which appear at the end of the file.
|
1921 |
|
|
|
1922 |
|
|
*/
|
1923 |
|
|
const char *
|
1924 |
|
|
picochip_asm_output_opcode (FILE * f, const char *ptr)
|
1925 |
|
|
{
|
1926 |
|
|
int c;
|
1927 |
|
|
|
1928 |
|
|
/* Flag to specify when a VLIW continuation has been inserted onto
|
1929 |
|
|
the line. Continuations are either inserted before any comments,
|
1930 |
|
|
or before the end of the line is reached. The flag ensures that
|
1931 |
|
|
we don't insert continuations twice (i.e., at the comment and the
|
1932 |
|
|
end of line). */
|
1933 |
|
|
int continuation_inserted = 0;
|
1934 |
|
|
|
1935 |
|
|
/* If the instruction uses multiple lines (i.e., a new line
|
1936 |
|
|
character appears in the opcode), then ensure that no attempt is
|
1937 |
|
|
made to pack it into a VLIW. */
|
1938 |
|
|
if (strchr (ptr, '\n') != NULL && picochip_vliw_continuation)
|
1939 |
|
|
internal_error
|
1940 |
|
|
("picochip_asm_output_opcode - Found multiple lines in VLIW packet %s",
|
1941 |
|
|
ptr);
|
1942 |
|
|
|
1943 |
|
|
|
1944 |
|
|
/* If a delay slot is pending, output the directive to the assembler
|
1945 |
|
|
before the instruction. */
|
1946 |
|
|
if (picochip_is_delay_slot_pending)
|
1947 |
|
|
{
|
1948 |
|
|
picochip_is_delay_slot_pending = 0;
|
1949 |
|
|
fputs ("=->\t", f);
|
1950 |
|
|
}
|
1951 |
|
|
|
1952 |
|
|
/* Keep going for entire opcode. All substitution performed ourselves. */
|
1953 |
|
|
while (*ptr)
|
1954 |
|
|
{
|
1955 |
|
|
c = *ptr++;
|
1956 |
|
|
|
1957 |
|
|
/* Determine whether a VLIW continuation must be inserted before
|
1958 |
|
|
any comments, or the end of the opcode. A flag is set to show
|
1959 |
|
|
that we have inserted a continuation on this line, so that we
|
1960 |
|
|
don't try to insert another continuation when the end of the
|
1961 |
|
|
opcode is reached. The only other case for a continuation
|
1962 |
|
|
might have been a newline, but these aren't allowed in
|
1963 |
|
|
conjunction with VLIW continuations (see above code). */
|
1964 |
|
|
if (picochip_vliw_continuation &&
|
1965 |
|
|
!continuation_inserted &&
|
1966 |
|
|
((c == '/' && (*ptr == '/')) || *ptr == '\0'))
|
1967 |
|
|
{
|
1968 |
|
|
fprintf (f, "\\ ");
|
1969 |
|
|
continuation_inserted = 1;
|
1970 |
|
|
}
|
1971 |
|
|
|
1972 |
|
|
/* Detect an explicit VLIW separator. */
|
1973 |
|
|
if (c == '%' && (*ptr == '|'))
|
1974 |
|
|
{
|
1975 |
|
|
fprintf (f, "\\");
|
1976 |
|
|
ptr++;
|
1977 |
|
|
}
|
1978 |
|
|
/* Detect the need for an ALU id operand. */
|
1979 |
|
|
else if (c == '%' && (*ptr == '#'))
|
1980 |
|
|
{
|
1981 |
|
|
fputc (picochip_get_vliw_alu_id (), f);
|
1982 |
|
|
|
1983 |
|
|
if (TARGET_DEBUG)
|
1984 |
|
|
printf ("Generated ALU char at %s for insn %d\n", ptr,
|
1985 |
|
|
INSN_UID (picochip_current_prescan_insn));
|
1986 |
|
|
|
1987 |
|
|
/* Skip past unwanted # */
|
1988 |
|
|
ptr++;
|
1989 |
|
|
}
|
1990 |
|
|
/* Detect the need for branch delay slot. */
|
1991 |
|
|
else if (c == '%' && (*ptr == '>'))
|
1992 |
|
|
{
|
1993 |
|
|
/* Only emit delay slots (NOP's, or otherwise) when delay
|
1994 |
|
|
* slot scheduling has actually been enabled, otherwise VLIW
|
1995 |
|
|
* scheduling and delay slot scheduling output combine to
|
1996 |
|
|
* produce nasty effects. */
|
1997 |
|
|
if (flag_delayed_branch)
|
1998 |
|
|
{
|
1999 |
|
|
if (dbr_sequence_length () == 0)
|
2000 |
|
|
fputs ("\n=->\tNOP", f);
|
2001 |
|
|
else
|
2002 |
|
|
picochip_is_delay_slot_pending = 1;
|
2003 |
|
|
}
|
2004 |
|
|
|
2005 |
|
|
/* Skip past unwanted > */
|
2006 |
|
|
ptr++;
|
2007 |
|
|
}
|
2008 |
|
|
/* Detect any %digit specifiers. */
|
2009 |
|
|
else if (c == '%' && (*ptr >= '0' && *ptr <= '9'))
|
2010 |
|
|
{
|
2011 |
|
|
c = atoi (ptr);
|
2012 |
|
|
picochip_print_operand (f, recog_data.operand[c], 0);
|
2013 |
|
|
while ((c = *ptr) >= '0' && c <= '9')
|
2014 |
|
|
ptr++;
|
2015 |
|
|
}
|
2016 |
|
|
/* Detect any %letterdigit specifiers. */
|
2017 |
|
|
else if (c == '%' && ((*ptr >= 'a' && *ptr <= 'z')
|
2018 |
|
|
|| (*ptr >= 'A' && *ptr <= 'Z')))
|
2019 |
|
|
{
|
2020 |
|
|
int letter = *ptr++;
|
2021 |
|
|
|
2022 |
|
|
c = atoi (ptr);
|
2023 |
|
|
|
2024 |
|
|
switch (letter)
|
2025 |
|
|
{
|
2026 |
|
|
case 'l':
|
2027 |
|
|
output_asm_label (recog_data.operand[c]);
|
2028 |
|
|
break;
|
2029 |
|
|
|
2030 |
|
|
case 'a':
|
2031 |
|
|
output_address (recog_data.operand[c]);
|
2032 |
|
|
break;
|
2033 |
|
|
|
2034 |
|
|
default:
|
2035 |
|
|
picochip_print_operand (f, recog_data.operand[c], letter);
|
2036 |
|
|
}
|
2037 |
|
|
|
2038 |
|
|
while ((c = *ptr) >= '0' && c <= '9')
|
2039 |
|
|
ptr++;
|
2040 |
|
|
}
|
2041 |
|
|
else if (c == '%')
|
2042 |
|
|
internal_error
|
2043 |
|
|
("picochip_asm_output_opcode - can%'t output unknown operator %c",
|
2044 |
|
|
*ptr);
|
2045 |
|
|
else
|
2046 |
|
|
fputc (c, f);
|
2047 |
|
|
}
|
2048 |
|
|
|
2049 |
|
|
/* Reached the end of the packet. If any labels were deferred
|
2050 |
|
|
during output, emit them now. */
|
2051 |
|
|
if (!picochip_vliw_continuation)
|
2052 |
|
|
{
|
2053 |
|
|
if (picochip_current_vliw_state.num_cfi_labels_deferred != 0)
|
2054 |
|
|
{
|
2055 |
|
|
fprintf (f, "\n");
|
2056 |
|
|
assemble_name (f, picochip_current_vliw_state.cfi_label_name[0]);
|
2057 |
|
|
fprintf (f, "=");
|
2058 |
|
|
if (picochip_current_vliw_state.num_cfi_labels_deferred == 2)
|
2059 |
|
|
{
|
2060 |
|
|
fprintf (f, "\n");
|
2061 |
|
|
assemble_name (f, picochip_current_vliw_state.cfi_label_name[1]);
|
2062 |
|
|
fprintf (f, "=");
|
2063 |
|
|
}
|
2064 |
|
|
}
|
2065 |
|
|
|
2066 |
|
|
if (strlen (picochip_current_vliw_state.lm_label_name) != 0)
|
2067 |
|
|
{
|
2068 |
|
|
fprintf (f, "\n");
|
2069 |
|
|
assemble_name (f, picochip_current_vliw_state.lm_label_name);
|
2070 |
|
|
fprintf (f, "=");
|
2071 |
|
|
}
|
2072 |
|
|
}
|
2073 |
|
|
|
2074 |
|
|
/* Output an end-of-packet marker if requested. */
|
2075 |
|
|
if (!picochip_vliw_continuation &&
|
2076 |
|
|
TARGET_DEBUG && picochip_schedule_type == DFA_TYPE_SPEED)
|
2077 |
|
|
fprintf (f, "\n\t//-------------- End of VLIW packet -----------------");
|
2078 |
|
|
|
2079 |
|
|
return ptr;
|
2080 |
|
|
}
|
2081 |
|
|
|
2082 |
|
|
/* Function RTL expansion. */
|
2083 |
|
|
|
2084 |
|
|
/* Expand the prologue into RTL. */
|
2085 |
|
|
void
|
2086 |
|
|
picochip_expand_prologue (void)
|
2087 |
|
|
{
|
2088 |
|
|
int stack_adjustment = 0;
|
2089 |
|
|
int special_save_offset = 0;
|
2090 |
|
|
int general_save_offset = 0;
|
2091 |
|
|
int reg_save_offset = 0;
|
2092 |
|
|
int i = 0;
|
2093 |
|
|
|
2094 |
|
|
stack_adjustment = picochip_arg_area_byte_offset ();
|
2095 |
|
|
general_save_offset =
|
2096 |
|
|
-(stack_adjustment - picochip_save_area_byte_offset ());
|
2097 |
|
|
special_save_offset =
|
2098 |
|
|
-(stack_adjustment - picochip_special_save_area_byte_offset ());
|
2099 |
|
|
|
2100 |
|
|
/* Save the link registers. We could try to save just one register
|
2101 |
|
|
here. This would reduce the amount of stack space required.
|
2102 |
|
|
There hasnt been a good reason to do that so far. */
|
2103 |
|
|
if (!picochip_can_eliminate_link_sp_save ())
|
2104 |
|
|
picochip_emit_save_register (gen_rtx_REG (SImode, LINK_REGNUM),
|
2105 |
|
|
special_save_offset);
|
2106 |
|
|
|
2107 |
|
|
/* Save callee-save registers. */
|
2108 |
|
|
reg_save_offset = 0;
|
2109 |
|
|
for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
|
2110 |
|
|
{
|
2111 |
|
|
if (picochip_reg_needs_saving (i))
|
2112 |
|
|
{
|
2113 |
|
|
|
2114 |
|
|
/* If this register is an even numbered register, and the
|
2115 |
|
|
next register also needs to be saved, use a SImode save,
|
2116 |
|
|
which does both in one instruction. Note that a special
|
2117 |
|
|
check is performed to ensure that the double word aligned
|
2118 |
|
|
store is valid (e.g., it is possible that r6, r8, r9 need
|
2119 |
|
|
to be saved, in which case once r6 has been saved, the
|
2120 |
|
|
stored offset is no longer aligned, and an STL/LDL
|
2121 |
|
|
instruction becomes invalid). Alternately, we could store all
|
2122 |
|
|
aligned registers first and then save the single one(s). */
|
2123 |
|
|
if ((i % 2 == 0) &&
|
2124 |
|
|
picochip_reg_needs_saving (i + 1) &&
|
2125 |
|
|
picochip_is_aligned (reg_save_offset, LONG_TYPE_SIZE))
|
2126 |
|
|
{
|
2127 |
|
|
picochip_emit_save_register (gen_rtx_REG (SImode, i),
|
2128 |
|
|
general_save_offset +
|
2129 |
|
|
reg_save_offset);
|
2130 |
|
|
reg_save_offset += 2 * UNITS_PER_WORD;
|
2131 |
|
|
i++;
|
2132 |
|
|
}
|
2133 |
|
|
else
|
2134 |
|
|
{
|
2135 |
|
|
picochip_emit_save_register (gen_rtx_REG (HImode, i),
|
2136 |
|
|
general_save_offset +
|
2137 |
|
|
reg_save_offset);
|
2138 |
|
|
reg_save_offset += UNITS_PER_WORD;
|
2139 |
|
|
}
|
2140 |
|
|
}
|
2141 |
|
|
|
2142 |
|
|
}
|
2143 |
|
|
|
2144 |
|
|
/* Emit a stack adjustment where required. */
|
2145 |
|
|
if (stack_adjustment != 0)
|
2146 |
|
|
picochip_emit_stack_allocate (stack_adjustment);
|
2147 |
|
|
|
2148 |
|
|
/* If this function uses varadic arguments, write any unnamed
|
2149 |
|
|
registers to the stack. */
|
2150 |
|
|
if (cfun->stdarg)
|
2151 |
|
|
{
|
2152 |
|
|
int stdarg_offset = picochip_pretend_arg_area_byte_offset ();
|
2153 |
|
|
|
2154 |
|
|
/* Sanity check. The pretend argument offset should be 32-bit aligned. */
|
2155 |
|
|
gcc_assert(picochip_pretend_arg_area_byte_offset () % 4 == 0);
|
2156 |
|
|
|
2157 |
|
|
picochip_emit_save_register (gen_rtx_REG (SImode, 0), stdarg_offset);
|
2158 |
|
|
picochip_emit_save_register (gen_rtx_REG (SImode, 2),
|
2159 |
|
|
stdarg_offset + 4);
|
2160 |
|
|
picochip_emit_save_register (gen_rtx_REG (SImode, 4),
|
2161 |
|
|
stdarg_offset + 8);
|
2162 |
|
|
|
2163 |
|
|
}
|
2164 |
|
|
|
2165 |
|
|
}
|
2166 |
|
|
|
2167 |
|
|
/* Expand the epilogue into RTL. */
|
2168 |
|
|
void
|
2169 |
|
|
picochip_expand_epilogue (int is_sibling_call ATTRIBUTE_UNUSED)
|
2170 |
|
|
{
|
2171 |
|
|
int stack_adjustment = 0;
|
2172 |
|
|
int special_save_offset = 0;
|
2173 |
|
|
int general_save_offset = 0;
|
2174 |
|
|
int reg_save_offset = 0;
|
2175 |
|
|
int i = 0;
|
2176 |
|
|
int use_link_fp_restore_stack_adjust = 0; /* Default to using an explicit
|
2177 |
|
|
stack restore. */
|
2178 |
|
|
|
2179 |
|
|
stack_adjustment = picochip_arg_area_byte_offset ();
|
2180 |
|
|
general_save_offset =
|
2181 |
|
|
-(stack_adjustment - picochip_save_area_byte_offset ());
|
2182 |
|
|
special_save_offset =
|
2183 |
|
|
-(stack_adjustment - picochip_special_save_area_byte_offset ());
|
2184 |
|
|
|
2185 |
|
|
/* Emit a stack adjustment where required. */
|
2186 |
|
|
if (stack_adjustment != 0)
|
2187 |
|
|
{
|
2188 |
|
|
/* If the link/fp is already being restored, and the offset to
|
2189 |
|
|
their save location is small enough, don't bother adjusting
|
2190 |
|
|
the stack explicitly. */
|
2191 |
|
|
if (picochip_special_save_area_byte_offset () < 512 &&
|
2192 |
|
|
!picochip_can_eliminate_link_sp_save ())
|
2193 |
|
|
use_link_fp_restore_stack_adjust = 1;
|
2194 |
|
|
else
|
2195 |
|
|
/* Explicitly restore the stack. */
|
2196 |
|
|
picochip_emit_stack_allocate (-stack_adjustment);
|
2197 |
|
|
}
|
2198 |
|
|
|
2199 |
|
|
/* Restore the Link/FP registers. Only save the link register? */
|
2200 |
|
|
if (!picochip_can_eliminate_link_sp_save ())
|
2201 |
|
|
{
|
2202 |
|
|
if (use_link_fp_restore_stack_adjust)
|
2203 |
|
|
picochip_emit_restore_register (gen_rtx_REG (SImode, LINK_REGNUM),
|
2204 |
|
|
picochip_special_save_area_byte_offset
|
2205 |
|
|
());
|
2206 |
|
|
else
|
2207 |
|
|
picochip_emit_restore_register (gen_rtx_REG (SImode, LINK_REGNUM),
|
2208 |
|
|
special_save_offset);
|
2209 |
|
|
}
|
2210 |
|
|
|
2211 |
|
|
/* Restore callee-save registers. */
|
2212 |
|
|
reg_save_offset = 0;
|
2213 |
|
|
for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
|
2214 |
|
|
{
|
2215 |
|
|
if (picochip_reg_needs_saving (i))
|
2216 |
|
|
{
|
2217 |
|
|
|
2218 |
|
|
/* If this register is an even numbered register, and the
|
2219 |
|
|
next register also needs to be saved, use a SImode save,
|
2220 |
|
|
which does both in one instruction. Note that a special
|
2221 |
|
|
check is performed to ensure that the double word aligned
|
2222 |
|
|
store is valid (e.g., it is possible that r6, r8, r9 need
|
2223 |
|
|
to be saved, in which case once r6 has been saved, the
|
2224 |
|
|
stored offset is no longer aligned, and an STL/LDL
|
2225 |
|
|
instruction becomes invalid). We could store all aligned
|
2226 |
|
|
registers first, and then save the single one(s). */
|
2227 |
|
|
if ((i % 2 == 0) &&
|
2228 |
|
|
picochip_reg_needs_saving (i + 1) &&
|
2229 |
|
|
picochip_is_aligned (reg_save_offset, LONG_TYPE_SIZE))
|
2230 |
|
|
{
|
2231 |
|
|
picochip_emit_restore_register (gen_rtx_REG (SImode, i),
|
2232 |
|
|
general_save_offset +
|
2233 |
|
|
reg_save_offset);
|
2234 |
|
|
reg_save_offset += 2 * UNITS_PER_WORD;
|
2235 |
|
|
i++;
|
2236 |
|
|
}
|
2237 |
|
|
else
|
2238 |
|
|
{
|
2239 |
|
|
picochip_emit_restore_register (gen_rtx_REG (HImode, i),
|
2240 |
|
|
general_save_offset +
|
2241 |
|
|
reg_save_offset);
|
2242 |
|
|
reg_save_offset += UNITS_PER_WORD;
|
2243 |
|
|
}
|
2244 |
|
|
}
|
2245 |
|
|
|
2246 |
|
|
}
|
2247 |
|
|
|
2248 |
|
|
/* Emit a return instruction, which matches a (parallel
|
2249 |
|
|
[(return) (use r12)]) */
|
2250 |
|
|
{
|
2251 |
|
|
rtvec p;
|
2252 |
|
|
p = rtvec_alloc (2);
|
2253 |
|
|
|
2254 |
|
|
RTVEC_ELT (p, 0) = ret_rtx;
|
2255 |
|
|
RTVEC_ELT (p, 1) = gen_rtx_USE (VOIDmode,
|
2256 |
|
|
gen_rtx_REG (Pmode, LINK_REGNUM));
|
2257 |
|
|
emit_jump_insn (gen_rtx_PARALLEL (VOIDmode, p));
|
2258 |
|
|
}
|
2259 |
|
|
|
2260 |
|
|
}
|
2261 |
|
|
|
2262 |
|
|
/* Assembly instruction output. */
|
2263 |
|
|
|
2264 |
|
|
/* Test whether the given branch instruction is short, or long. Short
|
2265 |
|
|
* branches are equivalent to real branches, and may be DFA
|
2266 |
|
|
* scheduled. Long branches expand to a macro which is handled by the
|
2267 |
|
|
* elaborator, and cannot be scheduled. Occasionally, the branch
|
2268 |
|
|
* shortening pass, which is run after DFA scheduling, will change the
|
2269 |
|
|
* code layout and cause the short branch to be reverted into a long
|
2270 |
|
|
* branch. Instead of having to fix this up by emitting new assembly,
|
2271 |
|
|
* the short branch is emitted anyway. There is plenty of slack in the
|
2272 |
|
|
* calculation of long and short branches (10-bit offset, but only
|
2273 |
|
|
* 9-bits used in computation), so there is enough slack for this to
|
2274 |
|
|
* be safe. */
|
2275 |
|
|
static int
|
2276 |
|
|
picochip_is_short_branch (rtx insn)
|
2277 |
|
|
{
|
2278 |
|
|
int isRealShortBranch = (get_attr_length(insn) == SHORT_BRANCH_LENGTH);
|
2279 |
|
|
|
2280 |
|
|
return (isRealShortBranch ||
|
2281 |
|
|
picochip_current_vliw_state.num_insns_in_packet > 1);
|
2282 |
|
|
}
|
2283 |
|
|
|
2284 |
|
|
/* Output a compare-and-branch instruction (matching the cbranch
|
2285 |
|
|
pattern). */
|
2286 |
|
|
const char *
|
2287 |
|
|
picochip_output_cbranch (rtx operands[])
|
2288 |
|
|
{
|
2289 |
|
|
|
2290 |
|
|
if (HImode != GET_MODE (operands[1]) ||
|
2291 |
|
|
(HImode != GET_MODE (operands[2]) &&
|
2292 |
|
|
GET_CODE (operands[2]) != CONST_INT))
|
2293 |
|
|
{
|
2294 |
|
|
internal_error ("%s: at least one operand can%'t be handled",
|
2295 |
|
|
__FUNCTION__);
|
2296 |
|
|
}
|
2297 |
|
|
|
2298 |
|
|
/* Use the type of comparison to output the appropriate condition
|
2299 |
|
|
test. */
|
2300 |
|
|
switch (GET_CODE (operands[0]))
|
2301 |
|
|
{
|
2302 |
|
|
case NE:
|
2303 |
|
|
return ("// if (%1 != %2) goto %l3\n\tSUB.%# %1,%2,r15\n\tJMPNE %l3");
|
2304 |
|
|
|
2305 |
|
|
case EQ:
|
2306 |
|
|
return ("// if (%1 == %2) goto %l3\n\tSUB.%# %1,%2,r15\n\tJMPEQ %l3");
|
2307 |
|
|
|
2308 |
|
|
case LE:
|
2309 |
|
|
/* Reverse the operand order to be GE */
|
2310 |
|
|
return ("// if (%1 <= %2) goto %l3\n\tSUB.%# %2,%1,r15\n\tJMPGE %l3");
|
2311 |
|
|
|
2312 |
|
|
case LEU:
|
2313 |
|
|
/* Reverse operand order of GEU. */
|
2314 |
|
|
return ("// if (%1 <= %2) goto %l3\n\tSUB.%# %2,%1,r15\n\tJMPHS %l3");
|
2315 |
|
|
|
2316 |
|
|
case GE:
|
2317 |
|
|
return ("// if (%1 >= %2) goto %l3\n\tSUB.%# %1,%2,r15\n\tJMPGE %l3");
|
2318 |
|
|
|
2319 |
|
|
case GEU:
|
2320 |
|
|
return ("// if (%1 >= %2) goto %l3\n\tSUB.%# %1,%2,r15\n\tJMPHS %l3");
|
2321 |
|
|
|
2322 |
|
|
case LT:
|
2323 |
|
|
return ("// if (%1 < %2) goto %l3\n\tSUB.%# %1,%2,r15\n\tJMPLT %l3");
|
2324 |
|
|
|
2325 |
|
|
case LTU:
|
2326 |
|
|
return ("// if (%1 <{U} %2) goto %l3\n\tSUB.%# %1,%2,r15\n\tJMPLO %l3");
|
2327 |
|
|
|
2328 |
|
|
case GT:
|
2329 |
|
|
/* Reversed operand version of LT. */
|
2330 |
|
|
return ("// if (%1 > %2) goto %l3\n\tSUB.%# %2,%1,r15\n\tJMPLT %l3");
|
2331 |
|
|
|
2332 |
|
|
case GTU:
|
2333 |
|
|
/* Reverse an LTU. */
|
2334 |
|
|
return ("// if (%1 >{U} %2) goto %l3\n\tSUB.%# %2,%1,r15\n\tJMPLO %l3");
|
2335 |
|
|
|
2336 |
|
|
default:
|
2337 |
|
|
gcc_unreachable();
|
2338 |
|
|
}
|
2339 |
|
|
}
|
2340 |
|
|
|
2341 |
|
|
/* Output a compare-and-branch instruction (matching the cbranch
|
2342 |
|
|
pattern). This function is current unused since the cbranch
|
2343 |
|
|
split is disabled. The function is kept around so we can use
|
2344 |
|
|
it when we understand how to do cbranch split safely. */
|
2345 |
|
|
const char *
|
2346 |
|
|
picochip_output_compare (rtx operands[])
|
2347 |
|
|
{
|
2348 |
|
|
int code;
|
2349 |
|
|
|
2350 |
|
|
if (HImode != GET_MODE (operands[1]) ||
|
2351 |
|
|
(HImode != GET_MODE (operands[2]) &&
|
2352 |
|
|
GET_CODE (operands[2]) != CONST_INT))
|
2353 |
|
|
{
|
2354 |
|
|
internal_error ("%s: at least one operand can%'t be handled",
|
2355 |
|
|
__FUNCTION__);
|
2356 |
|
|
}
|
2357 |
|
|
|
2358 |
|
|
code = GET_CODE (operands[0]);
|
2359 |
|
|
/* Use the type of comparison to output the appropriate condition
|
2360 |
|
|
test. */
|
2361 |
|
|
switch (code)
|
2362 |
|
|
{
|
2363 |
|
|
case NE:
|
2364 |
|
|
return ("SUB.%# %1,%2,r15\t// CC := (%0)");
|
2365 |
|
|
|
2366 |
|
|
case EQ:
|
2367 |
|
|
return ("SUB.%# %1,%2,r15\t// CC := (%0)");
|
2368 |
|
|
|
2369 |
|
|
case LE:
|
2370 |
|
|
/* Reverse the operand order to be GE */
|
2371 |
|
|
return ("SUB.%# %2,%1,r15\t// CC := (%0)");
|
2372 |
|
|
|
2373 |
|
|
case LEU:
|
2374 |
|
|
/* Reverse operand order of GEU. */
|
2375 |
|
|
return ("SUB.%# %2,%1,r15\t// CC := (%0)");
|
2376 |
|
|
|
2377 |
|
|
case GE:
|
2378 |
|
|
return ("SUB.%# %1,%2,r15\t// CC := (%0)");
|
2379 |
|
|
|
2380 |
|
|
case GEU:
|
2381 |
|
|
return ("SUB.%# %1,%2,r15\t// CC := (%0)");
|
2382 |
|
|
|
2383 |
|
|
case LT:
|
2384 |
|
|
return ("SUB.%# %1,%2,r15\t// CC := (%0)");
|
2385 |
|
|
|
2386 |
|
|
case LTU:
|
2387 |
|
|
return ("SUB.%# %1,%2,r15\t// CC := (%0)");
|
2388 |
|
|
|
2389 |
|
|
case GT:
|
2390 |
|
|
/* Reversed operand version of LT. */
|
2391 |
|
|
return ("SUB.%# %2,%1,r15\t// CC := (%0)");
|
2392 |
|
|
|
2393 |
|
|
case GTU:
|
2394 |
|
|
/* Reverse an LTU. */
|
2395 |
|
|
return ("SUB.%# %2,%1,r15\t// CC := (%0)");
|
2396 |
|
|
|
2397 |
|
|
default:
|
2398 |
|
|
gcc_unreachable();
|
2399 |
|
|
}
|
2400 |
|
|
}
|
2401 |
|
|
|
2402 |
|
|
/* Output the branch insn part of a compare-and-branch split. */
|
2403 |
|
|
const char *
|
2404 |
|
|
picochip_output_branch (rtx operands[], rtx insn)
|
2405 |
|
|
{
|
2406 |
|
|
|
2407 |
|
|
int code = GET_CODE(operands[2]);
|
2408 |
|
|
if (picochip_is_short_branch (insn))
|
2409 |
|
|
{
|
2410 |
|
|
/* Short branches can be output directly using the
|
2411 |
|
|
appropriate instruction. */
|
2412 |
|
|
switch (code)
|
2413 |
|
|
{
|
2414 |
|
|
case NE:
|
2415 |
|
|
return ("BNE %l0 %>");
|
2416 |
|
|
case EQ:
|
2417 |
|
|
return ("BEQ %l0 %>");
|
2418 |
|
|
case LE:
|
2419 |
|
|
return ("BGE %l0 %>");
|
2420 |
|
|
case LEU:
|
2421 |
|
|
return ("BHS %l0 %>");
|
2422 |
|
|
case GE:
|
2423 |
|
|
return ("BGE %l0 %>");
|
2424 |
|
|
case GEU:
|
2425 |
|
|
return ("BHS %l0 %>");
|
2426 |
|
|
case LT:
|
2427 |
|
|
return ("BLT %l0 %>");
|
2428 |
|
|
case LTU:
|
2429 |
|
|
return ("BLO %l0 %>");
|
2430 |
|
|
case GT:
|
2431 |
|
|
return ("BLT %l0 %>");
|
2432 |
|
|
case GTU:
|
2433 |
|
|
return ("BLO %l0 %>");
|
2434 |
|
|
default:
|
2435 |
|
|
internal_error ("unknown short branch in %s (type %d)",
|
2436 |
|
|
__FUNCTION__, (int) INTVAL (operands[1]));
|
2437 |
|
|
return "UNKNOWN_BRANCH";
|
2438 |
|
|
}
|
2439 |
|
|
}
|
2440 |
|
|
else
|
2441 |
|
|
{
|
2442 |
|
|
/* Long branches result in the emission of a special
|
2443 |
|
|
instruction, which the assembler expands into a suitable long
|
2444 |
|
|
branch. */
|
2445 |
|
|
|
2446 |
|
|
/* Use the type of comparison to output the appropriate condition
|
2447 |
|
|
test. */
|
2448 |
|
|
switch (code)
|
2449 |
|
|
{
|
2450 |
|
|
case NE:
|
2451 |
|
|
return ("JMPNE %l0 %>");
|
2452 |
|
|
case EQ:
|
2453 |
|
|
return ("JMPEQ %l0 %>");
|
2454 |
|
|
case LE:
|
2455 |
|
|
return ("JMPGE %l0 %>");
|
2456 |
|
|
case LEU:
|
2457 |
|
|
return ("JMPHS %l0 %>");
|
2458 |
|
|
case GE:
|
2459 |
|
|
return ("JMPGE %l0 %>");
|
2460 |
|
|
case GEU:
|
2461 |
|
|
return ("JMPHS %l0 %>");
|
2462 |
|
|
case LT:
|
2463 |
|
|
return ("JMPLT %l0 %>");
|
2464 |
|
|
case LTU:
|
2465 |
|
|
return ("JMPLO %l0 %>");
|
2466 |
|
|
case GT:
|
2467 |
|
|
return ("JMPLT %l0 %>");
|
2468 |
|
|
case GTU:
|
2469 |
|
|
return ("JMPLO %l0 %>");
|
2470 |
|
|
|
2471 |
|
|
default:
|
2472 |
|
|
internal_error ("unknown long branch in %s (type %d)",
|
2473 |
|
|
__FUNCTION__, (int) INTVAL (operands[1]));
|
2474 |
|
|
return "UNKNOWN_BRANCH";
|
2475 |
|
|
}
|
2476 |
|
|
|
2477 |
|
|
}
|
2478 |
|
|
}
|
2479 |
|
|
|
2480 |
|
|
/* Output a jump instruction. */
|
2481 |
|
|
const char *
|
2482 |
|
|
picochip_output_jump (rtx insn)
|
2483 |
|
|
{
|
2484 |
|
|
if (picochip_is_short_branch (insn))
|
2485 |
|
|
return "BRA %l0%>";
|
2486 |
|
|
else
|
2487 |
|
|
return "JMPRA %l0%>";
|
2488 |
|
|
}
|
2489 |
|
|
|
2490 |
|
|
const char *
|
2491 |
|
|
picochip_output_put_array (int alternative, rtx operands[])
|
2492 |
|
|
{
|
2493 |
|
|
/* Local output buffer. */
|
2494 |
|
|
char buf[256];
|
2495 |
|
|
|
2496 |
|
|
int portArraySize = INTVAL(operands[1]);
|
2497 |
|
|
int portBaseIndex = INTVAL(operands[2]);
|
2498 |
|
|
|
2499 |
|
|
if (alternative == 0)
|
2500 |
|
|
{
|
2501 |
|
|
sprintf (buf, "// Array put\n\tadd.0 [lsl %%0,2],&__commTable_put_%d_%d,lr\n\tjl (lr)",
|
2502 |
|
|
portArraySize, portBaseIndex);
|
2503 |
|
|
output_asm_insn (buf, operands);
|
2504 |
|
|
}
|
2505 |
|
|
else if (alternative == 1)
|
2506 |
|
|
{
|
2507 |
|
|
/* Constant port id. Emit a real instruction. */
|
2508 |
|
|
int portIndex = INTVAL(operands[0]) + portBaseIndex;
|
2509 |
|
|
if (portIndex < portBaseIndex ||
|
2510 |
|
|
portIndex >= (portBaseIndex + portArraySize))
|
2511 |
|
|
{
|
2512 |
|
|
error ("PUT uses port array index %d, which is out of range [%d..%d)",
|
2513 |
|
|
portIndex, portBaseIndex, portBaseIndex + portArraySize);
|
2514 |
|
|
}
|
2515 |
|
|
sprintf(buf, "PUT R[0:1],%d", portIndex);
|
2516 |
|
|
output_asm_insn (buf, operands);
|
2517 |
|
|
}
|
2518 |
|
|
else
|
2519 |
|
|
gcc_unreachable();
|
2520 |
|
|
|
2521 |
|
|
/* Both alternatives output the insn directly. */
|
2522 |
|
|
return "";
|
2523 |
|
|
}
|
2524 |
|
|
|
2525 |
|
|
const char *picochip_output_get_array (int alternative, rtx operands[])
|
2526 |
|
|
{
|
2527 |
|
|
/* Local output buffer. */
|
2528 |
|
|
char buf[256];
|
2529 |
|
|
|
2530 |
|
|
int portArraySize = INTVAL(operands[1]);
|
2531 |
|
|
int portBaseIndex = INTVAL(operands[2]);
|
2532 |
|
|
|
2533 |
|
|
if (alternative == 0)
|
2534 |
|
|
{
|
2535 |
|
|
sprintf (buf, "// Array get\n\tadd.0 [lsl %%0,2],&__commTable_get_%d_%d,lr\n\tjl (lr)",
|
2536 |
|
|
portArraySize, portBaseIndex);
|
2537 |
|
|
output_asm_insn (buf, operands);
|
2538 |
|
|
}
|
2539 |
|
|
else if (alternative == 1)
|
2540 |
|
|
{
|
2541 |
|
|
/* Constant port id. Emit a real instruction. */
|
2542 |
|
|
int portIndex = INTVAL(operands[0]) + portBaseIndex;
|
2543 |
|
|
if (portIndex < portBaseIndex ||
|
2544 |
|
|
portIndex >= (portBaseIndex + portArraySize))
|
2545 |
|
|
{
|
2546 |
|
|
error ("GET uses port array index %d, which is out of range [%d..%d)",
|
2547 |
|
|
portIndex, portBaseIndex, portBaseIndex + portArraySize);
|
2548 |
|
|
}
|
2549 |
|
|
sprintf(buf, "GET %d,R[0:1]", portIndex);
|
2550 |
|
|
output_asm_insn (buf, operands);
|
2551 |
|
|
}
|
2552 |
|
|
else
|
2553 |
|
|
gcc_unreachable();
|
2554 |
|
|
|
2555 |
|
|
/* Both alternatives output the insn directly. */
|
2556 |
|
|
return "";
|
2557 |
|
|
}
|
2558 |
|
|
|
2559 |
|
|
const char *picochip_output_testport_array (int alternative, rtx operands[])
|
2560 |
|
|
{
|
2561 |
|
|
/* Local output buffer. */
|
2562 |
|
|
char buf[256];
|
2563 |
|
|
|
2564 |
|
|
int portArraySize = INTVAL(operands[2]);
|
2565 |
|
|
int portBaseIndex = INTVAL(operands[3]);
|
2566 |
|
|
|
2567 |
|
|
if (alternative == 0)
|
2568 |
|
|
{
|
2569 |
|
|
sprintf (buf, "// Array tstport\n\tadd.0 [lsl %%1,2],&__commTable_tstport_%d_%d,lr\n\tjl (lr)\n=->\tcopy.0 0,%%0\n\tcopyeq 1,%%0",
|
2570 |
|
|
portArraySize, portBaseIndex);
|
2571 |
|
|
output_asm_insn (buf, operands);
|
2572 |
|
|
}
|
2573 |
|
|
else if (alternative == 1)
|
2574 |
|
|
{
|
2575 |
|
|
/* Constant port id. Emit a real instruction. */
|
2576 |
|
|
int portIndex = INTVAL(operands[1]) + portBaseIndex;
|
2577 |
|
|
if (portIndex < portBaseIndex ||
|
2578 |
|
|
portIndex >= (portBaseIndex + portArraySize))
|
2579 |
|
|
{
|
2580 |
|
|
error ("PUT uses port array index %d, which is out of range [%d..%d)",
|
2581 |
|
|
portIndex, portBaseIndex, portBaseIndex + portArraySize);
|
2582 |
|
|
}
|
2583 |
|
|
sprintf(buf, "copy.1 0,%%0 %%| TSTPORT %d\n\tcopyeq 1,%%0", portIndex);
|
2584 |
|
|
output_asm_insn (buf, operands);
|
2585 |
|
|
}
|
2586 |
|
|
else
|
2587 |
|
|
gcc_unreachable();
|
2588 |
|
|
|
2589 |
|
|
/* Both alternatives output the insn directly. */
|
2590 |
|
|
return "";
|
2591 |
|
|
}
|
2592 |
|
|
|
2593 |
|
|
/* Output a comparison operand as a symbol (e.g., >). */
|
2594 |
|
|
static void
|
2595 |
|
|
picochip_print_comparison (FILE * file, rtx operand, int letter)
|
2596 |
|
|
{
|
2597 |
|
|
|
2598 |
|
|
if (letter == 'i')
|
2599 |
|
|
{
|
2600 |
|
|
/* Output just the comparison symbol. */
|
2601 |
|
|
switch (GET_CODE (operand))
|
2602 |
|
|
{
|
2603 |
|
|
case NE:
|
2604 |
|
|
fprintf (file, "!=");
|
2605 |
|
|
break;
|
2606 |
|
|
case EQ:
|
2607 |
|
|
fprintf (file, "==");
|
2608 |
|
|
break;
|
2609 |
|
|
case GE:
|
2610 |
|
|
fprintf (file, ">=");
|
2611 |
|
|
break;
|
2612 |
|
|
case GEU:
|
2613 |
|
|
fprintf (file, ">={U}");
|
2614 |
|
|
break;
|
2615 |
|
|
case LT:
|
2616 |
|
|
fprintf (file, "<");
|
2617 |
|
|
break;
|
2618 |
|
|
case LTU:
|
2619 |
|
|
fprintf (file, "<{U}");
|
2620 |
|
|
break;
|
2621 |
|
|
case LE:
|
2622 |
|
|
fprintf (file, "<=");
|
2623 |
|
|
break;
|
2624 |
|
|
case LEU:
|
2625 |
|
|
fprintf (file, "<={U}");
|
2626 |
|
|
break;
|
2627 |
|
|
case GT:
|
2628 |
|
|
fprintf (file, ">");
|
2629 |
|
|
break;
|
2630 |
|
|
case GTU:
|
2631 |
|
|
fprintf (file, ">{U}");
|
2632 |
|
|
break;
|
2633 |
|
|
default:
|
2634 |
|
|
gcc_unreachable();
|
2635 |
|
|
}
|
2636 |
|
|
}
|
2637 |
|
|
else
|
2638 |
|
|
{
|
2639 |
|
|
/* Output the comparison formatted as operand,symbol,operand */
|
2640 |
|
|
rtx op0 = XEXP (operand, 0);
|
2641 |
|
|
rtx op1 = XEXP (operand, 1);
|
2642 |
|
|
|
2643 |
|
|
picochip_print_operand (file, op0, 0);
|
2644 |
|
|
picochip_print_comparison (file, operand, 'i');
|
2645 |
|
|
picochip_print_operand (file, op1, 0);
|
2646 |
|
|
}
|
2647 |
|
|
}
|
2648 |
|
|
|
2649 |
|
|
/* This function generates a memory address operand in the given
|
2650 |
|
|
mode. That is, if the address contains a constant offset, then the
|
2651 |
|
|
offset is divided by the required mode size to compute the
|
2652 |
|
|
mode specific offset. By default, picochip_print_operand_address calls
|
2653 |
|
|
this function using the natural mode of the operand, but special
|
2654 |
|
|
operand codes can be used to invoke the computation using an
|
2655 |
|
|
unnatural mode (e.g., compute the HI aligned address of an SI mode
|
2656 |
|
|
address). */
|
2657 |
|
|
static void
|
2658 |
|
|
picochip_print_memory_address (FILE * file, rtx operand,
|
2659 |
|
|
enum machine_mode mode)
|
2660 |
|
|
{
|
2661 |
|
|
rtx address = XEXP (operand, 0);
|
2662 |
|
|
|
2663 |
|
|
/* Sanity check. */
|
2664 |
|
|
if (MEM != GET_CODE (operand))
|
2665 |
|
|
fatal_insn ("picochip_print_memory_address - Operand isn't memory based",
|
2666 |
|
|
operand);
|
2667 |
|
|
|
2668 |
|
|
if (TARGET_DEBUG)
|
2669 |
|
|
{
|
2670 |
|
|
printf ("picochip_print_memory_address: ");
|
2671 |
|
|
print_rtl (stdout, operand);
|
2672 |
|
|
printf ("\n");
|
2673 |
|
|
}
|
2674 |
|
|
|
2675 |
|
|
switch (GET_CODE (address))
|
2676 |
|
|
{
|
2677 |
|
|
case PLUS:
|
2678 |
|
|
{
|
2679 |
|
|
/* Grab the address components. */
|
2680 |
|
|
rtx base = XEXP (address, 0);
|
2681 |
|
|
rtx offset = XEXP (address, 1);
|
2682 |
|
|
|
2683 |
|
|
/* Only handle reg+const addresses */
|
2684 |
|
|
if (REG == GET_CODE (base) && CONST_INT == GET_CODE (offset))
|
2685 |
|
|
{
|
2686 |
|
|
/* Sanity check. If an FP+offset address is given, ensure
|
2687 |
|
|
that the offset lies within the given frame, or a lower
|
2688 |
|
|
frame. */
|
2689 |
|
|
if (REGNO (base) == STACK_POINTER_REGNUM )
|
2690 |
|
|
gcc_assert (INTVAL (offset) <= (picochip_arg_area_byte_offset () +
|
2691 |
|
|
crtl->args.size));
|
2692 |
|
|
|
2693 |
|
|
/* Print the base register - identical for all modes. */
|
2694 |
|
|
fprintf (file, "(");
|
2695 |
|
|
picochip_print_operand (file, base, 'r');
|
2696 |
|
|
fprintf (file, ")");
|
2697 |
|
|
|
2698 |
|
|
/* Print the constant offset with compensation for the mode. */
|
2699 |
|
|
switch (mode)
|
2700 |
|
|
{
|
2701 |
|
|
case QImode:
|
2702 |
|
|
picochip_print_operand (file, offset, 'Q');
|
2703 |
|
|
break;
|
2704 |
|
|
|
2705 |
|
|
case HImode:
|
2706 |
|
|
picochip_print_operand (file, offset, 'H');
|
2707 |
|
|
break;
|
2708 |
|
|
|
2709 |
|
|
case SImode:
|
2710 |
|
|
case SFmode:
|
2711 |
|
|
picochip_print_operand (file, offset, 'S');
|
2712 |
|
|
break;
|
2713 |
|
|
|
2714 |
|
|
case DImode:
|
2715 |
|
|
picochip_print_operand (file, offset, 'D');
|
2716 |
|
|
break;
|
2717 |
|
|
|
2718 |
|
|
default:
|
2719 |
|
|
gcc_unreachable();
|
2720 |
|
|
}
|
2721 |
|
|
|
2722 |
|
|
}
|
2723 |
|
|
|
2724 |
|
|
}
|
2725 |
|
|
|
2726 |
|
|
break;
|
2727 |
|
|
|
2728 |
|
|
case SYMBOL_REF:
|
2729 |
|
|
picochip_print_operand (file, address, 's');
|
2730 |
|
|
break;
|
2731 |
|
|
|
2732 |
|
|
case CONST:
|
2733 |
|
|
{
|
2734 |
|
|
rtx inner;
|
2735 |
|
|
rtx base;
|
2736 |
|
|
rtx offset;
|
2737 |
|
|
|
2738 |
|
|
inner = XEXP (address, 0);
|
2739 |
|
|
|
2740 |
|
|
/* Sanity check - the CONST memory address must be a base+offset. */
|
2741 |
|
|
gcc_assert (PLUS == GET_CODE (inner));
|
2742 |
|
|
|
2743 |
|
|
base = XEXP (inner, 0);
|
2744 |
|
|
offset = XEXP (inner, 1);
|
2745 |
|
|
|
2746 |
|
|
fprintf (file, "&_%s%+d", XSTR (base, 0), XINT (offset, 0));
|
2747 |
|
|
|
2748 |
|
|
break;
|
2749 |
|
|
}
|
2750 |
|
|
|
2751 |
|
|
case REG:
|
2752 |
|
|
/* Register operand. Provide a zero offset. */
|
2753 |
|
|
fprintf (file, "(");
|
2754 |
|
|
picochip_print_operand (file, address, 'r');
|
2755 |
|
|
fprintf (file, ")0");
|
2756 |
|
|
break;
|
2757 |
|
|
|
2758 |
|
|
default:
|
2759 |
|
|
gcc_unreachable();
|
2760 |
|
|
}
|
2761 |
|
|
|
2762 |
|
|
}
|
2763 |
|
|
|
2764 |
|
|
/* Output an operand. Formatting letters allow particular parts of
|
2765 |
|
|
the operand to be output. */
|
2766 |
|
|
void
|
2767 |
|
|
picochip_print_operand (FILE * file, rtx operand, int letter)
|
2768 |
|
|
{
|
2769 |
|
|
|
2770 |
|
|
/* Handle special cases. */
|
2771 |
|
|
switch (letter)
|
2772 |
|
|
{
|
2773 |
|
|
/* VLIW continuation, for explicit VLIW sequences. */
|
2774 |
|
|
case '|':
|
2775 |
|
|
fprintf (file, "\\");
|
2776 |
|
|
return;
|
2777 |
|
|
|
2778 |
|
|
/* ALU selector. */
|
2779 |
|
|
case '#':
|
2780 |
|
|
fputc (picochip_get_vliw_alu_id (), file);
|
2781 |
|
|
return;
|
2782 |
|
|
|
2783 |
|
|
/* Delay slot specifier. */
|
2784 |
|
|
case '>':
|
2785 |
|
|
/* This should be handled in asm_output_opcode. */
|
2786 |
|
|
gcc_unreachable();
|
2787 |
|
|
|
2788 |
|
|
/* Instruction mnemonics (e.g., lshift becomes LSL). */
|
2789 |
|
|
case 'I':
|
2790 |
|
|
switch (GET_CODE (operand))
|
2791 |
|
|
{
|
2792 |
|
|
case AND:
|
2793 |
|
|
fprintf (file, "AND");
|
2794 |
|
|
break;
|
2795 |
|
|
case IOR:
|
2796 |
|
|
fprintf (file, "OR");
|
2797 |
|
|
break;
|
2798 |
|
|
case XOR:
|
2799 |
|
|
fprintf (file, "XOR");
|
2800 |
|
|
break;
|
2801 |
|
|
case PLUS:
|
2802 |
|
|
fprintf (file, "ADD");
|
2803 |
|
|
break;
|
2804 |
|
|
case MINUS:
|
2805 |
|
|
fprintf (file, "SUB");
|
2806 |
|
|
break;
|
2807 |
|
|
default:
|
2808 |
|
|
gcc_unreachable();
|
2809 |
|
|
}
|
2810 |
|
|
return;
|
2811 |
|
|
|
2812 |
|
|
/* Symbolic instructions (e.g., lshift becomes <<). */
|
2813 |
|
|
case 'i':
|
2814 |
|
|
switch (GET_CODE (operand))
|
2815 |
|
|
{
|
2816 |
|
|
case AND:
|
2817 |
|
|
fprintf (file, "&");
|
2818 |
|
|
break;
|
2819 |
|
|
case IOR:
|
2820 |
|
|
fprintf (file, "|");
|
2821 |
|
|
break;
|
2822 |
|
|
case XOR:
|
2823 |
|
|
fprintf (file, "^");
|
2824 |
|
|
break;
|
2825 |
|
|
case PLUS:
|
2826 |
|
|
fprintf (file, "+");
|
2827 |
|
|
break;
|
2828 |
|
|
case MINUS:
|
2829 |
|
|
fprintf (file, "-");
|
2830 |
|
|
break;
|
2831 |
|
|
default:
|
2832 |
|
|
fprintf (file, "UNKNOWN_INSN");
|
2833 |
|
|
break;
|
2834 |
|
|
}
|
2835 |
|
|
return;
|
2836 |
|
|
|
2837 |
|
|
default: /* Not a punctuation character - process as normal. */
|
2838 |
|
|
break;
|
2839 |
|
|
}
|
2840 |
|
|
|
2841 |
|
|
switch (GET_CODE (operand))
|
2842 |
|
|
{
|
2843 |
|
|
case REG:
|
2844 |
|
|
switch (letter)
|
2845 |
|
|
{
|
2846 |
|
|
case 'R':
|
2847 |
|
|
/* Write a range of registers. */
|
2848 |
|
|
fprintf (file, "R[%d:%d]", REGNO (operand) + 1, REGNO (operand));
|
2849 |
|
|
break;
|
2850 |
|
|
|
2851 |
|
|
case 'U':
|
2852 |
|
|
/* The upper register of a pair is requested. */
|
2853 |
|
|
fprintf (file, "%s", picochip_regnames[REGNO (operand) + 1]);
|
2854 |
|
|
break;
|
2855 |
|
|
|
2856 |
|
|
case 'L':
|
2857 |
|
|
/* The lower register of a pair is requested. Equivalent to the
|
2858 |
|
|
default, but included for completeness. */
|
2859 |
|
|
fprintf (file, "%s", picochip_regnames[REGNO (operand)]);
|
2860 |
|
|
break;
|
2861 |
|
|
|
2862 |
|
|
case 'X':
|
2863 |
|
|
/* The 3rd register of a DI mode register. */
|
2864 |
|
|
fprintf (file, "%s", picochip_regnames[REGNO (operand) + 2]);
|
2865 |
|
|
break;
|
2866 |
|
|
|
2867 |
|
|
case 'Y':
|
2868 |
|
|
/* The 4th register of a DI mode register. */
|
2869 |
|
|
fprintf (file, "%s", picochip_regnames[REGNO (operand) + 3]);
|
2870 |
|
|
break;
|
2871 |
|
|
|
2872 |
|
|
default:
|
2873 |
|
|
fprintf (file, "%s", picochip_regnames[REGNO (operand)]);
|
2874 |
|
|
}
|
2875 |
|
|
break;
|
2876 |
|
|
|
2877 |
|
|
case CONST_INT:
|
2878 |
|
|
/* A range of letters can be used to format integers. The
|
2879 |
|
|
letters Q/H/S are used to divide the constant by the width of
|
2880 |
|
|
QI/HI/SI mode integers in bytes. The U/L modifiers are used
|
2881 |
|
|
to obtain the upper and lower 16-bits of a 32-bit
|
2882 |
|
|
constant. Where possible, signed numbers are used, since
|
2883 |
|
|
signed representations of numbers may be more compact (e.g.,
|
2884 |
|
|
65535 can be represented as -1, which fits into a small
|
2885 |
|
|
constant, whereas 65535 requires a large constant). */
|
2886 |
|
|
switch (letter)
|
2887 |
|
|
{
|
2888 |
|
|
case 'Q':
|
2889 |
|
|
fprintf (file, "%ld", INTVAL (operand));
|
2890 |
|
|
break;
|
2891 |
|
|
|
2892 |
|
|
case 'H':
|
2893 |
|
|
fprintf (file, "%ld", INTVAL (operand) / 2);
|
2894 |
|
|
break;
|
2895 |
|
|
|
2896 |
|
|
case 'S':
|
2897 |
|
|
fprintf (file, "%ld", INTVAL (operand) / 4);
|
2898 |
|
|
break;
|
2899 |
|
|
|
2900 |
|
|
case 'P':
|
2901 |
|
|
fprintf (file, "%d", exact_log2 (INTVAL(operand)));
|
2902 |
|
|
break;
|
2903 |
|
|
|
2904 |
|
|
case 'U':
|
2905 |
|
|
fprintf (file, "%hi", (short) ((INTVAL (operand) >> 16) & 0xFFFF));
|
2906 |
|
|
break;
|
2907 |
|
|
|
2908 |
|
|
case 'L':
|
2909 |
|
|
fprintf (file, "%hi", (short) (INTVAL (operand) & 0xFFFF));
|
2910 |
|
|
break;
|
2911 |
|
|
|
2912 |
|
|
default:
|
2913 |
|
|
fprintf (file, "%ld", INTVAL (operand));
|
2914 |
|
|
break;
|
2915 |
|
|
}
|
2916 |
|
|
break;
|
2917 |
|
|
|
2918 |
|
|
case CONST_DOUBLE:
|
2919 |
|
|
{
|
2920 |
|
|
long val;
|
2921 |
|
|
REAL_VALUE_TYPE rv;
|
2922 |
|
|
|
2923 |
|
|
if (GET_MODE (operand) != SFmode)
|
2924 |
|
|
fatal_insn ("Unknown mode in print_operand (CONST_DOUBLE) :",
|
2925 |
|
|
operand);
|
2926 |
|
|
REAL_VALUE_FROM_CONST_DOUBLE (rv, operand);
|
2927 |
|
|
REAL_VALUE_TO_TARGET_SINGLE (rv, val);
|
2928 |
|
|
|
2929 |
|
|
switch (letter)
|
2930 |
|
|
{
|
2931 |
|
|
case 'U':
|
2932 |
|
|
fprintf (file, "%hi", (short) ((val >> 16) & 0xFFFF));
|
2933 |
|
|
break;
|
2934 |
|
|
|
2935 |
|
|
case 'L':
|
2936 |
|
|
fprintf (file, "%hi", (short) (val & 0xFFFF));
|
2937 |
|
|
break;
|
2938 |
|
|
}
|
2939 |
|
|
|
2940 |
|
|
break;
|
2941 |
|
|
|
2942 |
|
|
}
|
2943 |
|
|
|
2944 |
|
|
/* Output a symbol. The output format must match that of
|
2945 |
|
|
picochip_output_label. */
|
2946 |
|
|
case SYMBOL_REF:
|
2947 |
|
|
/* Ensure that the symbol is marked as referenced. Gcc can
|
2948 |
|
|
occasionally omit the function bodies when it believes them
|
2949 |
|
|
to be unreferenced. */
|
2950 |
|
|
if (SYMBOL_REF_DECL (operand))
|
2951 |
|
|
mark_decl_referenced (SYMBOL_REF_DECL (operand));
|
2952 |
|
|
fprintf (file, "&");
|
2953 |
|
|
assemble_name (file, XSTR (operand, 0));
|
2954 |
|
|
break;
|
2955 |
|
|
|
2956 |
|
|
case LABEL_REF:
|
2957 |
|
|
/* This format must match that of picochip_output_label. */
|
2958 |
|
|
fprintf (file, "&");
|
2959 |
|
|
output_asm_label (operand);
|
2960 |
|
|
break;
|
2961 |
|
|
|
2962 |
|
|
case MEM:
|
2963 |
|
|
{
|
2964 |
|
|
rtx addr = XEXP (operand, 0);
|
2965 |
|
|
|
2966 |
|
|
switch (letter)
|
2967 |
|
|
{
|
2968 |
|
|
case 'o':
|
2969 |
|
|
if (PLUS != GET_CODE (addr))
|
2970 |
|
|
fatal_insn ("Bad address, not (reg+disp):", addr);
|
2971 |
|
|
else
|
2972 |
|
|
picochip_print_operand (file, XEXP (addr, 1), 0);
|
2973 |
|
|
break;
|
2974 |
|
|
|
2975 |
|
|
case 'M':
|
2976 |
|
|
/* Output a memory address in byte mode notation (i.e., the
|
2977 |
|
|
constant address (if any) is the actual byte address. */
|
2978 |
|
|
picochip_print_memory_address (file, operand, QImode);
|
2979 |
|
|
break;
|
2980 |
|
|
|
2981 |
|
|
/* Output a constant offset of the given mode (i.e., divide
|
2982 |
|
|
the constant by the number of units in the mode to get the
|
2983 |
|
|
constant). */
|
2984 |
|
|
case 'Q':
|
2985 |
|
|
picochip_print_memory_address (file, operand, QImode);
|
2986 |
|
|
break;
|
2987 |
|
|
|
2988 |
|
|
case 'H':
|
2989 |
|
|
picochip_print_memory_address (file, operand, HImode);
|
2990 |
|
|
break;
|
2991 |
|
|
|
2992 |
|
|
case 'S':
|
2993 |
|
|
picochip_print_memory_address (file, operand, SImode);
|
2994 |
|
|
break;
|
2995 |
|
|
|
2996 |
|
|
case 'F':
|
2997 |
|
|
picochip_print_memory_address (file, operand, SFmode);
|
2998 |
|
|
break;
|
2999 |
|
|
|
3000 |
|
|
case 'b':
|
3001 |
|
|
if (PLUS != GET_CODE (addr))
|
3002 |
|
|
fatal_insn ("Bad address, not (reg+disp):", addr);
|
3003 |
|
|
else
|
3004 |
|
|
picochip_print_operand (file, XEXP (addr, 0), 0);
|
3005 |
|
|
break;
|
3006 |
|
|
|
3007 |
|
|
/* When the mem operand is (reg + big offset) which cannot
|
3008 |
|
|
be represented in an instruction as operand, the compiler
|
3009 |
|
|
automatically generates the instruction to put in (reg +
|
3010 |
|
|
big offset) into another register. In such cases, it
|
3011 |
|
|
returns '0' as the character. This needs to be handled
|
3012 |
|
|
as well. */
|
3013 |
|
|
case 0:
|
3014 |
|
|
case 'r':
|
3015 |
|
|
if (REG != GET_CODE (addr))
|
3016 |
|
|
fatal_insn ("Bad address, not register:", addr);
|
3017 |
|
|
else
|
3018 |
|
|
picochip_print_operand (file, addr, 0);
|
3019 |
|
|
break;
|
3020 |
|
|
|
3021 |
|
|
default:
|
3022 |
|
|
fprintf (file, "Unknown mem operand - letter %c ",
|
3023 |
|
|
(char) (letter));
|
3024 |
|
|
print_rtl (file, operand);
|
3025 |
|
|
}
|
3026 |
|
|
|
3027 |
|
|
break;
|
3028 |
|
|
}
|
3029 |
|
|
|
3030 |
|
|
case CONST:
|
3031 |
|
|
{
|
3032 |
|
|
rtx const_exp = XEXP (operand, 0);
|
3033 |
|
|
|
3034 |
|
|
/* Handle constant offsets to symbol references. */
|
3035 |
|
|
if (PLUS == GET_CODE (const_exp) &&
|
3036 |
|
|
SYMBOL_REF == GET_CODE (XEXP (const_exp, 0)) &&
|
3037 |
|
|
CONST_INT == GET_CODE (XEXP (const_exp, 1)))
|
3038 |
|
|
{
|
3039 |
|
|
|
3040 |
|
|
picochip_print_operand (file, XEXP (const_exp, 0), 0);
|
3041 |
|
|
if (INTVAL (XEXP (const_exp, 1)) >= 0)
|
3042 |
|
|
fprintf (file, "+");
|
3043 |
|
|
/* else use the - from the operand (i.e., AP-2)) */
|
3044 |
|
|
|
3045 |
|
|
picochip_print_operand (file, XEXP (const_exp, 1), letter);
|
3046 |
|
|
|
3047 |
|
|
}
|
3048 |
|
|
}
|
3049 |
|
|
break;
|
3050 |
|
|
|
3051 |
|
|
|
3052 |
|
|
case PLUS:
|
3053 |
|
|
{
|
3054 |
|
|
/* PLUS expressions are of the form (base + offset). Different
|
3055 |
|
|
options (analagous to those of memory PLUS expressions) are used
|
3056 |
|
|
to extract the base and offset components. */
|
3057 |
|
|
|
3058 |
|
|
switch (letter)
|
3059 |
|
|
{
|
3060 |
|
|
case 'b':
|
3061 |
|
|
picochip_print_operand (file, XEXP (operand, 0), 0);
|
3062 |
|
|
break;
|
3063 |
|
|
|
3064 |
|
|
case 'o':
|
3065 |
|
|
picochip_print_operand (file, XEXP (operand, 1), 0);
|
3066 |
|
|
break;
|
3067 |
|
|
|
3068 |
|
|
default:
|
3069 |
|
|
|
3070 |
|
|
/* If the expression is composed entirely of constants,
|
3071 |
|
|
evaluate the result. This should only occur with the
|
3072 |
|
|
picoChip specific comms instructions, which are emitted as
|
3073 |
|
|
base+offset expressions. */
|
3074 |
|
|
if (CONST_INT == GET_CODE (XEXP (operand, 0)) &&
|
3075 |
|
|
CONST_INT == GET_CODE (XEXP (operand, 1)))
|
3076 |
|
|
{
|
3077 |
|
|
HOST_WIDE_INT result = (XINT (XEXP (operand, 0), 0) +
|
3078 |
|
|
XINT (XEXP (operand, 1), 0));
|
3079 |
|
|
fprintf (file, "%ld", result);
|
3080 |
|
|
}
|
3081 |
|
|
else
|
3082 |
|
|
{
|
3083 |
|
|
fprintf (file, "(");
|
3084 |
|
|
picochip_print_operand (file, XEXP (operand, 0), 0);
|
3085 |
|
|
fprintf (file, "+");
|
3086 |
|
|
picochip_print_operand (file, XEXP (operand, 1), 0);
|
3087 |
|
|
fprintf (file, ")");
|
3088 |
|
|
}
|
3089 |
|
|
}
|
3090 |
|
|
|
3091 |
|
|
break;
|
3092 |
|
|
}
|
3093 |
|
|
|
3094 |
|
|
/* Comparison operations. */
|
3095 |
|
|
case NE:
|
3096 |
|
|
case EQ:
|
3097 |
|
|
case GE:
|
3098 |
|
|
case GEU:
|
3099 |
|
|
case LT:
|
3100 |
|
|
case LTU:
|
3101 |
|
|
case LE:
|
3102 |
|
|
case LEU:
|
3103 |
|
|
case GT:
|
3104 |
|
|
case GTU:
|
3105 |
|
|
picochip_print_comparison (file, operand, letter);
|
3106 |
|
|
return;
|
3107 |
|
|
|
3108 |
|
|
default:
|
3109 |
|
|
fprintf (stderr, "Unknown operand encountered in %s\n", __FUNCTION__);
|
3110 |
|
|
print_rtl (file, operand);
|
3111 |
|
|
break;
|
3112 |
|
|
|
3113 |
|
|
}
|
3114 |
|
|
|
3115 |
|
|
}
|
3116 |
|
|
|
3117 |
|
|
/* Output an operand address */
|
3118 |
|
|
void
|
3119 |
|
|
picochip_print_operand_address (FILE * file, rtx operand)
|
3120 |
|
|
{
|
3121 |
|
|
|
3122 |
|
|
switch (GET_CODE (operand))
|
3123 |
|
|
{
|
3124 |
|
|
|
3125 |
|
|
case SYMBOL_REF:
|
3126 |
|
|
/* This format must match that of picochip_output_label. */
|
3127 |
|
|
assemble_name (file, XSTR (operand, 0));
|
3128 |
|
|
break;
|
3129 |
|
|
|
3130 |
|
|
case CODE_LABEL:
|
3131 |
|
|
/* Note this format must match that of picochip_output_label. */
|
3132 |
|
|
fprintf (file, "_L%d", XINT (operand, 5));
|
3133 |
|
|
break;
|
3134 |
|
|
|
3135 |
|
|
case MEM:
|
3136 |
|
|
/* Pass on to a specialised memory address generator. */
|
3137 |
|
|
picochip_print_memory_address (file, operand, GET_MODE (operand));
|
3138 |
|
|
break;
|
3139 |
|
|
|
3140 |
|
|
default:
|
3141 |
|
|
gcc_unreachable();
|
3142 |
|
|
|
3143 |
|
|
}
|
3144 |
|
|
|
3145 |
|
|
}
|
3146 |
|
|
|
3147 |
|
|
|
3148 |
|
|
/* Scheduling functions. */
|
3149 |
|
|
|
3150 |
|
|
/* Save some of the contents of recog_data. */
|
3151 |
|
|
static void
|
3152 |
|
|
picochip_save_recog_data (void)
|
3153 |
|
|
{
|
3154 |
|
|
picochip_saved_which_alternative = which_alternative;
|
3155 |
|
|
memcpy (&picochip_saved_recog_data, &recog_data,
|
3156 |
|
|
sizeof (struct recog_data));
|
3157 |
|
|
}
|
3158 |
|
|
|
3159 |
|
|
/* Restore some of the contents of global variable recog_data. */
|
3160 |
|
|
static void
|
3161 |
|
|
picochip_restore_recog_data (void)
|
3162 |
|
|
{
|
3163 |
|
|
which_alternative = picochip_saved_which_alternative;
|
3164 |
|
|
memcpy (&recog_data, &picochip_saved_recog_data,
|
3165 |
|
|
sizeof (struct recog_data));
|
3166 |
|
|
}
|
3167 |
|
|
|
3168 |
|
|
/* Ensure that no var tracking notes are emitted in the middle of a
|
3169 |
|
|
three-instruction bundle. */
|
3170 |
|
|
static void
|
3171 |
|
|
reorder_var_tracking_notes (void)
|
3172 |
|
|
{
|
3173 |
|
|
basic_block bb;
|
3174 |
|
|
|
3175 |
|
|
FOR_EACH_BB (bb)
|
3176 |
|
|
{
|
3177 |
|
|
rtx insn, next, last_insn = NULL_RTX;
|
3178 |
|
|
rtx queue = NULL_RTX;
|
3179 |
|
|
|
3180 |
|
|
/* Iterate through the bb and find the last non-debug insn */
|
3181 |
|
|
for (insn = BB_HEAD (bb); insn != NEXT_INSN(BB_END (bb)); insn = NEXT_INSN(insn))
|
3182 |
|
|
{
|
3183 |
|
|
if (NONDEBUG_INSN_P(insn))
|
3184 |
|
|
last_insn = insn;
|
3185 |
|
|
}
|
3186 |
|
|
|
3187 |
|
|
/* In all normal cases, queue up notes and emit them just before a TImode
|
3188 |
|
|
instruction. For the last instruction, emit the queued notes just after
|
3189 |
|
|
the last instruction. */
|
3190 |
|
|
for (insn = BB_HEAD (bb); insn != NEXT_INSN(BB_END (bb)); insn = next)
|
3191 |
|
|
{
|
3192 |
|
|
next = NEXT_INSN (insn);
|
3193 |
|
|
|
3194 |
|
|
if (insn == last_insn)
|
3195 |
|
|
{
|
3196 |
|
|
while (queue)
|
3197 |
|
|
{
|
3198 |
|
|
rtx next_queue = PREV_INSN (queue);
|
3199 |
|
|
PREV_INSN (NEXT_INSN(insn)) = queue;
|
3200 |
|
|
NEXT_INSN(queue) = NEXT_INSN(insn);
|
3201 |
|
|
PREV_INSN(queue) = insn;
|
3202 |
|
|
NEXT_INSN(insn) = queue;
|
3203 |
|
|
queue = next_queue;
|
3204 |
|
|
}
|
3205 |
|
|
/* There is no more to do for this bb. break*/
|
3206 |
|
|
break;
|
3207 |
|
|
}
|
3208 |
|
|
else if (NONDEBUG_INSN_P (insn))
|
3209 |
|
|
{
|
3210 |
|
|
/* Emit queued up notes before the first instruction of a bundle. */
|
3211 |
|
|
if (GET_MODE (insn) == TImode)
|
3212 |
|
|
{
|
3213 |
|
|
while (queue)
|
3214 |
|
|
{
|
3215 |
|
|
rtx next_queue = PREV_INSN (queue);
|
3216 |
|
|
NEXT_INSN (PREV_INSN(insn)) = queue;
|
3217 |
|
|
PREV_INSN (queue) = PREV_INSN(insn);
|
3218 |
|
|
PREV_INSN (insn) = queue;
|
3219 |
|
|
NEXT_INSN (queue) = insn;
|
3220 |
|
|
queue = next_queue;
|
3221 |
|
|
}
|
3222 |
|
|
}
|
3223 |
|
|
}
|
3224 |
|
|
else if (NOTE_P (insn))
|
3225 |
|
|
{
|
3226 |
|
|
rtx prev = PREV_INSN (insn);
|
3227 |
|
|
PREV_INSN (next) = prev;
|
3228 |
|
|
NEXT_INSN (prev) = next;
|
3229 |
|
|
/* Ignore call_arg notes. They are expected to be just after the
|
3230 |
|
|
call insn. If the call is start of a long VLIW, labels are
|
3231 |
|
|
emitted in the middle of a VLIW, which our assembler can not
|
3232 |
|
|
handle. */
|
3233 |
|
|
if (NOTE_KIND (insn) != NOTE_INSN_CALL_ARG_LOCATION)
|
3234 |
|
|
{
|
3235 |
|
|
PREV_INSN (insn) = queue;
|
3236 |
|
|
queue = insn;
|
3237 |
|
|
}
|
3238 |
|
|
}
|
3239 |
|
|
}
|
3240 |
|
|
/* Make sure we are not dropping debug instructions.*/
|
3241 |
|
|
gcc_assert (queue == NULL_RTX);
|
3242 |
|
|
}
|
3243 |
|
|
}
|
3244 |
|
|
|
3245 |
|
|
/* Perform machine dependent operations on the rtl chain INSNS. */
|
3246 |
|
|
void
|
3247 |
|
|
picochip_reorg (void)
|
3248 |
|
|
{
|
3249 |
|
|
rtx insn, insn1, vliw_start = NULL_RTX;
|
3250 |
|
|
int vliw_insn_location = 0;
|
3251 |
|
|
|
3252 |
|
|
/* We are freeing block_for_insn in the toplev to keep compatibility
|
3253 |
|
|
with old MDEP_REORGS that are not CFG based. Recompute it now. */
|
3254 |
|
|
compute_bb_for_insn ();
|
3255 |
|
|
|
3256 |
|
|
if (optimize == 0)
|
3257 |
|
|
split_all_insns ();
|
3258 |
|
|
|
3259 |
|
|
if (picochip_schedule_type != DFA_TYPE_NONE)
|
3260 |
|
|
{
|
3261 |
|
|
timevar_push (TV_SCHED2);
|
3262 |
|
|
|
3263 |
|
|
/* Process the instruction list, computing the sizes of each
|
3264 |
|
|
instruction, and consequently branch distances. This can
|
3265 |
|
|
result in some branches becoming short enough to be treated
|
3266 |
|
|
as a real branch instruction, rather than an assembly branch
|
3267 |
|
|
macro which may expand into multiple instructions. The
|
3268 |
|
|
benefit of shortening branches is that real branch
|
3269 |
|
|
instructions can be properly DFA scheduled, whereas macro
|
3270 |
|
|
branches cannot. */
|
3271 |
|
|
shorten_branches (get_insns ());
|
3272 |
|
|
|
3273 |
|
|
/* Do control and data sched analysis again,
|
3274 |
|
|
and write some more of the results to dump file. */
|
3275 |
|
|
|
3276 |
|
|
split_all_insns ();
|
3277 |
|
|
|
3278 |
|
|
schedule_ebbs ();
|
3279 |
|
|
|
3280 |
|
|
timevar_pop (TV_SCHED2);
|
3281 |
|
|
|
3282 |
|
|
ggc_collect ();
|
3283 |
|
|
|
3284 |
|
|
if (picochip_schedule_type == DFA_TYPE_SPEED)
|
3285 |
|
|
{
|
3286 |
|
|
/* Whenever a VLIW packet is generated, all instructions in
|
3287 |
|
|
that packet must appear to come from the same source
|
3288 |
|
|
location. The following code finds all the VLIW packets,
|
3289 |
|
|
and tags their instructions with the location of the first
|
3290 |
|
|
instruction from the packet. Clearly this will result in
|
3291 |
|
|
strange behaviour when debugging the code, but since
|
3292 |
|
|
debugging and optimisation are being used in conjunction,
|
3293 |
|
|
strange behaviour is certain to occur anyway. */
|
3294 |
|
|
/* Slight bit of change. If the vliw set contains a branch
|
3295 |
|
|
or call instruction, we pick its location.*/
|
3296 |
|
|
for (insn = get_insns (); insn; insn = next_real_insn (insn))
|
3297 |
|
|
{
|
3298 |
|
|
|
3299 |
|
|
/* If this is the first instruction in the VLIW packet,
|
3300 |
|
|
extract its location. */
|
3301 |
|
|
if (GET_MODE (insn) == TImode)
|
3302 |
|
|
{
|
3303 |
|
|
vliw_start = insn;
|
3304 |
|
|
vliw_insn_location = INSN_LOCATOR (insn);
|
3305 |
|
|
}
|
3306 |
|
|
if (JUMP_P (insn) || CALL_P(insn))
|
3307 |
|
|
{
|
3308 |
|
|
vliw_insn_location = INSN_LOCATOR (insn);
|
3309 |
|
|
for (insn1 = vliw_start; insn1 != insn ; insn1 = next_real_insn (insn1))
|
3310 |
|
|
INSN_LOCATOR (insn1) = vliw_insn_location;
|
3311 |
|
|
}
|
3312 |
|
|
/* Tag subsequent instructions with the same location. */
|
3313 |
|
|
INSN_LOCATOR (insn) = vliw_insn_location;
|
3314 |
|
|
}
|
3315 |
|
|
}
|
3316 |
|
|
|
3317 |
|
|
}
|
3318 |
|
|
|
3319 |
|
|
/* Locate the note marking the end of the function's prologue. If
|
3320 |
|
|
the note appears in the middle of a VLIW packet, move the note to
|
3321 |
|
|
the end. This avoids unpleasant consequences such as trying to
|
3322 |
|
|
emit prologue markers (e.g., .loc/.file directives) in the middle
|
3323 |
|
|
of VLIW packets. */
|
3324 |
|
|
if (picochip_schedule_type == DFA_TYPE_SPEED)
|
3325 |
|
|
{
|
3326 |
|
|
rtx prologue_end_note = NULL;
|
3327 |
|
|
rtx last_insn_in_packet = NULL;
|
3328 |
|
|
|
3329 |
|
|
for (insn = get_insns (); insn; insn = next_insn (insn))
|
3330 |
|
|
{
|
3331 |
|
|
/* The prologue end must be moved to the end of the VLIW packet. */
|
3332 |
|
|
if (NOTE_P (insn) && NOTE_KIND (insn) == NOTE_INSN_PROLOGUE_END)
|
3333 |
|
|
{
|
3334 |
|
|
prologue_end_note = insn;
|
3335 |
|
|
break;
|
3336 |
|
|
}
|
3337 |
|
|
}
|
3338 |
|
|
|
3339 |
|
|
/* Find the last instruction in this packet. */
|
3340 |
|
|
for (insn = prologue_end_note; insn; insn = next_real_insn (insn))
|
3341 |
|
|
{
|
3342 |
|
|
if (GET_MODE (insn) == TImode)
|
3343 |
|
|
break;
|
3344 |
|
|
else
|
3345 |
|
|
last_insn_in_packet = insn;
|
3346 |
|
|
}
|
3347 |
|
|
|
3348 |
|
|
if (last_insn_in_packet != NULL)
|
3349 |
|
|
{
|
3350 |
|
|
rtx tmp_note
|
3351 |
|
|
= emit_note_after ((enum insn_note) NOTE_KIND (prologue_end_note),
|
3352 |
|
|
last_insn_in_packet);
|
3353 |
|
|
memcpy(&NOTE_DATA (tmp_note), &NOTE_DATA(prologue_end_note), sizeof(NOTE_DATA(prologue_end_note)));
|
3354 |
|
|
delete_insn (prologue_end_note);
|
3355 |
|
|
}
|
3356 |
|
|
}
|
3357 |
|
|
|
3358 |
|
|
if (flag_var_tracking)
|
3359 |
|
|
{
|
3360 |
|
|
timevar_push (TV_VAR_TRACKING);
|
3361 |
|
|
variable_tracking_main ();
|
3362 |
|
|
/* We also have to deal with variable tracking notes in the
|
3363 |
|
|
middle of VLIW packets. */
|
3364 |
|
|
reorder_var_tracking_notes();
|
3365 |
|
|
timevar_pop (TV_VAR_TRACKING);
|
3366 |
|
|
}
|
3367 |
|
|
}
|
3368 |
|
|
|
3369 |
|
|
/* Return the ALU character identifier for the current
|
3370 |
|
|
instruction. This will be 0 or 1. */
|
3371 |
|
|
static char
|
3372 |
|
|
picochip_get_vliw_alu_id (void)
|
3373 |
|
|
{
|
3374 |
|
|
int attr_type = 0;
|
3375 |
|
|
|
3376 |
|
|
/* Always use ALU 0 if VLIW scheduling is disabled. */
|
3377 |
|
|
if (picochip_schedule_type != DFA_TYPE_SPEED)
|
3378 |
|
|
return '0';
|
3379 |
|
|
|
3380 |
|
|
/* Get the attribute type of the instruction. Note that this can
|
3381 |
|
|
ruin the contents of recog_data, so save/restore around the
|
3382 |
|
|
call. */
|
3383 |
|
|
picochip_save_recog_data ();
|
3384 |
|
|
attr_type = get_attr_type (picochip_current_prescan_insn);
|
3385 |
|
|
picochip_restore_recog_data ();
|
3386 |
|
|
|
3387 |
|
|
if (picochip_current_vliw_state.contains_pico_alu_insn)
|
3388 |
|
|
{
|
3389 |
|
|
|
3390 |
|
|
/* If this a picoAlu insn? If it is, then stuff it into ALU 0,
|
3391 |
|
|
else it must be the other ALU (either basic or nonCc)
|
3392 |
|
|
instruction which goes into 1. */
|
3393 |
|
|
if (attr_type == TYPE_PICOALU)
|
3394 |
|
|
return '0';
|
3395 |
|
|
else
|
3396 |
|
|
return '1';
|
3397 |
|
|
|
3398 |
|
|
}
|
3399 |
|
|
else if (picochip_current_vliw_state.contains_non_cc_alu_insn)
|
3400 |
|
|
{
|
3401 |
|
|
/* Is this the non CC instruction? If it is, then stuff it into
|
3402 |
|
|
ALU 1, else it must be a picoAlu or basicAlu, in which case
|
3403 |
|
|
it goes into ALU 0. */
|
3404 |
|
|
if (attr_type == TYPE_NONCCALU)
|
3405 |
|
|
return '1';
|
3406 |
|
|
else
|
3407 |
|
|
return '0';
|
3408 |
|
|
}
|
3409 |
|
|
else
|
3410 |
|
|
{
|
3411 |
|
|
/* No picoAlu/nonCc instructions in use, so purely dependent upon
|
3412 |
|
|
whether an ALU instruction has already been scheduled in this
|
3413 |
|
|
cycle. */
|
3414 |
|
|
switch (picochip_current_vliw_state.num_alu_insns_so_far)
|
3415 |
|
|
{
|
3416 |
|
|
case 0:
|
3417 |
|
|
picochip_current_vliw_state.num_alu_insns_so_far++;
|
3418 |
|
|
return '0';
|
3419 |
|
|
|
3420 |
|
|
case 1:
|
3421 |
|
|
picochip_current_vliw_state.num_alu_insns_so_far++;
|
3422 |
|
|
return '1';
|
3423 |
|
|
|
3424 |
|
|
default:
|
3425 |
|
|
internal_error ("too many ALU instructions emitted (%d)",
|
3426 |
|
|
picochip_current_vliw_state.num_alu_insns_so_far);
|
3427 |
|
|
return 'X';
|
3428 |
|
|
}
|
3429 |
|
|
}
|
3430 |
|
|
|
3431 |
|
|
}
|
3432 |
|
|
|
3433 |
|
|
/* Reset any information about the current VLIW packing status. */
|
3434 |
|
|
static void
|
3435 |
|
|
picochip_reset_vliw (rtx insn)
|
3436 |
|
|
{
|
3437 |
|
|
rtx local_insn = insn;
|
3438 |
|
|
|
3439 |
|
|
/* Nothing to do if VLIW scheduling isn't being used. */
|
3440 |
|
|
if (picochip_schedule_type != DFA_TYPE_SPEED)
|
3441 |
|
|
return;
|
3442 |
|
|
|
3443 |
|
|
if (TARGET_DEBUG)
|
3444 |
|
|
printf ("%s on insn %d\n", __FUNCTION__, INSN_UID (insn));
|
3445 |
|
|
|
3446 |
|
|
/* Reset. */
|
3447 |
|
|
picochip_current_vliw_state.contains_pico_alu_insn = 0;
|
3448 |
|
|
picochip_current_vliw_state.contains_non_cc_alu_insn = 0;
|
3449 |
|
|
picochip_current_vliw_state.num_alu_insns_so_far = 0;
|
3450 |
|
|
picochip_current_vliw_state.num_cfi_labels_deferred = 0;
|
3451 |
|
|
picochip_current_vliw_state.lm_label_name[0] = 0;
|
3452 |
|
|
picochip_current_vliw_state.num_insns_in_packet = 0;
|
3453 |
|
|
|
3454 |
|
|
/* Read through the VLIW packet, classifying the instructions where
|
3455 |
|
|
appropriate. */
|
3456 |
|
|
local_insn = insn;
|
3457 |
|
|
do
|
3458 |
|
|
{
|
3459 |
|
|
if (NOTE_P (local_insn) || DEBUG_INSN_P(local_insn))
|
3460 |
|
|
{
|
3461 |
|
|
local_insn = NEXT_INSN (local_insn);
|
3462 |
|
|
continue;
|
3463 |
|
|
}
|
3464 |
|
|
else if (!INSN_P (local_insn))
|
3465 |
|
|
break;
|
3466 |
|
|
else
|
3467 |
|
|
{
|
3468 |
|
|
/* It is an instruction, but is it ours? */
|
3469 |
|
|
if (INSN_CODE (local_insn) != -1)
|
3470 |
|
|
{
|
3471 |
|
|
int attr_type = 0;
|
3472 |
|
|
|
3473 |
|
|
picochip_current_vliw_state.num_insns_in_packet += 1;
|
3474 |
|
|
|
3475 |
|
|
/* Is it a picoAlu or nonCcAlu instruction? Note that the
|
3476 |
|
|
get_attr_type function can overwrite the values in
|
3477 |
|
|
the recog_data global, hence this is saved and
|
3478 |
|
|
restored around the call. Not doing so results in
|
3479 |
|
|
asm_output_opcode being called with a different
|
3480 |
|
|
instruction to final_prescan_insn, which is fatal. */
|
3481 |
|
|
picochip_save_recog_data ();
|
3482 |
|
|
attr_type = get_attr_type (local_insn);
|
3483 |
|
|
picochip_restore_recog_data ();
|
3484 |
|
|
|
3485 |
|
|
if (attr_type == TYPE_PICOALU)
|
3486 |
|
|
picochip_current_vliw_state.contains_pico_alu_insn = 1;
|
3487 |
|
|
if (attr_type == TYPE_NONCCALU)
|
3488 |
|
|
picochip_current_vliw_state.contains_non_cc_alu_insn = 1;
|
3489 |
|
|
|
3490 |
|
|
}
|
3491 |
|
|
}
|
3492 |
|
|
|
3493 |
|
|
/* Get the next instruction. */
|
3494 |
|
|
local_insn = NEXT_INSN (local_insn);
|
3495 |
|
|
|
3496 |
|
|
/* Keep going while the next instruction is part of the same
|
3497 |
|
|
VLIW packet (i.e., its a valid instruction and doesn't mark
|
3498 |
|
|
the start of a new VLIW packet. */
|
3499 |
|
|
}
|
3500 |
|
|
while (local_insn &&
|
3501 |
|
|
(GET_MODE (local_insn) != TImode) && (INSN_CODE (local_insn) != -1));
|
3502 |
|
|
|
3503 |
|
|
}
|
3504 |
|
|
|
3505 |
|
|
int
|
3506 |
|
|
picochip_sched_reorder (FILE * file, int verbose,
|
3507 |
|
|
rtx * ready ATTRIBUTE_UNUSED,
|
3508 |
|
|
int *n_readyp ATTRIBUTE_UNUSED, int clock)
|
3509 |
|
|
{
|
3510 |
|
|
|
3511 |
|
|
if (verbose > 0)
|
3512 |
|
|
fprintf (file, ";;\tClock %d\n", clock);
|
3513 |
|
|
|
3514 |
|
|
return picochip_sched_issue_rate ();
|
3515 |
|
|
|
3516 |
|
|
}
|
3517 |
|
|
|
3518 |
|
|
int
|
3519 |
|
|
picochip_sched_lookahead (void)
|
3520 |
|
|
{
|
3521 |
|
|
/* It should always be enough to lookahead by 2 insns. Only slot0/1 could
|
3522 |
|
|
have a conflict. */
|
3523 |
|
|
return 2;
|
3524 |
|
|
}
|
3525 |
|
|
|
3526 |
|
|
int
|
3527 |
|
|
picochip_sched_issue_rate (void)
|
3528 |
|
|
{
|
3529 |
|
|
return 3;
|
3530 |
|
|
}
|
3531 |
|
|
|
3532 |
|
|
/* Adjust the scheduling cost between the two given instructions,
|
3533 |
|
|
which have the given dependency. */
|
3534 |
|
|
int
|
3535 |
|
|
picochip_sched_adjust_cost (rtx insn, rtx link, rtx dep_insn, int cost)
|
3536 |
|
|
{
|
3537 |
|
|
|
3538 |
|
|
if (TARGET_DEBUG)
|
3539 |
|
|
{
|
3540 |
|
|
printf ("Sched Adjust Cost: %d->%d is %d\n",
|
3541 |
|
|
INSN_UID (insn), INSN_UID (dep_insn), cost);
|
3542 |
|
|
|
3543 |
|
|
printf (" Dependency type:");
|
3544 |
|
|
switch (REG_NOTE_KIND (link))
|
3545 |
|
|
{
|
3546 |
|
|
case 0:
|
3547 |
|
|
printf ("Data\n");
|
3548 |
|
|
break;
|
3549 |
|
|
case REG_DEP_ANTI:
|
3550 |
|
|
printf ("ANTI\n");
|
3551 |
|
|
break;
|
3552 |
|
|
case REG_DEP_OUTPUT:
|
3553 |
|
|
printf ("OUTPUT\n");
|
3554 |
|
|
break;
|
3555 |
|
|
default:
|
3556 |
|
|
printf ("Unknown (%d)\n", REG_NOTE_KIND (link));
|
3557 |
|
|
}
|
3558 |
|
|
}
|
3559 |
|
|
|
3560 |
|
|
/* Anti-dependencies are used to enforce the ordering between a
|
3561 |
|
|
* branch, and any subsequent instructions. For example:
|
3562 |
|
|
*
|
3563 |
|
|
* BNE someLabel
|
3564 |
|
|
* ADD.0 r0,r1,r2
|
3565 |
|
|
*
|
3566 |
|
|
* The ADD instruction must execute after the branch, and this is
|
3567 |
|
|
* enforced using an anti-dependency. Unfortunately, VLIW machines
|
3568 |
|
|
* are happy to execute anti-dependent instructions in the same
|
3569 |
|
|
* cycle, which then results in a schedule like the following being
|
3570 |
|
|
* created:
|
3571 |
|
|
*
|
3572 |
|
|
* BNE someLabel \ ADD.0 r0,r1,r2
|
3573 |
|
|
*
|
3574 |
|
|
* The instruction which would normally be conditionally executed
|
3575 |
|
|
* depending upon the outcome of the branch, is now unconditionally
|
3576 |
|
|
* executed every time. To prevent this happening, any
|
3577 |
|
|
* anti-dependencies between a branch and another instruction are
|
3578 |
|
|
* promoted to become real dependencies.
|
3579 |
|
|
*/
|
3580 |
|
|
if ((JUMP_P (dep_insn) || CALL_P(dep_insn)) && REG_NOTE_KIND (link) == REG_DEP_ANTI)
|
3581 |
|
|
{
|
3582 |
|
|
|
3583 |
|
|
if (TARGET_DEBUG)
|
3584 |
|
|
printf ("Promoting anti-dependency %d->%d to a true-dependency\n",
|
3585 |
|
|
INSN_UID (insn), INSN_UID (dep_insn));
|
3586 |
|
|
|
3587 |
|
|
return 1;
|
3588 |
|
|
}
|
3589 |
|
|
|
3590 |
|
|
return cost;
|
3591 |
|
|
|
3592 |
|
|
}
|
3593 |
|
|
|
3594 |
|
|
/* Return the minimum of the two values */
|
3595 |
|
|
static int
|
3596 |
|
|
minimum (int a, int b)
|
3597 |
|
|
{
|
3598 |
|
|
if (a < b)
|
3599 |
|
|
return a;
|
3600 |
|
|
if (b < a)
|
3601 |
|
|
return b;
|
3602 |
|
|
/* I dont expect to get to this function with a==b.*/
|
3603 |
|
|
gcc_unreachable();
|
3604 |
|
|
}
|
3605 |
|
|
|
3606 |
|
|
|
3607 |
|
|
/* This function checks if the memory of the two stores are just off by 2 bytes.
|
3608 |
|
|
It returns the lower memory operand's index.*/
|
3609 |
|
|
|
3610 |
|
|
static int
|
3611 |
|
|
memory_just_off (rtx opnd1, rtx opnd2)
|
3612 |
|
|
{
|
3613 |
|
|
int offset1 = 0, offset2 = 0;
|
3614 |
|
|
int reg1, reg2;
|
3615 |
|
|
|
3616 |
|
|
if (GET_CODE(XEXP(opnd1, 0)) == PLUS && GET_CODE(XEXP(XEXP(opnd1, 0),1)) == CONST_INT)
|
3617 |
|
|
{
|
3618 |
|
|
offset1 = INTVAL(XEXP(XEXP(opnd1, 0), 1));
|
3619 |
|
|
reg1 = REGNO(XEXP(XEXP(opnd1, 0), 0));
|
3620 |
|
|
}
|
3621 |
|
|
else
|
3622 |
|
|
{
|
3623 |
|
|
reg1 = REGNO(XEXP(opnd1, 0));
|
3624 |
|
|
}
|
3625 |
|
|
if (GET_CODE(XEXP(opnd2, 0)) == PLUS && GET_CODE(XEXP(XEXP(opnd2, 0), 1)) == CONST_INT)
|
3626 |
|
|
{
|
3627 |
|
|
offset2 = INTVAL(XEXP(XEXP(opnd2, 0), 1));
|
3628 |
|
|
reg2 = REGNO(XEXP(XEXP(opnd2, 0), 0));
|
3629 |
|
|
}
|
3630 |
|
|
else
|
3631 |
|
|
{
|
3632 |
|
|
reg2 = REGNO(XEXP(opnd2, 0));
|
3633 |
|
|
}
|
3634 |
|
|
|
3635 |
|
|
/* Peepholing 2 STW/LDWs has the restriction that the resulting STL/LDL's address
|
3636 |
|
|
should be 4 byte aligned. We can currently guarentee that only if the base
|
3637 |
|
|
address is FP(R13) and the offset is aligned. */
|
3638 |
|
|
|
3639 |
|
|
if (reg1 == reg2 && reg1 == 13 && abs(offset1-offset2) == 2 && minimum(offset1, offset2) % 4 == 0)
|
3640 |
|
|
return (minimum(offset1, offset2) == offset1) ? 1:2;
|
3641 |
|
|
|
3642 |
|
|
return 0;
|
3643 |
|
|
}
|
3644 |
|
|
|
3645 |
|
|
static int
|
3646 |
|
|
registers_just_off (rtx opnd1, rtx opnd2)
|
3647 |
|
|
{
|
3648 |
|
|
int reg1, reg2;
|
3649 |
|
|
reg1 = REGNO(opnd1);
|
3650 |
|
|
reg2 = REGNO(opnd2);
|
3651 |
|
|
if (abs(reg1-reg2) == 1 && minimum(reg1, reg2) % 2 == 0)
|
3652 |
|
|
return (minimum(reg1, reg2) == reg1)?1:2;
|
3653 |
|
|
return 0;
|
3654 |
|
|
}
|
3655 |
|
|
|
3656 |
|
|
/* Check to see if the two LDWs can be peepholed together into a LDL
|
3657 |
|
|
They can be if the registers getting loaded into are contiguous
|
3658 |
|
|
and the memory addresses are contiguous as well.
|
3659 |
|
|
for eg.
|
3660 |
|
|
LDW r2,[r11]x
|
3661 |
|
|
LDW r3,[r11]x+1
|
3662 |
|
|
can be merged together into
|
3663 |
|
|
LDL r[3:2],[r11]
|
3664 |
|
|
|
3665 |
|
|
NOTE:
|
3666 |
|
|
1. The LDWs themselves only guarentee that r11 will be a 2-byte
|
3667 |
|
|
aligned address. Only FP can be assumed to be 4 byte aligned.
|
3668 |
|
|
2. The progression of addresses and the register numbers should
|
3669 |
|
|
be similar. For eg., if you swap r2 and r3 in the above instructions,
|
3670 |
|
|
the resultant pair cannot be merged.
|
3671 |
|
|
|
3672 |
|
|
*/
|
3673 |
|
|
bool
|
3674 |
|
|
ok_to_peephole_ldw(rtx opnd0, rtx opnd1, rtx opnd2, rtx opnd3)
|
3675 |
|
|
{
|
3676 |
|
|
int memtest=0,regtest=0;
|
3677 |
|
|
regtest = registers_just_off(opnd1,opnd3);
|
3678 |
|
|
if (regtest == 0)
|
3679 |
|
|
return false;
|
3680 |
|
|
|
3681 |
|
|
memtest = memory_just_off(opnd0,opnd2);
|
3682 |
|
|
if (memtest == 0)
|
3683 |
|
|
return false;
|
3684 |
|
|
|
3685 |
|
|
if (regtest == memtest)
|
3686 |
|
|
{
|
3687 |
|
|
return true;
|
3688 |
|
|
}
|
3689 |
|
|
return false;
|
3690 |
|
|
}
|
3691 |
|
|
|
3692 |
|
|
/* Similar to LDW peephole */
|
3693 |
|
|
bool
|
3694 |
|
|
ok_to_peephole_stw(rtx opnd0, rtx opnd1, rtx opnd2, rtx opnd3)
|
3695 |
|
|
{
|
3696 |
|
|
int memtest=0,regtest=0;
|
3697 |
|
|
regtest = registers_just_off(opnd1,opnd3);
|
3698 |
|
|
if (regtest == 0)
|
3699 |
|
|
return false;
|
3700 |
|
|
|
3701 |
|
|
memtest = memory_just_off(opnd0,opnd2);
|
3702 |
|
|
if (memtest == 0)
|
3703 |
|
|
return false;
|
3704 |
|
|
|
3705 |
|
|
if (regtest == memtest)
|
3706 |
|
|
{
|
3707 |
|
|
return true;
|
3708 |
|
|
}
|
3709 |
|
|
return false;
|
3710 |
|
|
}
|
3711 |
|
|
|
3712 |
|
|
|
3713 |
|
|
/* Generate a SImode register with the register number that is the smaller of the two */
|
3714 |
|
|
rtx
|
3715 |
|
|
gen_min_reg(rtx opnd1,rtx opnd2)
|
3716 |
|
|
{
|
3717 |
|
|
return gen_rtx_REG (SImode, minimum(REGNO(opnd1),REGNO(opnd2)));
|
3718 |
|
|
}
|
3719 |
|
|
|
3720 |
|
|
/* Generate a SImode memory with the address that is the smaller of the two */
|
3721 |
|
|
rtx
|
3722 |
|
|
gen_SImode_mem(rtx opnd1,rtx opnd2)
|
3723 |
|
|
{
|
3724 |
|
|
int offset1=0,offset2=0;
|
3725 |
|
|
rtx reg;
|
3726 |
|
|
rtx address;
|
3727 |
|
|
if (GET_CODE(XEXP(opnd1,0)) == PLUS && GET_CODE(XEXP(XEXP(opnd1,0),1)) == CONST_INT)
|
3728 |
|
|
{
|
3729 |
|
|
offset1 = INTVAL(XEXP(XEXP(opnd1,0),1));
|
3730 |
|
|
reg = XEXP(XEXP(opnd1,0),0);
|
3731 |
|
|
}
|
3732 |
|
|
else
|
3733 |
|
|
{
|
3734 |
|
|
reg = XEXP(opnd1,0);
|
3735 |
|
|
}
|
3736 |
|
|
if (GET_CODE(XEXP(opnd2,0)) == PLUS && GET_CODE(XEXP(XEXP(opnd2,0),1)) == CONST_INT)
|
3737 |
|
|
{
|
3738 |
|
|
offset2 = INTVAL(XEXP(XEXP(opnd2,0),1));
|
3739 |
|
|
}
|
3740 |
|
|
address = gen_rtx_PLUS (HImode, reg, GEN_INT(minimum(offset1,offset2)));
|
3741 |
|
|
return gen_rtx_MEM(SImode,address);
|
3742 |
|
|
}
|
3743 |
|
|
|
3744 |
|
|
bool
|
3745 |
|
|
picochip_rtx_costs (rtx x, int code, int outer_code ATTRIBUTE_UNUSED,
|
3746 |
|
|
int opno ATTRIBUTE_UNUSED, int* total, bool speed)
|
3747 |
|
|
{
|
3748 |
|
|
|
3749 |
|
|
int localTotal = 0;
|
3750 |
|
|
|
3751 |
|
|
if (!speed)
|
3752 |
|
|
{
|
3753 |
|
|
/* Need to penalize immediates that need to be encoded as long constants.*/
|
3754 |
|
|
if (code == CONST_INT && !(INTVAL (x) >= 0 && INTVAL (x) < 16))
|
3755 |
|
|
{
|
3756 |
|
|
*total = COSTS_N_INSNS(1);
|
3757 |
|
|
return true;
|
3758 |
|
|
}
|
3759 |
|
|
}
|
3760 |
|
|
switch (code)
|
3761 |
|
|
{
|
3762 |
|
|
case SYMBOL_REF:
|
3763 |
|
|
case LABEL_REF:
|
3764 |
|
|
*total = COSTS_N_INSNS (outer_code != MEM);
|
3765 |
|
|
return true;
|
3766 |
|
|
break;
|
3767 |
|
|
|
3768 |
|
|
case IF_THEN_ELSE:
|
3769 |
|
|
/* if_then_else come out of cbranch instructions. It will get split into
|
3770 |
|
|
a condition code generating subtraction and a branch */
|
3771 |
|
|
*total = COSTS_N_INSNS (2);
|
3772 |
|
|
return true;
|
3773 |
|
|
break;
|
3774 |
|
|
|
3775 |
|
|
case AND:
|
3776 |
|
|
case IOR:
|
3777 |
|
|
case XOR:
|
3778 |
|
|
if (GET_MODE(x) == SImode)
|
3779 |
|
|
*total = COSTS_N_INSNS (2);
|
3780 |
|
|
if (GET_MODE(x) == DImode)
|
3781 |
|
|
*total = COSTS_N_INSNS (4);
|
3782 |
|
|
return false;
|
3783 |
|
|
|
3784 |
|
|
case MEM:
|
3785 |
|
|
/* Byte Memory access on a NO_BYTE_ACCESS machine would be expensive */
|
3786 |
|
|
if (GET_MODE(x) == QImode && !TARGET_HAS_BYTE_ACCESS)
|
3787 |
|
|
*total = COSTS_N_INSNS (10);
|
3788 |
|
|
|
3789 |
|
|
/* 64-bit accesses have to be done through 2 32-bit access */
|
3790 |
|
|
if (GET_MODE(x) == DImode)
|
3791 |
|
|
*total = COSTS_N_INSNS (2);
|
3792 |
|
|
return false;
|
3793 |
|
|
break;
|
3794 |
|
|
|
3795 |
|
|
case ASHIFTRT:
|
3796 |
|
|
|
3797 |
|
|
/* SImode shifts are expensive */
|
3798 |
|
|
if (GET_MODE(x) == SImode)
|
3799 |
|
|
*total = COSTS_N_INSNS (10);
|
3800 |
|
|
|
3801 |
|
|
/* Register shift by constant is cheap. */
|
3802 |
|
|
if ((GET_MODE(x) == QImode || GET_MODE(x) == HImode)
|
3803 |
|
|
&& GET_CODE(XEXP(x, 0)) == REG
|
3804 |
|
|
&& GET_CODE(XEXP(x, 1)) == CONST_INT)
|
3805 |
|
|
*total = COSTS_N_INSNS (1);
|
3806 |
|
|
else
|
3807 |
|
|
*total = COSTS_N_INSNS (4);
|
3808 |
|
|
return false;
|
3809 |
|
|
break;
|
3810 |
|
|
|
3811 |
|
|
case DIV:
|
3812 |
|
|
case MOD:
|
3813 |
|
|
|
3814 |
|
|
/* Divisions are more expensive than the default 7*/
|
3815 |
|
|
if (GET_MODE(x) == SImode)
|
3816 |
|
|
*total = COSTS_N_INSNS (20);
|
3817 |
|
|
else
|
3818 |
|
|
*total = COSTS_N_INSNS (12);
|
3819 |
|
|
return false;
|
3820 |
|
|
break;
|
3821 |
|
|
|
3822 |
|
|
case MULT:
|
3823 |
|
|
/* Look for the simple cases of multiplying register*register or
|
3824 |
|
|
register*constant. */
|
3825 |
|
|
if ((GET_MODE(x) == QImode || GET_MODE(x) == HImode)
|
3826 |
|
|
&& ((GET_CODE(XEXP(x, 0)) == REG
|
3827 |
|
|
&& (GET_CODE(XEXP(x, 1)) == REG || GET_CODE(XEXP(x,1)) == CONST_INT))
|
3828 |
|
|
|| (GET_CODE(XEXP(x, 0)) == ZERO_EXTEND
|
3829 |
|
|
&& GET_CODE(XEXP(XEXP(x, 0),0)) == REG
|
3830 |
|
|
&& GET_CODE(XEXP(x, 1)) == ZERO_EXTEND
|
3831 |
|
|
&& GET_CODE(XEXP(XEXP(x, 1),0)) == REG)))
|
3832 |
|
|
{
|
3833 |
|
|
|
3834 |
|
|
/* When optimising for size, multiplication by constant
|
3835 |
|
|
should be discouraged slightly over multiplication by a
|
3836 |
|
|
register. */
|
3837 |
|
|
if (picochip_has_mac_unit)
|
3838 |
|
|
{
|
3839 |
|
|
/* Single cycle multiplication, but the result must be
|
3840 |
|
|
loaded back into a general register afterwards. */
|
3841 |
|
|
*total = COSTS_N_INSNS(2);
|
3842 |
|
|
return true;
|
3843 |
|
|
}
|
3844 |
|
|
else if (picochip_has_mul_unit)
|
3845 |
|
|
{
|
3846 |
|
|
/* Single cycle multiplication. */
|
3847 |
|
|
*total = COSTS_N_INSNS(1);
|
3848 |
|
|
return true;
|
3849 |
|
|
}
|
3850 |
|
|
/* Else no multiply available. Use default cost. */
|
3851 |
|
|
|
3852 |
|
|
}
|
3853 |
|
|
break;
|
3854 |
|
|
|
3855 |
|
|
default:
|
3856 |
|
|
/* Do nothing. */
|
3857 |
|
|
break;
|
3858 |
|
|
}
|
3859 |
|
|
|
3860 |
|
|
if (localTotal != 0)
|
3861 |
|
|
{
|
3862 |
|
|
*total = localTotal;
|
3863 |
|
|
return true;
|
3864 |
|
|
}
|
3865 |
|
|
else
|
3866 |
|
|
{
|
3867 |
|
|
return false;
|
3868 |
|
|
}
|
3869 |
|
|
|
3870 |
|
|
}
|
3871 |
|
|
|
3872 |
|
|
void
|
3873 |
|
|
picochip_final_prescan_insn (rtx insn, rtx * opvec ATTRIBUTE_UNUSED,
|
3874 |
|
|
int num_operands ATTRIBUTE_UNUSED)
|
3875 |
|
|
{
|
3876 |
|
|
rtx local_insn;
|
3877 |
|
|
|
3878 |
|
|
picochip_current_prescan_insn = insn;
|
3879 |
|
|
|
3880 |
|
|
if (TARGET_DEBUG)
|
3881 |
|
|
printf ("Final prescan on INSN %d with mode %s\n",
|
3882 |
|
|
INSN_UID (insn), GET_MODE_NAME (GET_MODE (insn)));
|
3883 |
|
|
|
3884 |
|
|
/* If this is the start of a new instruction cycle, or no scheduling
|
3885 |
|
|
is used, then reset the VLIW status. */
|
3886 |
|
|
if (GET_MODE (insn) == TImode || !picochip_schedule_type == DFA_TYPE_SPEED)
|
3887 |
|
|
picochip_reset_vliw (insn);
|
3888 |
|
|
|
3889 |
|
|
/* No VLIW scheduling occured, so don't go any further. */
|
3890 |
|
|
if (picochip_schedule_type != DFA_TYPE_SPEED)
|
3891 |
|
|
return;
|
3892 |
|
|
|
3893 |
|
|
/* Look for the next printable instruction. This loop terminates on
|
3894 |
|
|
any recognisable instruction, and on any unrecognisable
|
3895 |
|
|
instruction with TImode. */
|
3896 |
|
|
local_insn = insn;
|
3897 |
|
|
for (local_insn = NEXT_INSN (local_insn); local_insn;
|
3898 |
|
|
local_insn = NEXT_INSN (local_insn))
|
3899 |
|
|
{
|
3900 |
|
|
if (NOTE_P (local_insn) || DEBUG_INSN_P(local_insn))
|
3901 |
|
|
continue;
|
3902 |
|
|
else if (!INSN_P (local_insn))
|
3903 |
|
|
break;
|
3904 |
|
|
else if (GET_MODE (local_insn) == TImode
|
3905 |
|
|
|| INSN_CODE (local_insn) != -1)
|
3906 |
|
|
break;
|
3907 |
|
|
}
|
3908 |
|
|
|
3909 |
|
|
/* Set the continuation flag if the next instruction can be packed
|
3910 |
|
|
with the current instruction (i.e., the next instruction is
|
3911 |
|
|
valid, and isn't the start of a new cycle). */
|
3912 |
|
|
picochip_vliw_continuation = (local_insn && NONDEBUG_INSN_P (local_insn) &&
|
3913 |
|
|
(GET_MODE (local_insn) != TImode));
|
3914 |
|
|
|
3915 |
|
|
}
|
3916 |
|
|
|
3917 |
|
|
/* Builtin functions. */
|
3918 |
|
|
/* Given a builtin function taking 2 operands (i.e., target + source),
|
3919 |
|
|
emit the RTL for the underlying instruction. */
|
3920 |
|
|
static rtx
|
3921 |
|
|
picochip_expand_builtin_2op (enum insn_code icode, tree call, rtx target)
|
3922 |
|
|
{
|
3923 |
|
|
tree arg0;
|
3924 |
|
|
rtx op0, pat;
|
3925 |
|
|
enum machine_mode tmode, mode0;
|
3926 |
|
|
|
3927 |
|
|
/* Grab the incoming argument and emit its RTL. */
|
3928 |
|
|
arg0 = CALL_EXPR_ARG (call, 0);
|
3929 |
|
|
op0 = expand_expr (arg0, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
3930 |
|
|
|
3931 |
|
|
/* Determine the modes of the instruction operands. */
|
3932 |
|
|
tmode = insn_data[icode].operand[0].mode;
|
3933 |
|
|
mode0 = insn_data[icode].operand[1].mode;
|
3934 |
|
|
|
3935 |
|
|
/* Ensure that the incoming argument RTL is in a register of the
|
3936 |
|
|
correct mode. */
|
3937 |
|
|
if (!(*insn_data[icode].operand[1].predicate) (op0, mode0))
|
3938 |
|
|
op0 = copy_to_mode_reg (mode0, op0);
|
3939 |
|
|
|
3940 |
|
|
/* If there isn't a suitable target, emit a target register. */
|
3941 |
|
|
if (target == 0
|
3942 |
|
|
|| GET_MODE (target) != tmode
|
3943 |
|
|
|| !(*insn_data[icode].operand[0].predicate) (target, tmode))
|
3944 |
|
|
target = gen_reg_rtx (tmode);
|
3945 |
|
|
|
3946 |
|
|
/* Emit and return the new instruction. */
|
3947 |
|
|
pat = GEN_FCN (icode) (target, op0);
|
3948 |
|
|
if (!pat)
|
3949 |
|
|
return 0;
|
3950 |
|
|
emit_insn (pat);
|
3951 |
|
|
|
3952 |
|
|
return target;
|
3953 |
|
|
|
3954 |
|
|
}
|
3955 |
|
|
|
3956 |
|
|
/* Given a builtin function taking 3 operands (i.e., target + two
|
3957 |
|
|
source), emit the RTL for the underlying instruction. */
|
3958 |
|
|
static rtx
|
3959 |
|
|
picochip_expand_builtin_3op (enum insn_code icode, tree call, rtx target)
|
3960 |
|
|
{
|
3961 |
|
|
tree arg0, arg1;
|
3962 |
|
|
rtx op0, op1, pat;
|
3963 |
|
|
enum machine_mode tmode, mode0, mode1;
|
3964 |
|
|
|
3965 |
|
|
/* Grab the function's arguments. */
|
3966 |
|
|
arg0 = CALL_EXPR_ARG (call, 0);
|
3967 |
|
|
arg1 = CALL_EXPR_ARG (call, 1);
|
3968 |
|
|
|
3969 |
|
|
/* Emit rtl sequences for the function arguments. */
|
3970 |
|
|
op0 = expand_expr (arg0, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
3971 |
|
|
op1 = expand_expr (arg1, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
3972 |
|
|
|
3973 |
|
|
/* Get the mode's of each of the instruction operands. */
|
3974 |
|
|
tmode = insn_data[icode].operand[0].mode;
|
3975 |
|
|
mode0 = insn_data[icode].operand[1].mode;
|
3976 |
|
|
mode1 = insn_data[icode].operand[2].mode;
|
3977 |
|
|
|
3978 |
|
|
/* Ensure that each of the function argument rtl sequences are in a
|
3979 |
|
|
register of the correct mode. */
|
3980 |
|
|
if (!(*insn_data[icode].operand[1].predicate) (op0, mode0))
|
3981 |
|
|
op0 = copy_to_mode_reg (mode0, op0);
|
3982 |
|
|
if (!(*insn_data[icode].operand[2].predicate) (op1, mode1))
|
3983 |
|
|
op1 = copy_to_mode_reg (mode1, op1);
|
3984 |
|
|
|
3985 |
|
|
/* If no target has been given, create a register to use as the target. */
|
3986 |
|
|
if (target == 0
|
3987 |
|
|
|| GET_MODE (target) != tmode
|
3988 |
|
|
|| !(*insn_data[icode].operand[0].predicate) (target, tmode))
|
3989 |
|
|
target = gen_reg_rtx (tmode);
|
3990 |
|
|
|
3991 |
|
|
/* Emit and return the new instruction. */
|
3992 |
|
|
pat = GEN_FCN (icode) (target, op0, op1);
|
3993 |
|
|
if (!pat)
|
3994 |
|
|
return 0;
|
3995 |
|
|
emit_insn (pat);
|
3996 |
|
|
|
3997 |
|
|
return target;
|
3998 |
|
|
|
3999 |
|
|
}
|
4000 |
|
|
|
4001 |
|
|
/* Expand a builtin function which takes two arguments, and returns a void. */
|
4002 |
|
|
static rtx
|
4003 |
|
|
picochip_expand_builtin_2opvoid (enum insn_code icode, tree call)
|
4004 |
|
|
{
|
4005 |
|
|
tree arg0, arg1;
|
4006 |
|
|
rtx op0, op1, pat;
|
4007 |
|
|
enum machine_mode mode0, mode1;
|
4008 |
|
|
|
4009 |
|
|
/* Grab the function's arguments. */
|
4010 |
|
|
arg0 = CALL_EXPR_ARG (call, 0);
|
4011 |
|
|
arg1 = CALL_EXPR_ARG (call, 1);
|
4012 |
|
|
|
4013 |
|
|
/* Emit rtl sequences for the function arguments. */
|
4014 |
|
|
op0 = expand_expr (arg0, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4015 |
|
|
op1 = expand_expr (arg1, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4016 |
|
|
|
4017 |
|
|
/* Get the mode's of each of the instruction operands. */
|
4018 |
|
|
mode0 = insn_data[icode].operand[0].mode;
|
4019 |
|
|
mode1 = insn_data[icode].operand[1].mode;
|
4020 |
|
|
|
4021 |
|
|
/* Ensure that each of the function argument rtl sequences are in a
|
4022 |
|
|
register of the correct mode. */
|
4023 |
|
|
if (!(*insn_data[icode].operand[0].predicate) (op0, mode0))
|
4024 |
|
|
op0 = copy_to_mode_reg (mode0, op0);
|
4025 |
|
|
if (!(*insn_data[icode].operand[1].predicate) (op1, mode1))
|
4026 |
|
|
op1 = copy_to_mode_reg (mode1, op1);
|
4027 |
|
|
|
4028 |
|
|
/* Emit and return the new instruction. */
|
4029 |
|
|
pat = GEN_FCN (icode) (op0, op1);
|
4030 |
|
|
if (!pat)
|
4031 |
|
|
return 0;
|
4032 |
|
|
emit_insn (pat);
|
4033 |
|
|
|
4034 |
|
|
return NULL_RTX;
|
4035 |
|
|
|
4036 |
|
|
}
|
4037 |
|
|
|
4038 |
|
|
/* Expand an array get into the corresponding RTL. */
|
4039 |
|
|
static rtx
|
4040 |
|
|
picochip_expand_array_get (tree call, rtx target)
|
4041 |
|
|
{
|
4042 |
|
|
tree arg0, arg1, arg2;
|
4043 |
|
|
rtx op0, op1, op2, pat;
|
4044 |
|
|
|
4045 |
|
|
/* Grab the function's arguments. */
|
4046 |
|
|
arg0 = CALL_EXPR_ARG (call, 0);
|
4047 |
|
|
arg1 = CALL_EXPR_ARG (call, 1);
|
4048 |
|
|
arg2 = CALL_EXPR_ARG (call, 2) ;
|
4049 |
|
|
|
4050 |
|
|
/* Emit rtl sequences for the function arguments. */
|
4051 |
|
|
op0 = expand_expr (arg0, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4052 |
|
|
op1 = expand_expr (arg1, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4053 |
|
|
op2 = expand_expr (arg2, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4054 |
|
|
|
4055 |
|
|
/* The second and third operands must be constant. Nothing else will
|
4056 |
|
|
do. */
|
4057 |
|
|
if (CONST_INT != GET_CODE (op1))
|
4058 |
|
|
internal_error ("%s: Second source operand is not a constant",
|
4059 |
|
|
__FUNCTION__);
|
4060 |
|
|
if (CONST_INT != GET_CODE (op2))
|
4061 |
|
|
internal_error ("%s: Third source operand is not a constant",
|
4062 |
|
|
__FUNCTION__);
|
4063 |
|
|
|
4064 |
|
|
/* If no target has been given, create a register to use as the target. */
|
4065 |
|
|
if (target == 0 || GET_MODE (target) != SImode)
|
4066 |
|
|
target = gen_reg_rtx (SImode);
|
4067 |
|
|
|
4068 |
|
|
/* The first operand must be a HImode register or a constant. If it
|
4069 |
|
|
isn't, force it into a HImode register. */
|
4070 |
|
|
if (GET_MODE (op0) != HImode || REG != GET_CODE (op0))
|
4071 |
|
|
op0 = copy_to_mode_reg (HImode, op0);
|
4072 |
|
|
|
4073 |
|
|
|
4074 |
|
|
/* Emit and return the new instruction. */
|
4075 |
|
|
pat = gen_commsArrayGet (target, op0, op1, op2);
|
4076 |
|
|
emit_insn (pat);
|
4077 |
|
|
|
4078 |
|
|
return target;
|
4079 |
|
|
|
4080 |
|
|
}
|
4081 |
|
|
|
4082 |
|
|
/* Expand an array put into the corresponding RTL. */
|
4083 |
|
|
static rtx
|
4084 |
|
|
picochip_expand_array_put (tree call, rtx target)
|
4085 |
|
|
{
|
4086 |
|
|
tree arg0, arg1, arg2, arg3;
|
4087 |
|
|
rtx op0, op1, op2, op3, pat;
|
4088 |
|
|
|
4089 |
|
|
/* Grab the function's arguments. */
|
4090 |
|
|
arg0 = CALL_EXPR_ARG (call, 0);
|
4091 |
|
|
arg1 = CALL_EXPR_ARG (call, 1);
|
4092 |
|
|
arg2 = CALL_EXPR_ARG (call, 2);
|
4093 |
|
|
arg3 = CALL_EXPR_ARG (call, 3);
|
4094 |
|
|
|
4095 |
|
|
/* Emit rtl sequences for the function arguments. */
|
4096 |
|
|
op0 = expand_expr (arg0, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4097 |
|
|
op1 = expand_expr (arg1, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4098 |
|
|
op2 = expand_expr (arg2, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4099 |
|
|
op3 = expand_expr (arg3, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4100 |
|
|
|
4101 |
|
|
/* The first operand must be an SImode register. */
|
4102 |
|
|
if (GET_MODE (op0) != SImode || REG != GET_CODE (op0))
|
4103 |
|
|
op0 = copy_to_mode_reg (SImode, op0);
|
4104 |
|
|
|
4105 |
|
|
/* The second (index) operand must be a HImode register, or a
|
4106 |
|
|
constant. If it isn't, force it into a HImode register. */
|
4107 |
|
|
if (GET_MODE (op1) != HImode || REG != GET_CODE (op1))
|
4108 |
|
|
op1 = copy_to_mode_reg (HImode, op1);
|
4109 |
|
|
|
4110 |
|
|
/* The remaining operands must be constant. Nothing else will do. */
|
4111 |
|
|
if (CONST_INT != GET_CODE (op2))
|
4112 |
|
|
internal_error ("%s: Third source operand is not a constant",
|
4113 |
|
|
__FUNCTION__);
|
4114 |
|
|
if (CONST_INT != GET_CODE (op3))
|
4115 |
|
|
internal_error ("%s: Fourth source operand is not a constant",
|
4116 |
|
|
__FUNCTION__);
|
4117 |
|
|
|
4118 |
|
|
/* Emit and return the new instruction. */
|
4119 |
|
|
pat = gen_commsArrayPut (op0, op1, op2, op3);
|
4120 |
|
|
emit_insn (pat);
|
4121 |
|
|
|
4122 |
|
|
return target;
|
4123 |
|
|
|
4124 |
|
|
}
|
4125 |
|
|
|
4126 |
|
|
/* Expand an array testport into the corresponding RTL. */
|
4127 |
|
|
static rtx
|
4128 |
|
|
picochip_expand_array_testport (tree call, rtx target)
|
4129 |
|
|
{
|
4130 |
|
|
tree arg0, arg1, arg2;
|
4131 |
|
|
rtx op0, op1, op2, pat;
|
4132 |
|
|
|
4133 |
|
|
/* Grab the function's arguments. */
|
4134 |
|
|
arg0 = CALL_EXPR_ARG (call, 0);
|
4135 |
|
|
arg1 = CALL_EXPR_ARG (call, 1);
|
4136 |
|
|
arg2 = CALL_EXPR_ARG (call, 2);
|
4137 |
|
|
|
4138 |
|
|
/* Emit rtl sequences for the function arguments. */
|
4139 |
|
|
op0 = expand_expr (arg0, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4140 |
|
|
op1 = expand_expr (arg1, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4141 |
|
|
op2 = expand_expr (arg2, NULL_RTX, VOIDmode, EXPAND_NORMAL);
|
4142 |
|
|
|
4143 |
|
|
/* The first operand must be a HImode register, or a constant. If it
|
4144 |
|
|
isn't, force it into a HImode register. */
|
4145 |
|
|
if (GET_MODE (op0) != HImode || REG != GET_CODE (op0))
|
4146 |
|
|
op0 = copy_to_mode_reg (HImode, op0);
|
4147 |
|
|
|
4148 |
|
|
/* The second and third operands must be constant. Nothing else will
|
4149 |
|
|
do. */
|
4150 |
|
|
if (CONST_INT != GET_CODE (op1))
|
4151 |
|
|
internal_error ("%s: Second source operand is not a constant",
|
4152 |
|
|
__FUNCTION__);
|
4153 |
|
|
if (CONST_INT != GET_CODE (op2))
|
4154 |
|
|
internal_error ("%s: Third source operand is not a constant",
|
4155 |
|
|
__FUNCTION__);
|
4156 |
|
|
|
4157 |
|
|
/* If no target has been given, create a HImode register to use as
|
4158 |
|
|
the target. */
|
4159 |
|
|
if (target == 0 || GET_MODE (target) != HImode)
|
4160 |
|
|
target = gen_reg_rtx (HImode);
|
4161 |
|
|
|
4162 |
|
|
/* Emit and return the new instruction. */
|
4163 |
|
|
pat = gen_commsArrayTestPort (target, op0, op1, op2);
|
4164 |
|
|
emit_insn (pat);
|
4165 |
|
|
|
4166 |
|
|
return target;
|
4167 |
|
|
|
4168 |
|
|
}
|
4169 |
|
|
|
4170 |
|
|
/* Generate a unique HALT instruction by giving the instruction a
|
4171 |
|
|
unique integer. This integer makes no difference to the assembly
|
4172 |
|
|
output (other than a comment indicating the supplied id), but the
|
4173 |
|
|
presence of the unique integer prevents the compiler from combining
|
4174 |
|
|
several different halt instructions into one instruction. This
|
4175 |
|
|
means that each use of the halt instruction is unique, which in
|
4176 |
|
|
turn means that assertions work as expected. */
|
4177 |
|
|
static rtx
|
4178 |
|
|
picochip_generate_halt (void)
|
4179 |
|
|
{
|
4180 |
|
|
static int currentId = 0;
|
4181 |
|
|
rtx insns;
|
4182 |
|
|
rtx id = GEN_INT (currentId);
|
4183 |
|
|
currentId += 1;
|
4184 |
|
|
|
4185 |
|
|
start_sequence();
|
4186 |
|
|
emit_insn (gen_halt (id));
|
4187 |
|
|
|
4188 |
|
|
/* A barrier is inserted to prevent the compiler from thinking that
|
4189 |
|
|
it has to continue execution after the HALT.*/
|
4190 |
|
|
emit_barrier ();
|
4191 |
|
|
|
4192 |
|
|
insns = get_insns();
|
4193 |
|
|
end_sequence();
|
4194 |
|
|
emit_insn (insns);
|
4195 |
|
|
|
4196 |
|
|
return const0_rtx;
|
4197 |
|
|
}
|
4198 |
|
|
|
4199 |
|
|
/* Initialise the builtin functions. Start by initialising
|
4200 |
|
|
descriptions of different types of functions (e.g., void fn(int),
|
4201 |
|
|
int fn(void)), and then use these to define the builtins. */
|
4202 |
|
|
void
|
4203 |
|
|
picochip_init_builtins (void)
|
4204 |
|
|
{
|
4205 |
|
|
tree noreturn;
|
4206 |
|
|
|
4207 |
|
|
tree int_ftype_int, int_ftype_int_int;
|
4208 |
|
|
tree long_ftype_int, long_ftype_int_int_int;
|
4209 |
|
|
tree void_ftype_int_long, int_ftype_int_int_int,
|
4210 |
|
|
void_ftype_long_int_int_int;
|
4211 |
|
|
tree void_ftype_void, unsigned_ftype_unsigned;
|
4212 |
|
|
|
4213 |
|
|
/* void func (void) */
|
4214 |
|
|
void_ftype_void = build_function_type_list (void_type_node, NULL_TREE);
|
4215 |
|
|
|
4216 |
|
|
/* int func (int) */
|
4217 |
|
|
int_ftype_int = build_function_type_list (integer_type_node,
|
4218 |
|
|
integer_type_node, NULL_TREE);
|
4219 |
|
|
|
4220 |
|
|
/* unsigned int func (unsigned int) */
|
4221 |
|
|
unsigned_ftype_unsigned
|
4222 |
|
|
= build_function_type_list (unsigned_type_node,
|
4223 |
|
|
unsigned_type_node, NULL_TREE);
|
4224 |
|
|
|
4225 |
|
|
/* int func(int, int) */
|
4226 |
|
|
int_ftype_int_int
|
4227 |
|
|
= build_function_type_list (integer_type_node,
|
4228 |
|
|
integer_type_node, integer_type_node,
|
4229 |
|
|
NULL_TREE);
|
4230 |
|
|
|
4231 |
|
|
/* long func(int) */
|
4232 |
|
|
long_ftype_int = build_function_type_list (long_integer_type_node,
|
4233 |
|
|
integer_type_node, NULL_TREE);
|
4234 |
|
|
|
4235 |
|
|
/* long func(int, int, int) */
|
4236 |
|
|
long_ftype_int_int_int
|
4237 |
|
|
= build_function_type_list (long_integer_type_node,
|
4238 |
|
|
integer_type_node, integer_type_node,
|
4239 |
|
|
integer_type_node, NULL_TREE);
|
4240 |
|
|
|
4241 |
|
|
/* int func(int, int, int) */
|
4242 |
|
|
int_ftype_int_int_int
|
4243 |
|
|
= build_function_type_list (integer_type_node,
|
4244 |
|
|
integer_type_node, integer_type_node,
|
4245 |
|
|
integer_type_node, NULL_TREE);
|
4246 |
|
|
|
4247 |
|
|
/* void func(int, long) */
|
4248 |
|
|
void_ftype_int_long
|
4249 |
|
|
= build_function_type_list (void_type_node,
|
4250 |
|
|
integer_type_node, long_integer_type_node,
|
4251 |
|
|
NULL_TREE);
|
4252 |
|
|
|
4253 |
|
|
/* void func(long, int, int, int) */
|
4254 |
|
|
void_ftype_long_int_int_int
|
4255 |
|
|
= build_function_type_list (void_type_node,
|
4256 |
|
|
long_integer_type_node, integer_type_node,
|
4257 |
|
|
integer_type_node, integer_type_node,
|
4258 |
|
|
NULL_TREE);
|
4259 |
|
|
|
4260 |
|
|
/* Initialise the sign-bit-count function. */
|
4261 |
|
|
add_builtin_function ("__builtin_sbc", int_ftype_int,
|
4262 |
|
|
PICOCHIP_BUILTIN_SBC, BUILT_IN_MD, NULL,
|
4263 |
|
|
NULL_TREE);
|
4264 |
|
|
add_builtin_function ("picoSbc", int_ftype_int, PICOCHIP_BUILTIN_SBC,
|
4265 |
|
|
BUILT_IN_MD, NULL, NULL_TREE);
|
4266 |
|
|
|
4267 |
|
|
/* Initialise the bit reverse function. */
|
4268 |
|
|
add_builtin_function ("__builtin_brev", unsigned_ftype_unsigned,
|
4269 |
|
|
PICOCHIP_BUILTIN_BREV, BUILT_IN_MD, NULL,
|
4270 |
|
|
NULL_TREE);
|
4271 |
|
|
add_builtin_function ("picoBrev", unsigned_ftype_unsigned,
|
4272 |
|
|
PICOCHIP_BUILTIN_BREV, BUILT_IN_MD, NULL,
|
4273 |
|
|
NULL_TREE);
|
4274 |
|
|
|
4275 |
|
|
/* Initialise the byte swap function. */
|
4276 |
|
|
add_builtin_function ("__builtin_byteswap", unsigned_ftype_unsigned,
|
4277 |
|
|
PICOCHIP_BUILTIN_BYTESWAP, BUILT_IN_MD, NULL,
|
4278 |
|
|
NULL_TREE);
|
4279 |
|
|
add_builtin_function ("picoByteSwap", unsigned_ftype_unsigned,
|
4280 |
|
|
PICOCHIP_BUILTIN_BYTESWAP, BUILT_IN_MD, NULL,
|
4281 |
|
|
NULL_TREE);
|
4282 |
|
|
|
4283 |
|
|
/* Initialise the ASRI function (note that while this can be coded
|
4284 |
|
|
using a signed shift in C, extra scratch registers are required,
|
4285 |
|
|
which we avoid by having a direct builtin to map to the
|
4286 |
|
|
instruction). */
|
4287 |
|
|
add_builtin_function ("__builtin_asri", int_ftype_int_int,
|
4288 |
|
|
PICOCHIP_BUILTIN_ASRI, BUILT_IN_MD, NULL,
|
4289 |
|
|
NULL_TREE);
|
4290 |
|
|
|
4291 |
|
|
/* Initialise saturating addition. */
|
4292 |
|
|
add_builtin_function ("__builtin_adds", int_ftype_int_int,
|
4293 |
|
|
PICOCHIP_BUILTIN_ADDS, BUILT_IN_MD, NULL,
|
4294 |
|
|
NULL_TREE);
|
4295 |
|
|
add_builtin_function ("picoAdds", int_ftype_int_int,
|
4296 |
|
|
PICOCHIP_BUILTIN_ADDS, BUILT_IN_MD, NULL,
|
4297 |
|
|
NULL_TREE);
|
4298 |
|
|
|
4299 |
|
|
/* Initialise saturating subtraction. */
|
4300 |
|
|
add_builtin_function ("__builtin_subs", int_ftype_int_int,
|
4301 |
|
|
PICOCHIP_BUILTIN_SUBS, BUILT_IN_MD, NULL,
|
4302 |
|
|
NULL_TREE);
|
4303 |
|
|
add_builtin_function ("picoSubs", int_ftype_int_int,
|
4304 |
|
|
PICOCHIP_BUILTIN_SUBS, BUILT_IN_MD, NULL,
|
4305 |
|
|
NULL_TREE);
|
4306 |
|
|
|
4307 |
|
|
/* Scalar comms builtins. */
|
4308 |
|
|
add_builtin_function ("__builtin_get", long_ftype_int,
|
4309 |
|
|
PICOCHIP_BUILTIN_GET, BUILT_IN_MD, NULL,
|
4310 |
|
|
NULL_TREE);
|
4311 |
|
|
add_builtin_function ("__builtin_put", void_ftype_int_long,
|
4312 |
|
|
PICOCHIP_BUILTIN_PUT, BUILT_IN_MD, NULL,
|
4313 |
|
|
NULL_TREE);
|
4314 |
|
|
add_builtin_function ("__builtin_testport", int_ftype_int,
|
4315 |
|
|
PICOCHIP_BUILTIN_TESTPORT, BUILT_IN_MD, NULL,
|
4316 |
|
|
NULL_TREE);
|
4317 |
|
|
|
4318 |
|
|
/* Array comms builtins. */
|
4319 |
|
|
add_builtin_function ("__builtin_put_array",
|
4320 |
|
|
void_ftype_long_int_int_int,
|
4321 |
|
|
PICOCHIP_BUILTIN_PUT_ARRAY, BUILT_IN_MD, NULL,
|
4322 |
|
|
NULL_TREE);
|
4323 |
|
|
add_builtin_function ("__builtin_get_array", long_ftype_int_int_int,
|
4324 |
|
|
PICOCHIP_BUILTIN_GET_ARRAY, BUILT_IN_MD, NULL,
|
4325 |
|
|
NULL_TREE);
|
4326 |
|
|
add_builtin_function ("__builtin_testport_array",
|
4327 |
|
|
int_ftype_int_int_int,
|
4328 |
|
|
PICOCHIP_BUILTIN_TESTPORT_ARRAY, BUILT_IN_MD,
|
4329 |
|
|
NULL, NULL_TREE);
|
4330 |
|
|
|
4331 |
|
|
/* Halt instruction. Note that the builtin function is marked as
|
4332 |
|
|
having the attribute `noreturn' so that the compiler realises
|
4333 |
|
|
that the halt stops the program dead. */
|
4334 |
|
|
noreturn = tree_cons (get_identifier ("noreturn"), NULL, NULL);
|
4335 |
|
|
add_builtin_function ("__builtin_halt", void_ftype_void,
|
4336 |
|
|
PICOCHIP_BUILTIN_HALT, BUILT_IN_MD, NULL,
|
4337 |
|
|
noreturn);
|
4338 |
|
|
add_builtin_function ("picoHalt", void_ftype_void,
|
4339 |
|
|
PICOCHIP_BUILTIN_HALT, BUILT_IN_MD, NULL,
|
4340 |
|
|
noreturn);
|
4341 |
|
|
|
4342 |
|
|
}
|
4343 |
|
|
|
4344 |
|
|
/* Expand a call to a builtin function. */
|
4345 |
|
|
rtx
|
4346 |
|
|
picochip_expand_builtin (tree exp, rtx target, rtx subtarget ATTRIBUTE_UNUSED,
|
4347 |
|
|
enum machine_mode mode ATTRIBUTE_UNUSED,
|
4348 |
|
|
int ignore ATTRIBUTE_UNUSED)
|
4349 |
|
|
{
|
4350 |
|
|
tree fndecl = TREE_OPERAND (CALL_EXPR_FN (exp), 0);
|
4351 |
|
|
int fcode = DECL_FUNCTION_CODE (fndecl);
|
4352 |
|
|
|
4353 |
|
|
switch (fcode)
|
4354 |
|
|
{
|
4355 |
|
|
case PICOCHIP_BUILTIN_ASRI:
|
4356 |
|
|
return picochip_expand_builtin_3op (CODE_FOR_builtin_asri, exp,
|
4357 |
|
|
target);
|
4358 |
|
|
|
4359 |
|
|
case PICOCHIP_BUILTIN_ADDS:
|
4360 |
|
|
return picochip_expand_builtin_3op (CODE_FOR_sataddhi3, exp,
|
4361 |
|
|
target);
|
4362 |
|
|
|
4363 |
|
|
case PICOCHIP_BUILTIN_SUBS:
|
4364 |
|
|
return picochip_expand_builtin_3op (CODE_FOR_satsubhi3, exp,
|
4365 |
|
|
target);
|
4366 |
|
|
|
4367 |
|
|
case PICOCHIP_BUILTIN_SBC:
|
4368 |
|
|
return picochip_expand_builtin_2op (CODE_FOR_sbc, exp, target);
|
4369 |
|
|
|
4370 |
|
|
case PICOCHIP_BUILTIN_BREV:
|
4371 |
|
|
return picochip_expand_builtin_2op (CODE_FOR_brev, exp, target);
|
4372 |
|
|
|
4373 |
|
|
case PICOCHIP_BUILTIN_BYTESWAP:
|
4374 |
|
|
return picochip_expand_builtin_2op (CODE_FOR_bswaphi2, exp, target);
|
4375 |
|
|
|
4376 |
|
|
case PICOCHIP_BUILTIN_GET:
|
4377 |
|
|
return picochip_expand_builtin_2op (CODE_FOR_commsGet, exp, target);
|
4378 |
|
|
|
4379 |
|
|
case PICOCHIP_BUILTIN_PUT:
|
4380 |
|
|
return picochip_expand_builtin_2opvoid (CODE_FOR_commsPut, exp);
|
4381 |
|
|
|
4382 |
|
|
case PICOCHIP_BUILTIN_TESTPORT:
|
4383 |
|
|
return picochip_expand_builtin_2op (CODE_FOR_commsTestPort, exp,
|
4384 |
|
|
target);
|
4385 |
|
|
|
4386 |
|
|
case PICOCHIP_BUILTIN_PUT_ARRAY:
|
4387 |
|
|
return picochip_expand_array_put (exp, target);
|
4388 |
|
|
|
4389 |
|
|
case PICOCHIP_BUILTIN_GET_ARRAY:
|
4390 |
|
|
return picochip_expand_array_get (exp, target);
|
4391 |
|
|
|
4392 |
|
|
case PICOCHIP_BUILTIN_TESTPORT_ARRAY:
|
4393 |
|
|
return picochip_expand_array_testport (exp, target);
|
4394 |
|
|
|
4395 |
|
|
case PICOCHIP_BUILTIN_HALT:
|
4396 |
|
|
return picochip_generate_halt ();
|
4397 |
|
|
|
4398 |
|
|
default:
|
4399 |
|
|
gcc_unreachable();
|
4400 |
|
|
|
4401 |
|
|
}
|
4402 |
|
|
|
4403 |
|
|
/* Should really do something sensible here. */
|
4404 |
|
|
return NULL_RTX;
|
4405 |
|
|
}
|
4406 |
|
|
|
4407 |
|
|
/* Emit warnings. */
|
4408 |
|
|
static void
|
4409 |
|
|
picochip_warn_inefficient (const char *msg)
|
4410 |
|
|
{
|
4411 |
|
|
if (TARGET_INEFFICIENT_WARNINGS)
|
4412 |
|
|
warning (OPT_minefficient_warnings,
|
4413 |
|
|
"%s (disable warning using -mno-inefficient-warnings)", msg);
|
4414 |
|
|
}
|
4415 |
|
|
|
4416 |
|
|
void
|
4417 |
|
|
warn_of_byte_access (void)
|
4418 |
|
|
{
|
4419 |
|
|
static int warned = 0;
|
4420 |
|
|
|
4421 |
|
|
if (!warned)
|
4422 |
|
|
{
|
4423 |
|
|
picochip_warn_inefficient
|
4424 |
|
|
("byte access is synthesised - consider using MUL AE");
|
4425 |
|
|
warned = 1;
|
4426 |
|
|
}
|
4427 |
|
|
|
4428 |
|
|
}
|
4429 |
|
|
|
4430 |
|
|
rtx
|
4431 |
|
|
picochip_function_value (const_tree valtype, const_tree func,
|
4432 |
|
|
bool outgoing ATTRIBUTE_UNUSED)
|
4433 |
|
|
{
|
4434 |
|
|
enum machine_mode mode = TYPE_MODE (valtype);
|
4435 |
|
|
int unsignedp = TYPE_UNSIGNED (valtype);
|
4436 |
|
|
|
4437 |
|
|
/* Since we define PROMOTE_FUNCTION_RETURN, we must promote the mode
|
4438 |
|
|
just as PROMOTE_MODE does. */
|
4439 |
|
|
mode = promote_function_mode (valtype, mode, &unsignedp, func, 1);
|
4440 |
|
|
|
4441 |
|
|
return gen_rtx_REG (mode, 0);
|
4442 |
|
|
|
4443 |
|
|
}
|
4444 |
|
|
|
4445 |
|
|
/* Check that the value of the given mode will fit in the register of
|
4446 |
|
|
the given mode. */
|
4447 |
|
|
int
|
4448 |
|
|
picochip_hard_regno_mode_ok (int regno, enum machine_mode mode)
|
4449 |
|
|
{
|
4450 |
|
|
|
4451 |
|
|
if (GET_MODE_CLASS (mode) == MODE_CC)
|
4452 |
|
|
return regno == CC_REGNUM;
|
4453 |
|
|
|
4454 |
|
|
/* If the CC register is being used, then only CC mode values are
|
4455 |
|
|
allowed (which have already been tested). */
|
4456 |
|
|
if (regno == CC_REGNUM || regno == ACC_REGNUM)
|
4457 |
|
|
return 0;
|
4458 |
|
|
|
4459 |
|
|
/* Must be a valid register. */
|
4460 |
|
|
if (regno > 16)
|
4461 |
|
|
return 0;
|
4462 |
|
|
|
4463 |
|
|
/* Modes QI and HI may be placed in any register except the CC. */
|
4464 |
|
|
if (mode == QImode || mode == HImode)
|
4465 |
|
|
return 1;
|
4466 |
|
|
|
4467 |
|
|
/* DI must be in a quad register. */
|
4468 |
|
|
if (mode == DImode)
|
4469 |
|
|
return (regno % 4 == 0);
|
4470 |
|
|
|
4471 |
|
|
/* All other modes must be placed in a even numbered register. */
|
4472 |
|
|
return !(regno & 1);
|
4473 |
|
|
|
4474 |
|
|
}
|
4475 |
|
|
|
4476 |
|
|
/* Extract the lower and upper components of a constant value. */
|
4477 |
|
|
|
4478 |
|
|
rtx
|
4479 |
|
|
picochip_get_low_const (rtx value)
|
4480 |
|
|
{
|
4481 |
|
|
return gen_int_mode (INTVAL (value) & 0xFFFF, HImode);
|
4482 |
|
|
}
|
4483 |
|
|
|
4484 |
|
|
rtx
|
4485 |
|
|
picochip_get_high_const (rtx value)
|
4486 |
|
|
{
|
4487 |
|
|
/*return GEN_INT ((((INTVAL (value) >> 16) & 0xFFFF) ^ 0x8000) - 0x8000); */
|
4488 |
|
|
return gen_int_mode ((INTVAL (value) >> 16) & 0xFFFF, HImode);
|
4489 |
|
|
}
|
4490 |
|
|
|
4491 |
|
|
|
4492 |
|
|
/* Loading and storing QImode values to and from memory in a machine
|
4493 |
|
|
without byte access requires might require a scratch
|
4494 |
|
|
register. However, the scratch register might correspond to the
|
4495 |
|
|
register in which the value is being loaded. To ensure that a
|
4496 |
|
|
scratch register is supplied which is definitely different to the
|
4497 |
|
|
output register, request a register pair. This effectively gives a
|
4498 |
|
|
choice of two registers to choose from, so that we a guaranteed to
|
4499 |
|
|
get at least one register which is different to the output
|
4500 |
|
|
register. This trick is taken from the alpha implementation. */
|
4501 |
|
|
static reg_class_t
|
4502 |
|
|
picochip_secondary_reload (bool in_p,
|
4503 |
|
|
rtx x ATTRIBUTE_UNUSED,
|
4504 |
|
|
reg_class_t cla ATTRIBUTE_UNUSED,
|
4505 |
|
|
enum machine_mode mode,
|
4506 |
|
|
secondary_reload_info *sri)
|
4507 |
|
|
{
|
4508 |
|
|
if (mode == QImode && !TARGET_HAS_BYTE_ACCESS)
|
4509 |
|
|
{
|
4510 |
|
|
if (in_p == 0)
|
4511 |
|
|
sri->icode = CODE_FOR_reload_outqi;
|
4512 |
|
|
else
|
4513 |
|
|
sri->icode = CODE_FOR_reload_inqi;
|
4514 |
|
|
}
|
4515 |
|
|
|
4516 |
|
|
/* We dont need to return a register class type when we need only a
|
4517 |
|
|
scratch register. It realizes the scratch register type by looking
|
4518 |
|
|
at the instruction definition for sri->icode. We only need to
|
4519 |
|
|
return the register type when we need intermediaries for copies.*/
|
4520 |
|
|
return NO_REGS;
|
4521 |
|
|
}
|
4522 |
|
|
|
4523 |
|
|
/* Return true if the given memory operand can be aligned to a
|
4524 |
|
|
word+offset memory reference (e.g., FP+3 can be converted into the
|
4525 |
|
|
memory operand FP+2, with the offset 1). */
|
4526 |
|
|
int
|
4527 |
|
|
picochip_alignable_memory_operand (rtx mem_operand,
|
4528 |
|
|
enum machine_mode mode ATTRIBUTE_UNUSED)
|
4529 |
|
|
{
|
4530 |
|
|
rtx address;
|
4531 |
|
|
|
4532 |
|
|
/* Not a mem operand. Refuse immediately. */
|
4533 |
|
|
if (MEM != GET_CODE (mem_operand))
|
4534 |
|
|
return 0;
|
4535 |
|
|
|
4536 |
|
|
address = XEXP (mem_operand, 0);
|
4537 |
|
|
|
4538 |
|
|
/* Return true if a PLUS of the SP and a (valid) constant, or SP itself. */
|
4539 |
|
|
return ((PLUS == GET_CODE (address) &&
|
4540 |
|
|
REGNO (XEXP (address, 0)) == STACK_POINTER_REGNUM &&
|
4541 |
|
|
CONST_INT == GET_CODE (XEXP (address, 1)) &&
|
4542 |
|
|
picochip_const_ok_for_letter_p (INTVAL (XEXP (address, 1)), 'K'))
|
4543 |
|
|
|| (REG == GET_CODE (address)
|
4544 |
|
|
&& REGNO (address) == STACK_POINTER_REGNUM));
|
4545 |
|
|
|
4546 |
|
|
}
|
4547 |
|
|
|
4548 |
|
|
/* Return true if the given memory reference is to a word aligned
|
4549 |
|
|
address. Currently this means it must be either SP, or
|
4550 |
|
|
SP+offset. We could replace this function with alignable
|
4551 |
|
|
memory references in the above function?. */
|
4552 |
|
|
int
|
4553 |
|
|
picochip_word_aligned_memory_reference (rtx operand)
|
4554 |
|
|
{
|
4555 |
|
|
|
4556 |
|
|
|
4557 |
|
|
/* The address must be the SP register, or a constant, aligned
|
4558 |
|
|
offset from SP which doesn't exceed the FP+offset
|
4559 |
|
|
restrictions. */
|
4560 |
|
|
return ((PLUS == GET_CODE (operand)
|
4561 |
|
|
&& REGNO (XEXP (operand, 0)) == STACK_POINTER_REGNUM
|
4562 |
|
|
&& picochip_is_aligned (INTVAL (XEXP (operand, 1)), 16)
|
4563 |
|
|
&& picochip_const_ok_for_letter_p (INTVAL (XEXP (operand, 1)),
|
4564 |
|
|
'K'))
|
4565 |
|
|
|| (REG == GET_CODE (operand)
|
4566 |
|
|
&& REGNO (operand) == STACK_POINTER_REGNUM));
|
4567 |
|
|
|
4568 |
|
|
}
|
4569 |
|
|
|
4570 |
|
|
/* Given an alignable memory location, convert the memory location
|
4571 |
|
|
into a HI mode access, storing the new memory reference in
|
4572 |
|
|
paligned_mem, and the number of bits by which to shift in pbitnum
|
4573 |
|
|
(i.e., given a reference to FP+3, this creates an aligned reference
|
4574 |
|
|
of FP+2, with an 8-bit shift). This code is a modification of that
|
4575 |
|
|
found in the Alpha port. */
|
4576 |
|
|
void
|
4577 |
|
|
picochip_get_hi_aligned_mem (rtx ref, rtx * paligned_mem, rtx * pbitnum)
|
4578 |
|
|
{
|
4579 |
|
|
rtx base;
|
4580 |
|
|
HOST_WIDE_INT offset = 0;
|
4581 |
|
|
|
4582 |
|
|
gcc_assert (GET_CODE (ref) == MEM);
|
4583 |
|
|
|
4584 |
|
|
if (reload_in_progress && !memory_address_p (GET_MODE (ref), XEXP (ref, 0)))
|
4585 |
|
|
{
|
4586 |
|
|
base = find_replacement (&XEXP (ref, 0));
|
4587 |
|
|
|
4588 |
|
|
gcc_assert(memory_address_p (GET_MODE (ref), base));
|
4589 |
|
|
}
|
4590 |
|
|
else
|
4591 |
|
|
{
|
4592 |
|
|
base = XEXP (ref, 0);
|
4593 |
|
|
}
|
4594 |
|
|
|
4595 |
|
|
if (GET_CODE (base) == PLUS)
|
4596 |
|
|
{
|
4597 |
|
|
offset += INTVAL (XEXP (base, 1));
|
4598 |
|
|
base = XEXP (base, 0);
|
4599 |
|
|
}
|
4600 |
|
|
|
4601 |
|
|
*paligned_mem = widen_memory_access (ref, HImode, (offset & ~1) - offset);
|
4602 |
|
|
|
4603 |
|
|
if (offset > 0)
|
4604 |
|
|
{
|
4605 |
|
|
if (TARGET_DEBUG)
|
4606 |
|
|
{
|
4607 |
|
|
printf
|
4608 |
|
|
("Found non-zero offset in get_hi_aligned_mem - check that the correct value is being used (as this functionality hasn't been exploited yet).\n");
|
4609 |
|
|
}
|
4610 |
|
|
}
|
4611 |
|
|
|
4612 |
|
|
*pbitnum = GEN_INT ((offset & 1) * 8);
|
4613 |
|
|
|
4614 |
|
|
}
|
4615 |
|
|
|
4616 |
|
|
/* Return true if the given operand is an absolute address in memory
|
4617 |
|
|
(i.e., a symbolic offset). */
|
4618 |
|
|
int
|
4619 |
|
|
picochip_absolute_memory_operand (rtx op,
|
4620 |
|
|
enum machine_mode mode ATTRIBUTE_UNUSED)
|
4621 |
|
|
{
|
4622 |
|
|
|
4623 |
|
|
if (MEM == GET_CODE (op))
|
4624 |
|
|
{
|
4625 |
|
|
rtx address = XEXP (op, 0);
|
4626 |
|
|
|
4627 |
|
|
/* Symbols are valid absolute addresses. */
|
4628 |
|
|
if (SYMBOL_REF == GET_CODE (address))
|
4629 |
|
|
return 1;
|
4630 |
|
|
|
4631 |
|
|
/* Constant offsets to symbols are valid absolute addresses. */
|
4632 |
|
|
if (CONST == GET_CODE (address) &&
|
4633 |
|
|
PLUS == GET_CODE (XEXP (address, 0)) &&
|
4634 |
|
|
SYMBOL_REF == GET_CODE (XEXP (XEXP (address, 0), 0)) &&
|
4635 |
|
|
CONST_INT == GET_CODE (XEXP (XEXP (address, 0), 1)))
|
4636 |
|
|
return 1;
|
4637 |
|
|
|
4638 |
|
|
}
|
4639 |
|
|
else
|
4640 |
|
|
return 0;
|
4641 |
|
|
|
4642 |
|
|
/* Symbols are valid absolute addresses. */
|
4643 |
|
|
if (SYMBOL_REF == GET_CODE (XEXP (op, 0)))
|
4644 |
|
|
return 1;
|
4645 |
|
|
|
4646 |
|
|
|
4647 |
|
|
return 0;
|
4648 |
|
|
|
4649 |
|
|
}
|
4650 |
|
|
|
4651 |
|
|
void
|
4652 |
|
|
picochip_asm_named_section (const char *name,
|
4653 |
|
|
unsigned int flags ATTRIBUTE_UNUSED,
|
4654 |
|
|
tree decl ATTRIBUTE_UNUSED)
|
4655 |
|
|
{
|
4656 |
|
|
fprintf (asm_out_file, ".section %s\n", name);
|
4657 |
|
|
}
|
4658 |
|
|
|
4659 |
|
|
|
4660 |
|
|
/* Check if we can make a conditional copy instruction. This is emitted as an
|
4661 |
|
|
instruction to set the condition register, followed by an instruction which
|
4662 |
|
|
uses the condition registers to perform the conditional move. */
|
4663 |
|
|
int
|
4664 |
|
|
picochip_check_conditional_copy (rtx * operands)
|
4665 |
|
|
{
|
4666 |
|
|
|
4667 |
|
|
rtx branch_op_0 = XEXP (operands[1], 0);
|
4668 |
|
|
rtx branch_op_1 = XEXP (operands[1], 1);
|
4669 |
|
|
|
4670 |
|
|
/* Only HI mode conditional moves are currently allowed. Can we add
|
4671 |
|
|
SI mode moves? */
|
4672 |
|
|
if (GET_CODE (operands[1]) != EQ && GET_CODE (operands[1]) != NE)
|
4673 |
|
|
return 0;
|
4674 |
|
|
|
4675 |
|
|
/* Is the comparison valid? Only allow operands which are registers
|
4676 |
|
|
if they are HImode. SI mode comparisons against 0 could be
|
4677 |
|
|
handled using logical operations (e.g., SIreg != 0 when low ||
|
4678 |
|
|
high). Need to find test cases to provoke this though (fixunssfdi
|
4679 |
|
|
in libgcc does, but is complicated). */
|
4680 |
|
|
if (register_operand(branch_op_0, GET_MODE(branch_op_0)) &&
|
4681 |
|
|
GET_MODE(branch_op_0) != HImode)
|
4682 |
|
|
return 0;
|
4683 |
|
|
if (register_operand(branch_op_1, GET_MODE(branch_op_1)) &&
|
4684 |
|
|
GET_MODE(branch_op_1) != HImode)
|
4685 |
|
|
return 0;
|
4686 |
|
|
|
4687 |
|
|
return 1;
|
4688 |
|
|
|
4689 |
|
|
}
|
4690 |
|
|
|
4691 |
|
|
|
4692 |
|
|
static rtx
|
4693 |
|
|
picochip_static_chain (const_tree ARG_UNUSED (fndecl), bool incoming_p)
|
4694 |
|
|
{
|
4695 |
|
|
rtx addr;
|
4696 |
|
|
if (incoming_p)
|
4697 |
|
|
addr = arg_pointer_rtx;
|
4698 |
|
|
else
|
4699 |
|
|
addr = plus_constant (stack_pointer_rtx, -2 * UNITS_PER_WORD);
|
4700 |
|
|
return gen_frame_mem (Pmode, addr);
|
4701 |
|
|
}
|