URL https://opencores.org/ocsvn/openrisc/openrisc/trunk

Subversion Repositories openrisc

[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [gcc/] [config/] [arm/] [arm926ejs.md] - Blame information for rev 801

Go to most recent revision | Details | Compare with Previous | View Log


;; ARM 926EJ-S Pipeline Description
;; Copyright (C) 2003, 2007 Free Software Foundation, Inc.
;; Written by CodeSourcery, LLC.
;;
;; This file is part of GCC.
;;
;; GCC is free software; you can redistribute it and/or modify it
;; under the terms of the GNU General Public License as published by
;; the Free Software Foundation; either version 3, or (at your option)
;; any later version.
;;
;; GCC is distributed in the hope that it will be useful, but
;; WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
;; General Public License for more details.
;;
;; You should have received a copy of the GNU General Public License
;; along with GCC; see the file COPYING3.  If not see
;; .  */
 
;; These descriptions are based on the information contained in the
;; ARM926EJ-S Technical Reference Manual, Copyright (c) 2002 ARM
;; Limited.
;;
 
;; This automaton provides a pipeline description for the ARM
;; 926EJ-S core.
;;
;; The model given here assumes that the condition for all conditional
;; instructions is "true", i.e., that all of the instructions are
;; actually executed.
 
(define_automaton "arm926ejs")
 
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Pipelines
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 
;; There is a single pipeline
;;
;;   The ALU pipeline has fetch, decode, execute, memory, and
;;   write stages. We only need to model the execute, memory and write
;;   stages.
 
(define_cpu_unit "e,m,w" "arm926ejs")
 
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; ALU Instructions
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 
;; ALU instructions require three cycles to execute, and use the ALU
;; pipeline in each of the three stages.  The results are available
;; after the execute stage stage has finished.
;;
;; If the destination register is the PC, the pipelines are stalled
;; for several cycles.  That case is not modeled here.
 
;; ALU operations with no shifted operand
(define_insn_reservation "9_alu_op" 1
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "alu,alu_shift"))
 "e,m,w")
 
;; ALU operations with a shift-by-register operand
;; These really stall in the decoder, in order to read
;; the shift value in a second cycle. Pretend we take two cycles in
;; the execute stage.
(define_insn_reservation "9_alu_shift_reg_op" 2
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "alu_shift_reg"))
 "e*2,m,w")
 
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Multiplication Instructions
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 
;; Multiplication instructions loop in the execute stage until the
;; instruction has been passed through the multiplier array enough
;; times. Multiply operations occur in both the execute and memory
;; stages of the pipeline
 
(define_insn_reservation "9_mult1" 3
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "insn" "smlalxy,mul,mla"))
 "e*2,m,w")
 
(define_insn_reservation "9_mult2" 4
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "insn" "muls,mlas"))
 "e*3,m,w")
 
(define_insn_reservation "9_mult3" 4
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "insn" "umull,umlal,smull,smlal"))
 "e*3,m,w")
 
(define_insn_reservation "9_mult4" 5
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "insn" "umulls,umlals,smulls,smlals"))
 "e*4,m,w")
 
(define_insn_reservation "9_mult5" 2
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "insn" "smulxy,smlaxy,smlawx"))
 "e,m,w")
 
(define_insn_reservation "9_mult6" 3
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "insn" "smlalxy"))
 "e*2,m,w")
 
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Load/Store Instructions
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 
;; The models for load/store instructions do not accurately describe
;; the difference between operations with a base register writeback
;; (such as "ldm!").  These models assume that all memory references
;; hit in dcache.
 
;; Loads with a shifted offset take 3 cycles, and are (a) probably the
;; most common and (b) the pessimistic assumption will lead to fewer stalls.
(define_insn_reservation "9_load1_op" 3
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "load1,load_byte"))
 "e*2,m,w")
 
(define_insn_reservation "9_store1_op" 0
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "store1"))
 "e,m,w")
 
;; multiple word loads and stores
(define_insn_reservation "9_load2_op" 3
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "load2"))
 "e,m*2,w")
 
(define_insn_reservation "9_load3_op" 4
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "load3"))
 "e,m*3,w")
 
(define_insn_reservation "9_load4_op" 5
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "load4"))
 "e,m*4,w")
 
(define_insn_reservation "9_store2_op" 0
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "store2"))
 "e,m*2,w")
 
(define_insn_reservation "9_store3_op" 0
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "store3"))
 "e,m*3,w")
 
(define_insn_reservation "9_store4_op" 0
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "store4"))
 "e,m*4,w")
 
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Branch and Call Instructions
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
 
;; Branch instructions are difficult to model accurately.  The ARM
;; core can predict most branches.  If the branch is predicted
;; correctly, and predicted early enough, the branch can be completely
;; eliminated from the instruction stream.  Some branches can
;; therefore appear to require zero cycles to execute.  We assume that
;; all branches are predicted correctly, and that the latency is
;; therefore the minimum value.
 
(define_insn_reservation "9_branch_op" 0
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "branch"))
 "nothing")
 
;; The latency for a call is not predictable.  Therefore, we use 32 as
;; roughly equivalent to positive infinity.
 
(define_insn_reservation "9_call_op" 32
 (and (eq_attr "tune" "arm926ejs")
      (eq_attr "type" "call"))
 "nothing")

Line No.	Rev	Author	Line
1	709	jeremybenn	`;; ARM 926EJ-S Pipeline Description`
2			`;; Copyright (C) 2003, 2007 Free Software Foundation, Inc.`
3			`;; Written by CodeSourcery, LLC.`
4			`;;`
5			`;; This file is part of GCC.`
6			`;;`
7			`;; GCC is free software; you can redistribute it and/or modify it`
8			`;; under the terms of the GNU General Public License as published by`
9			`;; the Free Software Foundation; either version 3, or (at your option)`
10			`;; any later version.`
11			`;;`
12			`;; GCC is distributed in the hope that it will be useful, but`
13			`;; WITHOUT ANY WARRANTY; without even the implied warranty of`
14			`;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
15			`;; General Public License for more details.`
16			`;;`
17			`;; You should have received a copy of the GNU General Public License`
18			`;; along with GCC; see the file COPYING3. If not see`
19			`;; . */`
20
21			`;; These descriptions are based on the information contained in the`
22			`;; ARM926EJ-S Technical Reference Manual, Copyright (c) 2002 ARM`
23			`;; Limited.`
24			`;;`
25
26			`;; This automaton provides a pipeline description for the ARM`
27			`;; 926EJ-S core.`
28			`;;`
29			`;; The model given here assumes that the condition for all conditional`
30			`;; instructions is "true", i.e., that all of the instructions are`
31			`;; actually executed.`
32
33			`(define_automaton "arm926ejs")`
34
35			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
36			`;; Pipelines`
37			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
38
39			`;; There is a single pipeline`
40			`;;`
41			`;; The ALU pipeline has fetch, decode, execute, memory, and`
42			`;; write stages. We only need to model the execute, memory and write`
43			`;; stages.`
44
45			`(define_cpu_unit "e,m,w" "arm926ejs")`
46
47			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
48			`;; ALU Instructions`
49			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
50
51			`;; ALU instructions require three cycles to execute, and use the ALU`
52			`;; pipeline in each of the three stages. The results are available`
53			`;; after the execute stage stage has finished.`
54			`;;`
55			`;; If the destination register is the PC, the pipelines are stalled`
56			`;; for several cycles. That case is not modeled here.`
57
58			`;; ALU operations with no shifted operand`
59			`(define_insn_reservation "9_alu_op" 1`
60			`(and (eq_attr "tune" "arm926ejs")`
61			`(eq_attr "type" "alu,alu_shift"))`
62			`"e,m,w")`
63
64			`;; ALU operations with a shift-by-register operand`
65			`;; These really stall in the decoder, in order to read`
66			`;; the shift value in a second cycle. Pretend we take two cycles in`
67			`;; the execute stage.`
68			`(define_insn_reservation "9_alu_shift_reg_op" 2`
69			`(and (eq_attr "tune" "arm926ejs")`
70			`(eq_attr "type" "alu_shift_reg"))`
71			`"e*2,m,w")`
72
73			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
74			`;; Multiplication Instructions`
75			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
76
77			`;; Multiplication instructions loop in the execute stage until the`
78			`;; instruction has been passed through the multiplier array enough`
79			`;; times. Multiply operations occur in both the execute and memory`
80			`;; stages of the pipeline`
81
82			`(define_insn_reservation "9_mult1" 3`
83			`(and (eq_attr "tune" "arm926ejs")`
84			`(eq_attr "insn" "smlalxy,mul,mla"))`
85			`"e*2,m,w")`
86
87			`(define_insn_reservation "9_mult2" 4`
88			`(and (eq_attr "tune" "arm926ejs")`
89			`(eq_attr "insn" "muls,mlas"))`
90			`"e*3,m,w")`
91
92			`(define_insn_reservation "9_mult3" 4`
93			`(and (eq_attr "tune" "arm926ejs")`
94			`(eq_attr "insn" "umull,umlal,smull,smlal"))`
95			`"e*3,m,w")`
96
97			`(define_insn_reservation "9_mult4" 5`
98			`(and (eq_attr "tune" "arm926ejs")`
99			`(eq_attr "insn" "umulls,umlals,smulls,smlals"))`
100			`"e*4,m,w")`
101
102			`(define_insn_reservation "9_mult5" 2`
103			`(and (eq_attr "tune" "arm926ejs")`
104			`(eq_attr "insn" "smulxy,smlaxy,smlawx"))`
105			`"e,m,w")`
106
107			`(define_insn_reservation "9_mult6" 3`
108			`(and (eq_attr "tune" "arm926ejs")`
109			`(eq_attr "insn" "smlalxy"))`
110			`"e*2,m,w")`
111
112			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
113			`;; Load/Store Instructions`
114			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
115
116			`;; The models for load/store instructions do not accurately describe`
117			`;; the difference between operations with a base register writeback`
118			`;; (such as "ldm!"). These models assume that all memory references`
119			`;; hit in dcache.`
120
121			`;; Loads with a shifted offset take 3 cycles, and are (a) probably the`
122			`;; most common and (b) the pessimistic assumption will lead to fewer stalls.`
123			`(define_insn_reservation "9_load1_op" 3`
124			`(and (eq_attr "tune" "arm926ejs")`
125			`(eq_attr "type" "load1,load_byte"))`
126			`"e*2,m,w")`
127
128			`(define_insn_reservation "9_store1_op" 0`
129			`(and (eq_attr "tune" "arm926ejs")`
130			`(eq_attr "type" "store1"))`
131			`"e,m,w")`
132
133			`;; multiple word loads and stores`
134			`(define_insn_reservation "9_load2_op" 3`
135			`(and (eq_attr "tune" "arm926ejs")`
136			`(eq_attr "type" "load2"))`
137			`"e,m*2,w")`
138
139			`(define_insn_reservation "9_load3_op" 4`
140			`(and (eq_attr "tune" "arm926ejs")`
141			`(eq_attr "type" "load3"))`
142			`"e,m*3,w")`
143
144			`(define_insn_reservation "9_load4_op" 5`
145			`(and (eq_attr "tune" "arm926ejs")`
146			`(eq_attr "type" "load4"))`
147			`"e,m*4,w")`
148
149			`(define_insn_reservation "9_store2_op" 0`
150			`(and (eq_attr "tune" "arm926ejs")`
151			`(eq_attr "type" "store2"))`
152			`"e,m*2,w")`
153
154			`(define_insn_reservation "9_store3_op" 0`
155			`(and (eq_attr "tune" "arm926ejs")`
156			`(eq_attr "type" "store3"))`
157			`"e,m*3,w")`
158
159			`(define_insn_reservation "9_store4_op" 0`
160			`(and (eq_attr "tune" "arm926ejs")`
161			`(eq_attr "type" "store4"))`
162			`"e,m*4,w")`
163
164			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
165			`;; Branch and Call Instructions`
166			`;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;`
167
168			`;; Branch instructions are difficult to model accurately. The ARM`
169			`;; core can predict most branches. If the branch is predicted`
170			`;; correctly, and predicted early enough, the branch can be completely`
171			`;; eliminated from the instruction stream. Some branches can`
172			`;; therefore appear to require zero cycles to execute. We assume that`
173			`;; all branches are predicted correctly, and that the latency is`
174			`;; therefore the minimum value.`
175
176			`(define_insn_reservation "9_branch_op" 0`
177			`(and (eq_attr "tune" "arm926ejs")`
178			`(eq_attr "type" "branch"))`
179			`"nothing")`
180
181			`;; The latency for a call is not predictable. Therefore, we use 32 as`
182			`;; roughly equivalent to positive infinity.`
183
184			`(define_insn_reservation "9_call_op" 32`
185			`(and (eq_attr "tune" "arm926ejs")`
186			`(eq_attr "type" "call"))`
187			`"nothing")`

Browse

Tools

Subversion Repositories openrisc

[/] [openrisc/] [trunk/] [gnu-dev/] [or1k-gcc/] [gcc/] [config/] [arm/] [arm926ejs.md] - Blame information for rev 801