OpenCores
URL https://opencores.org/ocsvn/sparc64soc/sparc64soc/trunk

Subversion Repositories sparc64soc

[/] [sparc64soc/] [trunk/] [T1-CPU/] [exu/] [sparc_exu_eclccr.v] - Blame information for rev 4

Go to most recent revision | Details | Compare with Previous | View Log

Line No. Rev Author Line
1 2 dmitryr
// ========== Copyright Header Begin ==========================================
2
// 
3
// OpenSPARC T1 Processor File: sparc_exu_eclccr.v
4
// Copyright (c) 2006 Sun Microsystems, Inc.  All Rights Reserved.
5
// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES.
6
// 
7
// The above named program is free software; you can redistribute it and/or
8
// modify it under the terms of the GNU General Public
9
// License version 2 as published by the Free Software Foundation.
10
// 
11
// The above named program is distributed in the hope that it will be 
12
// useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
13
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
// General Public License for more details.
15
// 
16
// You should have received a copy of the GNU General Public
17
// License along with this work; if not, write to the Free Software
18
// Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA.
19
// 
20
// ========== Copyright Header End ============================================
21
////////////////////////////////////////////////////////////////////////
22
/*
23
//  Module Name: sparc_exu_eclccr
24
//      Description: 4 bit condition code registers with forwarding.  Takes
25
//      the e_stage result and writes on the w stage.
26
*/
27
 
28
module sparc_exu_eclccr (/*AUTOARG*/
29
   // Outputs
30
   exu_ifu_cc_d, exu_tlu_ccr0_w, exu_tlu_ccr1_w, exu_tlu_ccr2_w,
31
   exu_tlu_ccr3_w,
32
   // Inputs
33
   clk, se, alu_xcc_e, alu_icc_e, tid_d, thrdec_d, thr_match_dm,
34
   thr_match_de, tid_w, thr_w, ifu_exu_kill_e, ifu_exu_setcc_d,
35
   byp_ecl_wrccr_data_w, wb_ccr_wrccr_w, wb_ccr_setcc_g,
36
   divcntl_ccr_cc_w2, wb_ccr_thr_g, tlu_exu_cwpccr_update_m,
37
   tlu_exu_ccr_m, ifu_exu_inst_vld_w, ifu_tlu_flush_w, early_flush_w
38
   ) ;
39
   input clk;
40
   input se;
41
   input [3:0] alu_xcc_e;    // condition codes from the alu
42
   input [3:0] alu_icc_e;
43
   input [1:0] tid_d;   // thread for each stage
44
   input [3:0] thrdec_d;   // decoded tid_d for mux select
45
   input       thr_match_dm;
46
   input       thr_match_de;
47
   input [1:0] tid_w;
48
   input [3:0] thr_w;        // decoded tid_w
49
   input       ifu_exu_kill_e;
50
   input       ifu_exu_setcc_d;
51
   input [7:0] byp_ecl_wrccr_data_w;// for the WRCCR operation (LSBs of
52
   input       wb_ccr_wrccr_w; // ALU result) + wen signal
53
   input       wb_ccr_setcc_g;
54
   input [7:0] divcntl_ccr_cc_w2;
55
   input [1:0] wb_ccr_thr_g;
56
   input       tlu_exu_cwpccr_update_m;
57
   input [7:0] tlu_exu_ccr_m;
58
   input       ifu_exu_inst_vld_w;
59
   input       ifu_tlu_flush_w;
60
   input       early_flush_w;
61
 
62
   output [7:0] exu_ifu_cc_d;   // condition codes for current thread
63
   output [7:0] exu_tlu_ccr0_w;
64
   output [7:0] exu_tlu_ccr1_w;
65
   output [7:0] exu_tlu_ccr2_w;
66
   output [7:0] exu_tlu_ccr3_w;
67
 
68
   wire [7:0]   partial_cc_d;   // partial bypassed ccr
69
   wire [7:0]   alu_cc_e;   // alu combined condition codes
70
   wire [7:0]   alu_cc_m;   // m stage alu ccs
71
   wire [7:0]   alu_cc_w;
72
   wire [7:0]   exu_ifu_cc_w;   // writeback data
73
   wire         setcc_e;        // from previous stage
74
   wire         setcc_m;
75
   wire         setcc_w;
76
   wire         valid_setcc_e;  // after comparing with kill
77
   wire         valid_setcc_m;
78
   wire         valid_setcc_w;
79
   wire         setcc_w2;
80
   wire [7:0]   ccrin_thr0;
81
   wire [7:0]   ccrin_thr1;
82
   wire [7:0]   ccrin_thr2;
83
   wire [7:0]   ccrin_thr3;
84
   wire [7:0]   ccr_d;
85
   wire [7:0]   ccr_thr0;
86
   wire [7:0]   ccr_thr1;
87
   wire [7:0]   ccr_thr2;
88
   wire [7:0]   ccr_thr3;
89
   wire         use_alu_cc;
90
   wire         use_ccr;
91
   wire         use_cc_e;
92
   wire         use_cc_m;
93
   wire         use_cc_w;
94
   wire  [1:0]   tid_dxorw;
95
   wire         thr_match_de;
96
   wire         thrmatch_w;
97
   wire [1:0]   thr_w2;
98
   wire          thr0_w2;
99
   wire          thr1_w2;
100
   wire          thr2_w2;
101
   wire          thr3_w2;
102
   wire          wen_thr0_w;    // write enable for each input/thread
103
   wire          wen_thr0_w2;
104
   wire          wen_thr1_w;
105
   wire          wen_thr1_w2;
106
   wire          wen_thr2_w;
107
   wire          wen_thr2_w2;
108
   wire          wen_thr3_w;
109
   wire          wen_thr3_w2;
110
   wire          wen_thr0_l;      // overall write enable for each thread
111
   wire          wen_thr1_l;
112
   wire          wen_thr2_l;
113
   wire          wen_thr3_l;
114
   wire          bypass_cc_w;
115
 
116
   wire [7:0]    ccr_m;
117
 
118
 
119
   // D2E flops
120
   dff_s dff_setcc_d2e(.din(ifu_exu_setcc_d), .clk(clk), .q(setcc_e),
121
                     .se(se), .si(), .so());
122
 
123
   // E stage
124
   assign       alu_cc_e = {alu_xcc_e, alu_icc_e};
125
   assign       valid_setcc_e = setcc_e & ~ifu_exu_kill_e;
126
 
127
   dff_s #(8) dff_cc_e2m(.din(alu_cc_e[7:0]), .clk(clk), .q(alu_cc_m[7:0]),
128
                  .se(se), .si(), .so());
129
   dff_s dff_setcc_e2m(.din(valid_setcc_e), .clk(clk), .q(setcc_m),
130
                     .se(se), .si(), .so());
131
 
132
   // M stage
133
   assign       valid_setcc_m = setcc_m | tlu_exu_cwpccr_update_m;
134
   mux2ds #(8) mux_ccr_m(.dout(ccr_m[7:0]),
135
                            .in0(alu_cc_m[7:0]),
136
                            .in1(tlu_exu_ccr_m[7:0]),
137
                            .sel0(~tlu_exu_cwpccr_update_m),
138
                            .sel1(tlu_exu_cwpccr_update_m));
139
 
140
   dff_s #(8) dff_cc_m2w(.din(ccr_m[7:0]), .clk(clk), .q(alu_cc_w[7:0]),
141
                  .se(se), .si(), .so());
142
   dff_s dff_setcc_m2w(.din(valid_setcc_m), .clk(clk), .q(setcc_w),
143
                     .se(se), .si(), .so());
144
 
145
   // W stage
146
   assign bypass_cc_w = ifu_exu_inst_vld_w & setcc_w;
147
   assign valid_setcc_w = ~ifu_tlu_flush_w & ~early_flush_w & ifu_exu_inst_vld_w & (setcc_w | wb_ccr_wrccr_w);
148
 
149
   // mux with wrccr
150
   assign        use_alu_cc = ~(wb_ccr_wrccr_w);
151
   mux2ds #(8) mux_ccrin_cc(.dout(exu_ifu_cc_w[7:0]), .sel0(wb_ccr_wrccr_w),
152
                          .sel1(use_alu_cc),
153
                          .in0(byp_ecl_wrccr_data_w[7:0]),
154
                          .in1(alu_cc_w[7:0]));
155
 
156
   dff_s #(3) setcc_g2w2 (.din({wb_ccr_setcc_g, wb_ccr_thr_g[1:0]}), .clk(clk),
157
                        .q({setcc_w2, thr_w2[1:0]}),
158
                        .se(se), .si(), .so());
159
 
160
 
161
   /////////////////////////
162
   // Storage of ccr
163
   /////////////////////////
164
`ifdef FPGA_SYN_1THREAD
165
 
166
   assign          thr0_w2 = ~thr_w2[1] & ~thr_w2[0];
167
   assign          wen_thr0_w = (thr_w[0] & valid_setcc_w & ~wen_thr0_w2);
168
   assign          wen_thr0_w2 = thr0_w2 & setcc_w2;
169
   assign          wen_thr0_l = ~(wen_thr0_w | wen_thr0_w2);
170
   // mux between cc_w, cc_w2, old value, tlu value
171
   mux3ds #(8) mux_ccrin0(.dout(ccrin_thr0[7:0]), .sel0(wen_thr0_w),
172
                          .sel1(wen_thr0_w2), .sel2(wen_thr0_l),
173
                          .in0(exu_ifu_cc_w[7:0]),
174
                          .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr0[7:0]));
175
   // store new value
176
   dff_s #(8) dff_ccr_thr0(.din(ccrin_thr0[7:0]), .clk(clk), .q(ccr_thr0[7:0]),
177
                       .se(se), .si(), .so());
178
   assign          ccr_d[7:0] = ccr_thr0[7:0];
179
 
180
`else // !`ifdef FPGA_SYN_1THREAD
181
 
182
   // decode thr_w2 for mux select
183
   assign        thr0_w2 = ~thr_w2[1] & ~thr_w2[0];
184
   assign        thr1_w2 = ~thr_w2[1] & thr_w2[0];
185
   assign        thr2_w2 = thr_w2[1] & ~thr_w2[0];
186
   assign        thr3_w2 = thr_w2[1] & thr_w2[0];
187
   // enable input for each thread
188
   assign        wen_thr0_w = (thr_w[0] & valid_setcc_w & ~wen_thr0_w2);
189
   assign        wen_thr0_w2 = thr0_w2 & setcc_w2;
190
   assign        wen_thr0_l = ~(wen_thr0_w | wen_thr0_w2);
191
   assign        wen_thr1_w = (thr_w[1] & valid_setcc_w & ~wen_thr1_w2);
192
   assign        wen_thr1_w2 = (thr1_w2 & setcc_w2);
193
   assign        wen_thr1_l = ~(wen_thr1_w | wen_thr1_w2);
194
   assign        wen_thr2_w = (thr_w[2] & valid_setcc_w & ~wen_thr2_w2);
195
   assign        wen_thr2_w2 = (thr2_w2 & setcc_w2);
196
   assign        wen_thr2_l = ~(wen_thr2_w | wen_thr2_w2);
197
   assign        wen_thr3_w = (thr_w[3] & valid_setcc_w & ~wen_thr3_w2);
198
   assign        wen_thr3_w2 = (thr3_w2 & setcc_w2);
199
   assign        wen_thr3_l = ~(wen_thr3_w | wen_thr3_w2);
200
 
201
   // mux between cc_w, cc_w2, old value, tlu value
202
   mux3ds #(8) mux_ccrin0(.dout(ccrin_thr0[7:0]), .sel0(wen_thr0_w),
203
                          .sel1(wen_thr0_w2), .sel2(wen_thr0_l),
204
                          .in0(exu_ifu_cc_w[7:0]),
205
                          .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr0[7:0]));
206
   mux3ds #(8) mux_ccrin1(.dout(ccrin_thr1[7:0]), .sel0(wen_thr1_w),
207
                          .sel1(wen_thr1_w2), .sel2(wen_thr1_l),
208
                          .in0(exu_ifu_cc_w[7:0]),
209
                          .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr1[7:0]));
210
   mux3ds #(8) mux_ccrin2(.dout(ccrin_thr2[7:0]), .sel0(wen_thr2_w),
211
                          .sel1(wen_thr2_w2), .sel2(wen_thr2_l),
212
                          .in0(exu_ifu_cc_w[7:0]),
213
                          .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr2[7:0]));
214
   mux3ds #(8) mux_ccrin3(.dout(ccrin_thr3[7:0]), .sel0(wen_thr3_w),
215
                          .sel1(wen_thr3_w2), .sel2(wen_thr3_l),
216
                          .in0(exu_ifu_cc_w[7:0]),
217
                          .in1(divcntl_ccr_cc_w2[7:0]), .in2(ccr_thr3[7:0]));
218
 
219
   // store new value
220
   dff_s #(8) dff_ccr_thr0(.din(ccrin_thr0[7:0]), .clk(clk), .q(ccr_thr0[7:0]),
221
                       .se(se), .si(), .so());
222
   dff_s #(8) dff_ccr_thr1(.din(ccrin_thr1[7:0]), .clk(clk), .q(ccr_thr1[7:0]),
223
                       .se(se), .si(), .so());
224
   dff_s #(8) dff_ccr_thr2(.din(ccrin_thr2[7:0]), .clk(clk), .q(ccr_thr2[7:0]),
225
                       .se(se), .si(), .so());
226
   dff_s #(8) dff_ccr_thr3(.din(ccrin_thr3[7:0]), .clk(clk), .q(ccr_thr3[7:0]),
227
                       .se(se), .si(), .so());
228
 
229
 
230
   // mux between the 4 sets of ccrs
231
   mux4ds #(8) mux_ccr_out(.dout(ccr_d[7:0]), .sel0(thrdec_d[0]),
232
                         .sel1(thrdec_d[1]), .sel2(thrdec_d[2]),
233
                         .sel3(thrdec_d[3]), .in0(ccr_thr0[7:0]),
234
                         .in1(ccr_thr1[7:0]), .in2(ccr_thr2[7:0]),
235
                         .in3(ccr_thr3[7:0]));
236
`endif // !`ifdef FPGA_SYN_1THREAD
237
 
238
   // bypass the ccs to the output.  Only alu result needs to be bypassed
239
   assign        exu_ifu_cc_d[7:0] = (use_cc_e)? alu_cc_e[7:0]: partial_cc_d[7:0];
240
   mux3ds #(8) mux_ccr_bypass1(.dout(partial_cc_d[7:0]),
241
                               .sel0(use_ccr),
242
                               .sel1(use_cc_m),
243
                               .sel2(use_cc_w),
244
                               .in0(ccr_d[7:0]),
245
                               .in1(alu_cc_m[7:0]),
246
                               .in2(alu_cc_w[7:0]));
247
 
248
   assign        use_cc_e = valid_setcc_e & thr_match_de;
249
   assign        use_cc_m = setcc_m & thr_match_dm;
250
   assign        use_cc_w = bypass_cc_w & thrmatch_w & ~use_cc_m;
251
   assign        use_ccr = ~(use_cc_m | use_cc_w);
252
 
253
   assign        tid_dxorw = tid_w ^ tid_d;
254
 
255
   assign        thrmatch_w = ~(tid_dxorw[1] | tid_dxorw[0]);
256
 
257
   // generate ccr_w for the tlu
258
   assign        exu_tlu_ccr0_w[7:0] = ccr_thr0[7:0];
259
   assign        exu_tlu_ccr1_w[7:0] = ccr_thr1[7:0];
260
   assign        exu_tlu_ccr2_w[7:0] = ccr_thr2[7:0];
261
   assign        exu_tlu_ccr3_w[7:0] = ccr_thr3[7:0];
262
 
263
 
264
endmodule // sparc_exu_eclccr

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.