OpenCores
URL https://opencores.org/ocsvn/s1_core/s1_core/trunk

Subversion Repositories s1_core

[/] [s1_core/] [trunk/] [hdl/] [rtl/] [sparc_core/] [sparc_exu_div.v] - Blame information for rev 113

Details | Compare with Previous | View Log

Line No. Rev Author Line
1 95 fafa1971
// ========== Copyright Header Begin ==========================================
2
// 
3
// OpenSPARC T1 Processor File: sparc_exu_div.v
4
// Copyright (c) 2006 Sun Microsystems, Inc.  All Rights Reserved.
5
// DO NOT ALTER OR REMOVE COPYRIGHT NOTICES.
6
// 
7
// The above named program is free software; you can redistribute it and/or
8
// modify it under the terms of the GNU General Public
9
// License version 2 as published by the Free Software Foundation.
10
// 
11
// The above named program is distributed in the hope that it will be 
12
// useful, but WITHOUT ANY WARRANTY; without even the implied warranty of
13
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
// General Public License for more details.
15
// 
16
// You should have received a copy of the GNU General Public
17
// License along with this work; if not, write to the Free Software
18
// Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA.
19
// 
20
// ========== Copyright Header End ============================================
21 113 albert.wat
`ifdef SIMPLY_RISC_TWEAKS
22
`define SIMPLY_RISC_SCANIN .si(0)
23
`else
24
`define SIMPLY_RISC_SCANIN .si()
25
`endif
26 95 fafa1971
////////////////////////////////////////////////////////////////////////
27
/*
28
//  Module Name: sparc_exu_div
29
*/
30
module sparc_exu_div (/*AUTOARG*/
31
   // Outputs
32
   so, div_ecl_xin_msb_l, div_ecl_x_msb, div_ecl_d_msb,
33
   div_ecl_cout64, div_ecl_cout32, div_ecl_gencc_in_msb_l,
34
   div_ecl_gencc_in_31, div_ecl_upper32_equal, div_ecl_low32_nonzero,
35
   div_ecl_dividend_msb, div_byp_muldivout_g, div_byp_yreg_e,
36
   div_ecl_yreg_0_l, exu_mul_rs1_data, exu_mul_rs2_data,
37
   div_ecl_adder_out_31, div_ecl_detect_zero_low,
38
   div_ecl_detect_zero_high, div_ecl_d_62,
39
   // Inputs
40
   ecl_div_yreg_wen_w, ecl_div_yreg_wen_l, ecl_div_yreg_wen_g,
41
   ecl_div_yreg_shift_g, ecl_div_yreg_data_31_g, ecl_div_thr_e,
42
   byp_div_yreg_data_w, rclk, se, si, ecl_div_keep_d,
43
   ecl_div_ld_inputs, ecl_div_sel_adder, ecl_div_last_cycle,
44
   ecl_div_almostlast_cycle, ecl_div_div64, ecl_div_sel_u32,
45
   ecl_div_sel_pos32, ecl_div_sel_neg32, ecl_div_sel_64b,
46
   ecl_div_upper32_zero, ecl_div_upper33_one, ecl_div_upper33_zero,
47
   mul_exu_data_g, ecl_div_sel_div, ecl_div_mul_wen,
48
   ecl_div_dividend_sign, ecl_div_subtract_l, ecl_div_cin,
49
   ecl_div_newq, ecl_div_xinmask, ecl_div_keepx,
50
   ecl_div_mul_get_new_data, ecl_div_mul_keep_data,
51
   ecl_div_mul_get_32bit_data, ecl_div_mul_sext_rs2_e,
52
   ecl_div_mul_sext_rs1_e, byp_div_rs1_data_e, byp_div_rs2_data_e,
53
   ecl_div_muls_rs1_31_e_l, ecl_div_muls, ecl_div_zero_rs2_e
54
   ) ;
55
   /*AUTOINPUT*/
56
   // Beginning of automatic inputs (from unused autoinst inputs)
57
   input [31:0]         byp_div_yreg_data_w;    // To yreg of sparc_exu_div_yreg.v
58
   input [3:0]          ecl_div_thr_e;          // To yreg of sparc_exu_div_yreg.v
59
   input                ecl_div_yreg_data_31_g; // To yreg of sparc_exu_div_yreg.v
60
   input [3:0]          ecl_div_yreg_shift_g;   // To yreg of sparc_exu_div_yreg.v
61
   input [3:0]          ecl_div_yreg_wen_g;     // To yreg of sparc_exu_div_yreg.v
62
   input [3:0]          ecl_div_yreg_wen_l;     // To yreg of sparc_exu_div_yreg.v
63
   input [3:0]          ecl_div_yreg_wen_w;     // To yreg of sparc_exu_div_yreg.v
64
   // End of automatics
65
   input rclk;
66
   input se;
67
   input si;
68
   input        ecl_div_keep_d; // d should store (w/ overflow calcs)
69
   input        ecl_div_ld_inputs;// load in d and x
70
   input        ecl_div_sel_adder;// d should use adder output
71
   input        ecl_div_last_cycle;// last cycle of computations
72
   input         ecl_div_almostlast_cycle;// 2nd to last cycle of div
73
   input   ecl_div_div64;
74
   input         ecl_div_sel_u32;
75
   input         ecl_div_sel_pos32;
76
   input         ecl_div_sel_neg32;
77
   input         ecl_div_sel_64b;
78
   input         ecl_div_upper32_zero;
79
   input         ecl_div_upper33_one;
80
   input         ecl_div_upper33_zero;
81
   input [63:0]  mul_exu_data_g;
82
   input         ecl_div_sel_div;
83
   input         ecl_div_mul_wen;
84
   input         ecl_div_dividend_sign;
85
   input         ecl_div_subtract_l;     // add/subtract to adder
86
   input         ecl_div_cin;
87
   input  ecl_div_newq;         // newest q bit
88
   input         ecl_div_xinmask;
89
   input  ecl_div_keepx;
90
   input         ecl_div_mul_get_new_data;
91
   input         ecl_div_mul_keep_data;
92
   input         ecl_div_mul_get_32bit_data;
93
   input         ecl_div_mul_sext_rs2_e;
94
   input         ecl_div_mul_sext_rs1_e;
95
   input [63:0]  byp_div_rs1_data_e;
96
   input [63:0]  byp_div_rs2_data_e;
97
   input         ecl_div_muls_rs1_31_e_l;
98
   input         ecl_div_muls;
99
   input         ecl_div_zero_rs2_e;
100
 
101
   output        so;
102
   output div_ecl_xin_msb_l;
103
   output div_ecl_x_msb;
104
   output div_ecl_d_msb;
105
   output div_ecl_cout64;       // cout from adder
106
   output div_ecl_cout32;       // cout from adder
107
   output        div_ecl_gencc_in_msb_l;
108
   output        div_ecl_gencc_in_31;
109
   output        div_ecl_upper32_equal;
110
   output        div_ecl_low32_nonzero;
111
   output        div_ecl_dividend_msb;
112
   output [63:0] div_byp_muldivout_g;
113
   output [31:0] div_byp_yreg_e;
114
   output [3:0]  div_ecl_yreg_0_l;
115
   output [63:0]          exu_mul_rs1_data;
116
   output [63:0]          exu_mul_rs2_data;
117
   output                 div_ecl_adder_out_31;
118
   output        div_ecl_detect_zero_low;
119
   output        div_ecl_detect_zero_high;
120
   output        div_ecl_d_62;
121
 
122
   /*AUTOWIRE*/
123
   // Beginning of automatic wires (for undeclared instantiated-module outputs)
124
   wire [31:0]          yreg_mdq_y_e;           // From yreg of sparc_exu_div_yreg.v
125
   // End of automatics
126
   wire                 clk;
127
   wire [127:0]  din;           // sign extended dividend
128
   wire [127:0]  d;             // current dividend/quotient
129
   wire [63:0]   adder_out;     // output of adder
130
   wire [127:0]  dnext;         // input to d flop
131
   wire [127:0]  adder_dnext;   // combination of adder out and quotient
132
   wire [63:0]   x;             // divisor
133
   wire [63:0]   xin;           // sign extended (for 32bit) divisor
134
   wire [63:0]   xnext;         // input to divisor flop
135
   wire [63:0]   adderin1;      // first input to adder
136
   wire [63:0]   adderin2;      // 2nd input to adder
137
 
138
   wire [63:0]   curr_q;        // current quotient
139
   wire [63:0]   out64;         // 64 bit result
140
   wire [63:0]   pos32;         // positive 32 bit result w/ ovfl
141
   wire [63:0]   neg32;         // negative 32 bit result w/ ovfl
142
   wire [63:0]   u32;           // unsigned 32 bit result w/ ovfl
143
   wire [63:0]   gencc_in;
144
   wire [63:0]   mul_result;
145
   wire [63:0]   mul_result_next;
146
   wire [127:0]  input_data_e;
147
   wire [63:0]   dividend;
148
   wire [63:0]   divisor;
149
   wire [127:0]  next_mul_data;
150
   wire [127:0]  mul_data_out;
151
   wire [127:0]  mul32_input_data_e;
152
   wire          subtract;
153
   wire [63:0]   spr_out;
154
   wire [63:0]   z_in;
155
 
156
   assign        clk = rclk;
157
   ///////////////////////////////////////
158
   // Input masking for 32 bit operations
159
   ///////////////////////////////////////
160
   dp_buffer #(128) buf_input_data(.dout(input_data_e[127:0]),
161
                                   .in({byp_div_rs2_data_e[63:0], byp_div_rs1_data_e[63:0]}));
162
   // Mux in yreg into upper 32 bits on 32 bit divides
163
   dp_mux2es #(32) dividendmux(.dout(dividend[63:32]),
164
                             .in0(yreg_mdq_y_e[31:0]),
165
                             .in1(input_data_e[63:32]),
166
                             .sel(ecl_div_div64));
167
   assign        dividend[31:0] = input_data_e[31:0];
168
   assign        divisor[63:0] = input_data_e[127:64];
169
 
170
 
171
   /////////////////////
172
   // Output assignment
173
   /////////////////////
174
   dp_mux2es #(64) output_mux(.dout(div_byp_muldivout_g[63:0]), .in1(d[63:0]),
175
                         .in0(mul_result[63:0]),
176
                         .sel(ecl_div_sel_div));
177
   ///////////////////////////
178
   // Generate Condition Codes and divide by zero exception and overflow
179
   ///////////////////////////
180
   dp_mux2es #(64) gencc_mux(.dout(gencc_in[63:0]),
181
                          .in0(mul_result[63:0]),
182
                          .in1(curr_q[63:0]),
183
                          .sel(ecl_div_sel_div));
184
   sparc_exu_div_32eql u32eql(.in(gencc_in[63:32]), .equal(div_ecl_upper32_equal));
185
   sparc_exu_aluor32 low32or(// Outputs
186
                             .out  (div_ecl_low32_nonzero),
187
                             // Inputs
188
                             .in    (gencc_in[31:0]));
189
   assign        div_ecl_gencc_in_msb_l = ~gencc_in[63];
190
   assign        div_ecl_gencc_in_31 = gencc_in[31];
191
 
192
 
193
   // Division overflow calculations
194
   assign        curr_q = d[127:64];
195
   assign        u32 = {32'b0, (curr_q[31:0] | {32{~ecl_div_upper32_zero}})};
196
   assign        pos32 = {33'b0, (curr_q[30:0] | {31{~ecl_div_upper33_zero}})};
197
   assign        neg32 = {{33{1'b1}}, (curr_q[30:0] & {31{ecl_div_upper33_one}})};
198
 
199
   mux4ds #(64) result_mux(.dout(out64[63:0]), .in0(curr_q[63:0]), .in1(u32[63:0]),
200
                         .in2(pos32[63:0]), .in3(neg32[63:0]), .sel0(ecl_div_sel_64b),
201
                         .sel1(ecl_div_sel_u32), .sel2(ecl_div_sel_pos32),
202
                         .sel3(ecl_div_sel_neg32));
203
 
204
   //////////////////////////
205
   // Logic for D (dividend)
206
   //////////////////////////
207
 
208
   // If signed div sign extend dividend to 127 bits
209
   assign        div_ecl_dividend_msb = dividend[63];
210
   assign        din[62:0] = dividend[62:0];
211
   dp_mux2es #(32) din_mux(.dout(din[94:63]),
212
                           .in0({{31{ecl_div_dividend_sign}}, dividend[63]}),
213
                           .in1({~ecl_div_muls_rs1_31_e_l, dividend[31:1]}),
214
                           .sel(ecl_div_muls));
215
   assign        din[127:95] = {33{ecl_div_dividend_sign}};
216
//   assign        din = {{64{ecl_div_dividend_sign}}, dividend[63:0]};
217
 
218
 
219
   // Select input to FF for d
220
   mux3ds #(128) d_mux(.dout(dnext[127:0]), .in0({d[127:64], out64[63:0]}),
221
                     .in1(adder_dnext[127:0]), .in2(din[127:0]),
222
                     .sel0(ecl_div_keep_d),
223
                     .sel1(ecl_div_sel_adder),
224
                     .sel2(ecl_div_ld_inputs));
225
   assign        div_ecl_d_62 = d[62];
226
 
227
   // FF for d
228 113 albert.wat
   dff_s #(128) d_dff(.din(dnext[127:0]), .clk(clk), .q(d[127:0]), .se(se), `SIMPLY_RISC_SCANIN, .so());
229 95 fafa1971
 
230
   ////////////////////////////
231
   // Logic for X (divisor)
232
   ////////////////////////////
233
   // if signed div and 32 bits sign extend to upper 32 bits
234
   dp_mux2es #(32) xin_mux(.dout(xin[63:32]), .in1(divisor[63:32]),
235
                      .in0({32{ecl_div_xinmask}}),
236
                      .sel(ecl_div_div64));
237
   assign        xin[31:0] = divisor[31:0] & {32{~ecl_div_zero_rs2_e}};
238
   //assign xin[31:0] = divisor[31:0];
239
 
240
   // Pick between x and divisor and 1 (use divisor on first cycle, 1 last cycle)
241
   mux3ds #(64) x_mux(.dout(xnext[63:0]), .in0(x[63:0]), .in1(xin[63:0]), .in2({64'b0}),
242
                    .sel0(ecl_div_keepx),
243
                    .sel1(ecl_div_ld_inputs),
244
                    .sel2(ecl_div_almostlast_cycle));
245
 
246
   // FF for x
247 113 albert.wat
   dff_s #(64) x_dff(.din(xnext[63:0]), .clk(clk), .q(x[63:0]), .se(se), `SIMPLY_RISC_SCANIN, .so());
248 95 fafa1971
 
249
 
250
   ///////////////////////////
251
   // Logic for inputs to adder
252
   //////////////////////////
253
   assign div_ecl_xin_msb_l = ~xin[63];
254
   assign div_ecl_x_msb = x[63];
255
   assign div_ecl_d_msb = d[127];
256
   dp_mux2es #(64) in1_mux(.dout(adderin1[63:0]), .in0(d[126:63]),
257
                      .in1({d[62:0], ecl_div_newq}), .sel(ecl_div_last_cycle));
258
 
259
   assign subtract = ~ecl_div_subtract_l;
260
   assign        adderin2[63:0] = x[63:0] ^ {64{subtract}};
261
 
262
   //////////////////////////
263
   //  Adder
264
   /////////////////////////
265
   sparc_exu_aluadder64 add64(// Outputs
266
                              .adder_out(adder_out[63:0]),
267
                              .cout32   (div_ecl_cout32),
268
                              .cout64   (div_ecl_cout64),
269
                              // Inputs
270
                              .rs1_data (adderin1[63:0]),
271
                              .rs2_data (adderin2[63:0]),
272
                              .cin      (ecl_div_cin));
273
 
274
   assign        adder_dnext = {adder_out[63:0], d[62:0], ecl_div_newq};
275
   assign        div_ecl_adder_out_31 = adder_out[31];
276
 
277
   // sum predict and zero detection
278
   sparc_exu_aluspr spr(.rs1_data(adderin1[63:0]), .rs2_data(adderin2[63:0]), .cin(ecl_div_cin),
279
                        .spr_out(spr_out[63:0]));
280
   dp_mux2es #(64) zero_detect_mux(.dout(z_in[63:0]),
281
                                   .in0(spr_out[63:0]),
282
                                   .in1(xin[63:0]),
283
                                   .sel(ecl_div_ld_inputs));
284
   //sparc_exu_aluzcmp64 regzcmp(.in(z_in[63:0]), .zero64(div_ecl_detect_zero));
285
   assign        div_ecl_detect_zero_low = ~(|z_in[31:0]);
286
   assign        div_ecl_detect_zero_high = ~(|z_in[63:32]);
287
 
288
 
289
   // y register
290
   assign        div_byp_yreg_e = yreg_mdq_y_e;
291
   sparc_exu_div_yreg yreg(.mul_div_yreg_data_g(mul_exu_data_g[63:32]),
292
                           /*AUTOINST*/
293
                           // Outputs
294
                           .yreg_mdq_y_e(yreg_mdq_y_e[31:0]),
295
                           .div_ecl_yreg_0_l(div_ecl_yreg_0_l[3:0]),
296
                           // Inputs
297
                           .clk         (clk),
298
                           .se          (se),
299
                           .byp_div_yreg_data_w(byp_div_yreg_data_w[31:0]),
300
                           .ecl_div_thr_e(ecl_div_thr_e[3:0]),
301
                           .ecl_div_yreg_wen_w(ecl_div_yreg_wen_w[3:0]),
302
                           .ecl_div_yreg_wen_g(ecl_div_yreg_wen_g[3:0]),
303
                           .ecl_div_yreg_wen_l(ecl_div_yreg_wen_l[3:0]),
304
                           .ecl_div_yreg_data_31_g(ecl_div_yreg_data_31_g),
305
                           .ecl_div_yreg_shift_g(ecl_div_yreg_shift_g[3:0]));
306
 
307
 
308
   //////////////////////////////////
309
   // MULTIPLIER inputs
310
   //////////////////////////////////                  
311
   assign        mul32_input_data_e[127:64] = {{32{ecl_div_mul_sext_rs2_e}}, input_data_e[95:64]};
312
   assign        mul32_input_data_e[63:0] = {{32{ecl_div_mul_sext_rs1_e}}, input_data_e[31:0]};
313
   mux3ds #(128) mul_data_mux(.dout(next_mul_data[127:0]),
314
                              .in0(input_data_e[127:0]),
315
                              .in1(mul32_input_data_e[127:0]),
316
                              .in2(mul_data_out[127:0]),
317
                              .sel0(ecl_div_mul_get_new_data),
318
                              .sel1(ecl_div_mul_get_32bit_data),
319
                              .sel2(ecl_div_mul_keep_data));
320 113 albert.wat
   dff_s #(128) mul_data_dff(.din(next_mul_data[127:0]), .clk(clk), .q(mul_data_out[127:0]),
321
                           .se(se), `SIMPLY_RISC_SCANIN, .so());
322 95 fafa1971
   assign        exu_mul_rs1_data = mul_data_out[63:0];
323
   assign        exu_mul_rs2_data = mul_data_out[127:64];
324
 
325
   ///////////////////////////////////
326
   // Store output from mul
327
   //////////////////////////////////
328
   dp_mux2es #(64) mul_result_mux(.dout(mul_result_next[63:0]), .in0(mul_result[63:0]),
329
                           .in1(mul_exu_data_g[63:0]),
330
                           .sel(ecl_div_mul_wen));
331 113 albert.wat
   dff_s #(64) mul_result_dff(.din(mul_result_next[63:0]), .clk(clk), .q(mul_result[63:0]),
332
                        .se(se), `SIMPLY_RISC_SCANIN, .so());
333 95 fafa1971
 
334
 
335
endmodule // sparc_exu_div

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.