OpenCores

Rev 6	Rev 8
Line 1...	Line 1...
	`timescale 1ns / 1ps
`// ============================================================================`	`// ============================================================================`
`// __`	`// __`
`// \\__/ o\ (C) 2006-2016 Robert Finch, Stratford`	`// \\__/ o\ (C) 2006-2016 Robert Finch, Waterloo`
`// \ __ / All rights reserved.`	`// \ __ / All rights reserved.`
`// \/_// robfinch<remove>@finitron.ca`	`// \/_// robfinch<remove>@finitron.ca`
`// \|\|`	`// \|\|`
`//`	`//`
	`// fpMul.v`
	`// - floating point multiplier`
	`// - two cycle latency`
	`// - can issue every clock cycle`
	`// - parameterized width`
	`// - IEEE 754 representation`
	`//`
	`//`
`// This source file is free software: you can redistribute it and/or modify`	`// This source file is free software: you can redistribute it and/or modify`
`// it under the terms of the GNU Lesser General Public License as published`	`// it under the terms of the GNU Lesser General Public License as published`
`// by the Free Software Foundation, either version 3 of the License, or`	`// by the Free Software Foundation, either version 3 of the License, or`
`// (at your option) any later version.`	`// (at your option) any later version.`
`//`	`//`
Line 16...	Line 25...
`// GNU General Public License for more details.`	`// GNU General Public License for more details.`
`//`	`//`
`// You should have received a copy of the GNU General Public License`	`// You should have received a copy of the GNU General Public License`
`// along with this program. If not, see <http://www.gnu.org/licenses/>.`	`// along with this program. If not, see <http://www.gnu.org/licenses/>.`
`//`	`//`
`// fpMul.v`	`// Floating Point Multiplier / Divider`
`// - floating point multiplier`	`//`
`// - two cycle latency`	`// This multiplier/divider handles denormalized numbers.`
`// - can issue every clock cycle`	`// The output format is of an internal expanded representation`
`// - parameterized width`	`// in preparation to be fed into a normalization unit, then`
`// - IEEE 754 representation`	`// rounding. Basically, it's the same as the regular format`
	`// except the mantissa is doubled in size, the leading two`
	`// bits of which are assumed to be whole bits.`
	`//`
`//`	`//`
`// Floating Point Multiplier`	`// Floating Point Multiplier`
`//`	`//`
`// Properties:`	`// Properties:`
`// +-inf * +-inf = -+inf (this is handled by exOver)`	`// +-inf * +-inf = -+inf (this is handled by exOver)`
`// +-inf * 0 = QNaN`	`// +-inf * 0 = QNaN`
`//`	`//`
`// ============================================================================`	`// 1 sign number`
	`// 8 exponent`
	`// 48 mantissa`
`//`	`//`
	`// ============================================================================`

`module fpMul (clk, ce, a, b, o, sign_exe, inf, overflow, underflow);`	`module fpMul (clk, ce, a, b, o, sign_exe, inf, overflow, underflow);`
`parameter WID = 32;`	`parameter WID = 128;`
`localparam MSB = WID-1;`	`localparam MSB = WID-1;`
`localparam EMSB =`	`localparam EMSB = WID==128 ? 14 :`
	`WID==96 ? 14 :`
`WID==80 ? 14 :`	`WID==80 ? 14 :`
`WID==64 ? 10 :`	`WID==64 ? 10 :`
`WID==52 ? 10 :`	`WID==52 ? 10 :`
`WID==48 ? 10 :`	`WID==48 ? 10 :`
`WID==44 ? 10 :`	`WID==44 ? 10 :`
`WID==42 ? 10 :`	`WID==42 ? 10 :`
`WID==40 ? 9 :`	`WID==40 ? 9 :`
`WID==32 ? 7 :`	`WID==32 ? 7 :`
`WID==24 ? 6 : 4;`	`WID==24 ? 6 : 4;`
`localparam FMSB =`	`localparam FMSB = WID==128 ? 111 :`
	`WID==96 ? 79 :`
`WID==80 ? 63 :`	`WID==80 ? 63 :`
`WID==64 ? 51 :`	`WID==64 ? 51 :`
`WID==52 ? 39 :`	`WID==52 ? 39 :`
`WID==48 ? 35 :`	`WID==48 ? 35 :`
`WID==44 ? 31 :`	`WID==44 ? 31 :`
`WID==42 ? 29 :`	`WID==42 ? 29 :`
`WID==40 ? 28 :`	`WID==40 ? 28 :`
`WID==32 ? 22 :`	`WID==32 ? 22 :`
`WID==24 ? 15 : 9;`	`WID==24 ? 15 : 9;`

`localparam WX = 3;`	`localparam FX = (FMSB+2)*2-1; // the MSB of the expanded fraction`
`localparam FX = (FMSB+1)*2-1; // the MSB of the expanded fraction`	`localparam EX = FX + 1 + EMSB + 1 + 1 - 1;`
`localparam EX = FX + WX + EMSB + 1;`

`input clk;`	`input clk;`
`input ce;`	`input ce;`
`input [WID:1] a, b;`	`input [WID:1] a, b;`
`output [EX+1:0] o;`	`output [EX:0] o;`
`output sign_exe;`	`output sign_exe;`
`output inf;`	`output inf;`
`output overflow;`	`output overflow;`
`output underflow;`	`output underflow;`

`reg [EMSB:0] xo1; // extra bit for sign`	`reg [EMSB:0] xo1; // extra bit for sign`
`reg [FX+WX:0] mo1;`	`reg [FX:0] mo1;`

`// constants`	`// constants`
`wire [EMSB:0] infXp = {EMSB+1{1'b1}}; // infinite / NaN - all ones`	`wire [EMSB:0] infXp = {EMSB+1{1'b1}}; // infinite / NaN - all ones`
`// The following is the value for an exponent of zero, with the offset`	`// The following is the value for an exponent of zero, with the offset`
`// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.`	`// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.`
`wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}}; //2^0 exponent`	`wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}}; //2^0 exponent`
`// The following is a template for a quiet nan. (MSB=1)`	`// The following is a template for a quiet nan. (MSB=1)`
`wire [FMSB:0] qNaN = {1'b1,{FMSB{1'b0}}};`	`wire [FMSB:0] qNaN = {1'b1,{FMSB{1'b0}}};`

`// variables`	`// variables`
`reg [FX+WX:0] fract1,fract1a;`	`reg [FX:0] fract1,fract1a;`
`wire [FX+WX:0] fracto;`	`wire [FX:0] fracto;`
`wire [EMSB+2:0] ex1; // sum of exponents`	`wire [EMSB+2:0] ex1; // sum of exponents`
`wire [EMSB :0] ex2;`	`wire [EMSB :0] ex2;`

`// Decompose the operands`	`// Decompose the operands`
`wire sa, sb; // sign bit`	`wire sa, sb; // sign bit`
`wire [EMSB:0] xa, xb; // exponent bits`	`wire [EMSB:0] xa, xb; // exponent bits`
`wire [FMSB+1:0] fracta, fractb;`	`wire [FMSB+1:0] fracta, fractb;`
`wire a_dn, b_dn; // a/b is denormalized`	`wire a_dn, b_dn; // a/b is denormalized`
	`wire aNan, bNan, aNan1, bNan1;`
`wire az, bz;`	`wire az, bz;`
`wire aInf, bInf, aInf1, bInf1;`	`wire aInf, bInf, aInf1, bInf1;`


`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
Line 102...	Line 120...
`// - derive basic information`	`// - derive basic information`
`// - calculate exponent`	`// - calculate exponent`
`// - calculate fraction`	`// - calculate fraction`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`

`fpDecompose #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf) );`	`fpDecomp #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf), .nan(aNan) );`
`fpDecompose #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf) );`	`fpDecomp #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf), .nan(bNan) );`

`// Compute the sum of the exponents.`	`// Compute the sum of the exponents.`
`// correct the exponent for denormalized operands`	`// correct the exponent for denormalized operands`
`// adjust the sum by the exponent offset (subtract 127)`	`// adjust the sum by the exponent offset (subtract 127)`
`// mul: ex1 = xa + xb, result should always be < 1ffh`	`// mul: ex1 = xa + xb, result should always be < 1ffh`
`assign ex1 = (az\|bz) ? 0 : (xa\|a_dn) + (xb\|b_dn) - bias;`	`assign ex1 = (az\|bz) ? 0 : (xa\|a_dn) + (xb\|b_dn) - bias;`
`generate`
`if (WID==64) begin`
`reg [35:0] p00,p01,p02;`	`reg [35:0] p00,p01,p02;`
`reg [35:0] p10,p11,p12;`	`reg [35:0] p10,p11,p12;`
`reg [35:0] p20,p21,p22;`	`reg [35:0] p20,p21,p22;`
	`generate`
	`if (WID==64) begin`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) begin`	`if (ce) begin`
`p00 <= fracta[17: 0] * fractb[17: 0];`	`p00 <= fracta[17: 0] * fractb[17: 0];`
`p01 <= fracta[35:18] * fractb[17: 0];`	`p01 <= fracta[35:18] * fractb[17: 0];`
`p02 <= fracta[52:36] * fractb[17: 0];`	`p02 <= fracta[52:36] * fractb[17: 0];`
Line 133...	Line 152...
`{p22,72'b0} + {p21,54'b0} + {p20,36'b0}`	`{p22,72'b0} + {p21,54'b0} + {p20,36'b0}`
`;`	`;`
`end`	`end`
`end`	`end`
`else if (WID==32) begin`	`else if (WID==32) begin`
`reg [35:0] p00,p01;`
`reg [35:0] p10,p11;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) begin`	`if (ce) begin`
`p00 <= fracta[17: 0] * fractb[17: 0];`	`p00 <= fracta[17: 0] * fractb[17: 0];`
`p01 <= fracta[23:18] * fractb[17: 0];`	`p01 <= fracta[23:18] * fractb[17: 0];`
`p10 <= fracta[17: 0] * fractb[23:18];`	`p10 <= fracta[17: 0] * fractb[23:18];`
`p11 <= fracta[23:18] * fractb[23:18];`	`p11 <= fracta[23:18] * fractb[23:18];`
`fract1 <= {p11,p00} + {p01,18'b0} + {p10,18'b0};`	`fract1 <= {p11,p00} + {p01,18'b0} + {p10,18'b0};`
`end`	`end`
`end`	`end`
	`else begin`
	`always @(posedge clk)`
	`if (ce)`
	`fract1 <= fracta * fractb;`
	`end`
`endgenerate`	`endgenerate`

`// Status`	`// Status`
`wire under1, over1;`	`wire under1, over1;`
`wire under = ex1[EMSB+2]; // exponent underflow`	`wire under = ex1[EMSB+2]; // exponent underflow`
`wire over = (&ex1[EMSB:0] \| ex1[EMSB+1]) & !ex1[EMSB+2];`	`wire over = (&ex1[EMSB:0] \| ex1[EMSB+1]) & !ex1[EMSB+2];`

`delay2 #(EMSB+1) u3 (.clk(clk), .ce(ce), .i(ex1[EMSB:0]), .o(ex2) );`	`delay2 #(EMSB+1) u3 (.clk(clk), .ce(ce), .i(ex1[EMSB:0]), .o(ex2) );`
`delay2 #(FX+WX+1) u4 (.clk(clk), .ce(ce), .i(fract1), .o(fracto) );`	`delay2 #(FX+1) u4 (.clk(clk), .ce(ce), .i(fract1), .o(fracto) );`
`delay2 u2a (.clk(clk), .ce(ce), .i(aInf), .o(aInf1) );`	`delay2 u2a (.clk(clk), .ce(ce), .i(aInf), .o(aInf1) );`
`delay2 u2b (.clk(clk), .ce(ce), .i(bInf), .o(bInf1) );`	`delay2 u2b (.clk(clk), .ce(ce), .i(bInf), .o(bInf1) );`
`delay2 u6 (.clk(clk), .ce(ce), .i(under), .o(under1) );`	`delay2 u6 (.clk(clk), .ce(ce), .i(under), .o(under1) );`
`delay2 u7 (.clk(clk), .ce(ce), .i(over), .o(over1) );`	`delay2 u7 (.clk(clk), .ce(ce), .i(over), .o(over1) );`

`// determine when a NaN is output`	`// determine when a NaN is output`
`wire qNaNOut;`	`wire qNaNOut;`
	`wire [WID-1:0] a1,b1;`
`delay2 u5 (.clk(clk), .ce(ce), .i((aInf&bz)\|(bInf&az)), .o(qNaNOut) );`	`delay2 u5 (.clk(clk), .ce(ce), .i((aInf&bz)\|(bInf&az)), .o(qNaNOut) );`
	`delay2 u14 (.clk(clk), .ce(ce), .i(aNan), .o(aNan1) );`
	`delay2 u15 (.clk(clk), .ce(ce), .i(bNan), .o(bNan1) );`
	`delay2 #(WID) u16 (.clk(clk), .ce(ce), .i(a), .o(a1) );`
	`delay2 #(WID) u17 (.clk(clk), .ce(ce), .i(b), .o(b1) );`

`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// Second clock`	`// Second clock`
`// - correct xponent and mantissa for exceptional conditions`	`// - correct xponent and mantissa for exceptional conditions`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
Line 173...	Line 199...
`wire so1;`	`wire so1;`
`delay3 u8 (.clk(clk), .ce(ce), .i(sa ^ sb), .o(so1) );// two clock delay!`	`delay3 u8 (.clk(clk), .ce(ce), .i(sa ^ sb), .o(so1) );// two clock delay!`

`always @(posedge clk)`	`always @(posedge clk)`
`if (ce)`	`if (ce)`
`casex({qNaNOut,aInf1,bInf1,over1,under1})`	`casex({qNaNOut\|aNan1\|bNan1,aInf1,bInf1,over1,under1})`
`5'b1xxxx: xo1 = infXp; // qNaN - infinity * zero`	`5'b1xxxx: xo1 = infXp; // qNaN - infinity * zero`
`5'b01xxx: xo1 = infXp; // 'a' infinite`	`5'b01xxx: xo1 = infXp; // 'a' infinite`
`5'b001xx: xo1 = infXp; // 'b' infinite`	`5'b001xx: xo1 = infXp; // 'b' infinite`
`5'b0001x: xo1 = infXp; // result overflow`	`5'b0001x: xo1 = infXp; // result overflow`
`5'b00001: xo1 = 0; // underflow`	`5'b00001: xo1 = 0; // underflow`
`default: xo1 = ex2[EMSB:0]; // situation normal`	`default: xo1 = ex2[EMSB:0]; // situation normal`
`endcase`	`endcase`

`always @(posedge clk)`	`always @(posedge clk)`
`if (ce)`	`if (ce)`
`casex({qNaNOut,aInf1,bInf1,over1})`	`casex({aNan1,bNan1,qNaNOut,aInf1,bInf1,over1})`
`4'b1xxx: mo1 = {1'b0,qNaN\|3'd4,{FMSB+1{1'b0}}}; // multiply inf * zero`	`6'b1xxxxx: mo1 = {1'b0,a1[FMSB:0],{FMSB+1{1'b0}}};`
`4'b01xx: mo1 = 0; // mul inf's`	`6'bx1xxxx: mo1 = {1'b0,b1[FMSB:0],{FMSB+1{1'b0}}};`
`4'b001x: mo1 = 0; // mul inf's`	`6'bxx1xxx: mo1 = {1'b0,qNaN\|3'd4,{FMSB+1{1'b0}}}; // multiply inf * zero`
`4'b0001: mo1 = 0; // mul overflow`	`6'b0001xx: mo1 = 0; // mul inf's`
	`6'b00001x: mo1 = 0; // mul inf's`
	`6'b000001: mo1 = 0; // mul overflow`
`default: mo1 = fracto;`	`default: mo1 = fracto;`
`endcase`	`endcase`

`delay3 u10 (.clk(clk), .ce(ce), .i(sa & sb), .o(sign_exe) );`	`delay3 u10 (.clk(clk), .ce(ce), .i(sa & sb), .o(sign_exe) );`
`delay1 u11 (.clk(clk), .ce(ce), .i(over1), .o(overflow) );`	`delay1 u11 (.clk(clk), .ce(ce), .i(over1), .o(overflow) );`
Line 203...	Line 231...

`endmodule`	`endmodule`

`module fpMul_tb();`	`module fpMul_tb();`
`reg clk;`	`reg clk;`
`wire ce = 1'b1;`
`wire sgnx1,sgnx2,sgnx3,sgnx4,sgnx5,sgnx6;`
`wire inf1,inf2,inf3,inf4,inf5,inf6;`
`wire of1,of2,of3,of4,of5,of6;`
`wire uf1,uf2,uf3,uf4,uf5,uf6;`
`wire [57:0] o1,o2,o3,o4,o5,o6;`
`wire [35:0] o11,o12,o13;`
`wire [31:0] o21,o22,o23;`

`initial begin`	`initial begin`
`clk = 0;`	`clk = 0;`
`end`	`end`
`always #10 clk <= ~clk;`	`always #10 clk <= ~clk;`

`fpMul u1 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o1), .sign_exe(sgnx1), .inf(inf1), .overflow(of1), .underflow(uf1));`	`fpMul u1 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o1), .sign_exe(sgnx1), .inf(inf1), .overflow(of1), .underflow(uf1));`
`fpMul u2 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o2), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));`	`fpMul u2 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o1), .sign_exe(sgnx1), .inf(inf1), .overflow(of1), .underflow(uf1));`
`// 10x10`
`fpMul u3 (.clk(clk), .ce(1'b1), .a(32'h41200000), .b(32'h41200000), .o(o3), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));`
`// 21*-17`
`fpMul u4 (.clk(clk), .ce(1'b1), .a(32'h41a80000), .b(32'hc1880000), .o(o4), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));`
`// -17*-15`
`fpMul u5 (.clk(clk), .ce(1'b1), .a(32'hc1880000), .b(32'hc1700000), .o(o5), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));`

`fpNormalize u11 (clk, ce, 1'b0, o3, o11);`
`fpNormalize u12 (clk, ce, 1'b0, o4, o12);`
`fpNormalize u13 (clk, ce, 1'b0, o5, o13);`

`fpRound u21 (3'd1, o11, o21); // zero for zero`
`fpRound u22 (3'd1, o12, o22); //`
`fpRound u23 (3'd1, o13, o23); //`

`endmodule`	`endmodule`

`No newline at end of file`	`No newline at end of file`

Line 1...

`timescale 1ns / 1ps

// ============================================================================

// ============================================================================

//        __

//        __

//   \\__/ o\    (C) 2006-2016  Robert Finch, Stratford

//   \\__/ o\    (C) 2006-2016  Robert Finch, Waterloo

//    \  __ /    All rights reserved.

//    \  __ /    All rights reserved.

//     \/_//     robfinch<remove>@finitron.ca

//     \/_//     robfinch<remove>@finitron.ca

//       ||

//       ||

//

//

//      fpMul.v

//              - floating point multiplier

//              - two cycle latency

//              - can issue every clock cycle

//              - parameterized width

//              - IEEE 754 representation

//

//

// This source file is free software: you can redistribute it and/or modify

// This source file is free software: you can redistribute it and/or modify

// it under the terms of the GNU Lesser General Public License as published

// it under the terms of the GNU Lesser General Public License as published

// by the Free Software Foundation, either version 3 of the License, or

// by the Free Software Foundation, either version 3 of the License, or

// (at your option) any later version.

// (at your option) any later version.

//

//

Line 16...

Line 25...

// GNU General Public License for more details.

// GNU General Public License for more details.

//

//

// You should have received a copy of the GNU General Public License

// You should have received a copy of the GNU General Public License

// along with this program.  If not, see <http://www.gnu.org/licenses/>.

// along with this program.  If not, see <http://www.gnu.org/licenses/>.

//

//

//      fpMul.v

//      Floating Point Multiplier / Divider

//              - floating point multiplier

//

//              - two cycle latency

//      This multiplier/divider handles denormalized numbers.

//              - can issue every clock cycle

//      The output format is of an internal expanded representation

//              - parameterized width

//      in preparation to be fed into a normalization unit, then

//              - IEEE 754 representation

//      rounding. Basically, it's the same as the regular format

//      except the mantissa is doubled in size, the leading two

//      bits of which are assumed to be whole bits.

//

//

//

//      Floating Point Multiplier

//      Floating Point Multiplier

//

//

//      Properties:

//      Properties:

//      +-inf * +-inf = -+inf   (this is handled by exOver)

//      +-inf * +-inf = -+inf   (this is handled by exOver)

//      +-inf * 0     = QNaN

//      +-inf * 0     = QNaN

//

//

// ============================================================================

//      1 sign number

//      8 exponent

//      48 mantissa

//

//

// ============================================================================

module fpMul (clk, ce, a, b, o, sign_exe, inf, overflow, underflow);

module fpMul (clk, ce, a, b, o, sign_exe, inf, overflow, underflow);

parameter WID = 32;

parameter WID = 128;

localparam MSB = WID-1;

localparam MSB = WID-1;

localparam EMSB =

localparam EMSB = WID==128 ? 14 :

                  WID==96 ? 14 :

          WID==80 ? 14 :

          WID==80 ? 14 :

          WID==64 ? 10 :

          WID==64 ? 10 :

                                  WID==52 ? 10 :

                                  WID==52 ? 10 :

                                  WID==48 ? 10 :

                                  WID==48 ? 10 :

                                  WID==44 ? 10 :

                                  WID==44 ? 10 :

                                  WID==42 ? 10 :

                                  WID==42 ? 10 :

                                  WID==40 ?  9 :

                                  WID==40 ?  9 :

                                  WID==32 ?  7 :

                                  WID==32 ?  7 :

                                  WID==24 ?  6 : 4;

                                  WID==24 ?  6 : 4;

localparam FMSB =

localparam FMSB = WID==128 ? 111 :

                  WID==96 ? 79 :

          WID==80 ? 63 :

          WID==80 ? 63 :

          WID==64 ? 51 :

          WID==64 ? 51 :

                                  WID==52 ? 39 :

                                  WID==52 ? 39 :

                                  WID==48 ? 35 :

                                  WID==48 ? 35 :

                                  WID==44 ? 31 :

                                  WID==44 ? 31 :

                                  WID==42 ? 29 :

                                  WID==42 ? 29 :

                                  WID==40 ? 28 :

                                  WID==40 ? 28 :

                                  WID==32 ? 22 :

                                  WID==32 ? 22 :

                                  WID==24 ? 15 : 9;

                                  WID==24 ? 15 : 9;

localparam WX = 3;

localparam FX = (FMSB+2)*2-1;   // the MSB of the expanded fraction

localparam FX = (FMSB+1)*2-1;   // the MSB of the expanded fraction

localparam EX = FX + 1 + EMSB + 1 + 1 - 1;

localparam EX = FX + WX + EMSB + 1;

input clk;

input clk;

input ce;

input ce;

input  [WID:1] a, b;

input  [WID:1] a, b;

output [EX+1:0] o;

output [EX:0] o;

output sign_exe;

output sign_exe;

output inf;

output inf;

output overflow;

output overflow;

output underflow;

output underflow;

reg [EMSB:0] xo1;                // extra bit for sign

reg [EMSB:0] xo1;                // extra bit for sign

reg [FX+WX:0] mo1;

reg [FX:0] mo1;

// constants

// constants

wire [EMSB:0] infXp = {EMSB+1{1'b1}};    // infinite / NaN - all ones

wire [EMSB:0] infXp = {EMSB+1{1'b1}};    // infinite / NaN - all ones

// The following is the value for an exponent of zero, with the offset

// The following is the value for an exponent of zero, with the offset

// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.

// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.

wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}};        //2^0 exponent

wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}};        //2^0 exponent

// The following is a template for a quiet nan. (MSB=1)

// The following is a template for a quiet nan. (MSB=1)

wire [FMSB:0] qNaN  = {1'b1,{FMSB{1'b0}}};

wire [FMSB:0] qNaN  = {1'b1,{FMSB{1'b0}}};

// variables

// variables

reg [FX+WX:0] fract1,fract1a;

reg [FX:0] fract1,fract1a;

wire [FX+WX:0] fracto;

wire [FX:0] fracto;

wire [EMSB+2:0] ex1;     // sum of exponents

wire [EMSB+2:0] ex1;     // sum of exponents

wire [EMSB  :0] ex2;

wire [EMSB  :0] ex2;

// Decompose the operands

// Decompose the operands

wire sa, sb;                    // sign bit

wire sa, sb;                    // sign bit

wire [EMSB:0] xa, xb;    // exponent bits

wire [EMSB:0] xa, xb;    // exponent bits

wire [FMSB+1:0] fracta, fractb;

wire [FMSB+1:0] fracta, fractb;

wire a_dn, b_dn;                        // a/b is denormalized

wire a_dn, b_dn;                        // a/b is denormalized

wire aNan, bNan, aNan1, bNan1;

wire az, bz;

wire az, bz;

wire aInf, bInf, aInf1, bInf1;

wire aInf, bInf, aInf1, bInf1;

// -----------------------------------------------------------

// -----------------------------------------------------------

Line 102...

Line 120...

// - derive basic information

// - derive basic information

// - calculate exponent

// - calculate exponent

// - calculate fraction

// - calculate fraction

// -----------------------------------------------------------

// -----------------------------------------------------------

fpDecompose #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf) );

fpDecomp #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf), .nan(aNan) );

fpDecompose #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf) );

fpDecomp #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf), .nan(bNan) );

// Compute the sum of the exponents.

// Compute the sum of the exponents.

// correct the exponent for denormalized operands

// correct the exponent for denormalized operands

// adjust the sum by the exponent offset (subtract 127)

// adjust the sum by the exponent offset (subtract 127)

// mul: ex1 = xa + xb,  result should always be < 1ffh

// mul: ex1 = xa + xb,  result should always be < 1ffh

assign ex1 = (az|bz) ? 0 : (xa|a_dn) + (xb|b_dn) - bias;

assign ex1 = (az|bz) ? 0 : (xa|a_dn) + (xb|b_dn) - bias;

generate

if (WID==64) begin

        reg [35:0] p00,p01,p02;

        reg [35:0] p00,p01,p02;

        reg [35:0] p10,p11,p12;

        reg [35:0] p10,p11,p12;

        reg [35:0] p20,p21,p22;

        reg [35:0] p20,p21,p22;

generate

if (WID==64) begin

        always @(posedge clk)

        always @(posedge clk)

        if (ce) begin

        if (ce) begin

                p00 <= fracta[17: 0] * fractb[17: 0];

                p00 <= fracta[17: 0] * fractb[17: 0];

                p01 <= fracta[35:18] * fractb[17: 0];

                p01 <= fracta[35:18] * fractb[17: 0];

                p02 <= fracta[52:36] * fractb[17: 0];

                p02 <= fracta[52:36] * fractb[17: 0];

Line 133...

Line 152...

                                        {p22,72'b0} + {p21,54'b0} + {p20,36'b0}

                                        {p22,72'b0} + {p21,54'b0} + {p20,36'b0}

end

end

end

end

else if (WID==32) begin

else if (WID==32) begin

        reg [35:0] p00,p01;

        reg [35:0] p10,p11;

        always @(posedge clk)

        always @(posedge clk)

        if (ce) begin

        if (ce) begin

                p00 <= fracta[17: 0] * fractb[17: 0];

                p00 <= fracta[17: 0] * fractb[17: 0];

                p01 <= fracta[23:18] * fractb[17: 0];

                p01 <= fracta[23:18] * fractb[17: 0];

                p10 <= fracta[17: 0] * fractb[23:18];

                p10 <= fracta[17: 0] * fractb[23:18];

                p11 <= fracta[23:18] * fractb[23:18];

                p11 <= fracta[23:18] * fractb[23:18];

                fract1 <= {p11,p00} + {p01,18'b0} + {p10,18'b0};

                fract1 <= {p11,p00} + {p01,18'b0} + {p10,18'b0};

end

end

end

end

else begin

        always @(posedge clk)

    if (ce)

        fract1 <= fracta * fractb;

end

endgenerate

endgenerate

// Status

// Status

wire under1, over1;

wire under1, over1;

wire under = ex1[EMSB+2];       // exponent underflow

wire under = ex1[EMSB+2];       // exponent underflow

wire over = (&ex1[EMSB:0] | ex1[EMSB+1]) & !ex1[EMSB+2];

wire over = (&ex1[EMSB:0] | ex1[EMSB+1]) & !ex1[EMSB+2];

delay2 #(EMSB+1) u3 (.clk(clk), .ce(ce), .i(ex1[EMSB:0]), .o(ex2) );

delay2 #(EMSB+1) u3 (.clk(clk), .ce(ce), .i(ex1[EMSB:0]), .o(ex2) );

delay2 #(FX+WX+1) u4 (.clk(clk), .ce(ce), .i(fract1), .o(fracto) );

delay2 #(FX+1) u4 (.clk(clk), .ce(ce), .i(fract1), .o(fracto) );

delay2 u2a (.clk(clk), .ce(ce), .i(aInf), .o(aInf1) );

delay2 u2a (.clk(clk), .ce(ce), .i(aInf), .o(aInf1) );

delay2 u2b (.clk(clk), .ce(ce), .i(bInf), .o(bInf1) );

delay2 u2b (.clk(clk), .ce(ce), .i(bInf), .o(bInf1) );

delay2 u6  (.clk(clk), .ce(ce), .i(under), .o(under1) );

delay2 u6  (.clk(clk), .ce(ce), .i(under), .o(under1) );

delay2 u7  (.clk(clk), .ce(ce), .i(over), .o(over1) );

delay2 u7  (.clk(clk), .ce(ce), .i(over), .o(over1) );

// determine when a NaN is output

// determine when a NaN is output

wire qNaNOut;

wire qNaNOut;

wire [WID-1:0] a1,b1;

delay2 u5 (.clk(clk), .ce(ce), .i((aInf&bz)|(bInf&az)), .o(qNaNOut) );

delay2 u5 (.clk(clk), .ce(ce), .i((aInf&bz)|(bInf&az)), .o(qNaNOut) );

delay2 u14 (.clk(clk), .ce(ce), .i(aNan), .o(aNan1) );

delay2 u15 (.clk(clk), .ce(ce), .i(bNan), .o(bNan1) );

delay2 #(WID) u16 (.clk(clk), .ce(ce), .i(a), .o(a1) );

delay2 #(WID) u17 (.clk(clk), .ce(ce), .i(b), .o(b1) );

// -----------------------------------------------------------

// -----------------------------------------------------------

// Second clock

// Second clock

// - correct xponent and mantissa for exceptional conditions

// - correct xponent and mantissa for exceptional conditions

// -----------------------------------------------------------

// -----------------------------------------------------------

Line 173...

Line 199...

wire so1;

wire so1;

delay3 u8 (.clk(clk), .ce(ce), .i(sa ^ sb), .o(so1) );// two clock delay!

delay3 u8 (.clk(clk), .ce(ce), .i(sa ^ sb), .o(so1) );// two clock delay!

always @(posedge clk)

always @(posedge clk)

        if (ce)

        if (ce)

                casex({qNaNOut,aInf1,bInf1,over1,under1})

                casex({qNaNOut|aNan1|bNan1,aInf1,bInf1,over1,under1})

                5'b1xxxx:       xo1 = infXp;    // qNaN - infinity * zero

                5'b1xxxx:       xo1 = infXp;    // qNaN - infinity * zero

                5'b01xxx:       xo1 = infXp;    // 'a' infinite

                5'b01xxx:       xo1 = infXp;    // 'a' infinite

                5'b001xx:       xo1 = infXp;    // 'b' infinite

                5'b001xx:       xo1 = infXp;    // 'b' infinite

                5'b0001x:       xo1 = infXp;    // result overflow

                5'b0001x:       xo1 = infXp;    // result overflow

                5'b00001:       xo1 = 0;         // underflow

                5'b00001:       xo1 = 0;         // underflow

                default:        xo1 = ex2[EMSB:0];       // situation normal

                default:        xo1 = ex2[EMSB:0];       // situation normal

                endcase

                endcase

always @(posedge clk)

always @(posedge clk)

        if (ce)

        if (ce)

                casex({qNaNOut,aInf1,bInf1,over1})

                casex({aNan1,bNan1,qNaNOut,aInf1,bInf1,over1})

                4'b1xxx:        mo1 = {1'b0,qNaN|3'd4,{FMSB+1{1'b0}}};  // multiply inf * zero

                6'b1xxxxx:  mo1 = {1'b0,a1[FMSB:0],{FMSB+1{1'b0}}};

                4'b01xx:        mo1 = 0; // mul inf's

        6'bx1xxxx:  mo1 = {1'b0,b1[FMSB:0],{FMSB+1{1'b0}}};

                4'b001x:        mo1 = 0; // mul inf's

                6'bxx1xxx:      mo1 = {1'b0,qNaN|3'd4,{FMSB+1{1'b0}}};  // multiply inf * zero

                4'b0001:        mo1 = 0; // mul overflow

                6'b0001xx:      mo1 = 0; // mul inf's

                6'b00001x:      mo1 = 0; // mul inf's

                6'b000001:      mo1 = 0; // mul overflow

                default:        mo1 = fracto;

                default:        mo1 = fracto;

                endcase

                endcase

delay3 u10 (.clk(clk), .ce(ce), .i(sa & sb), .o(sign_exe) );

delay3 u10 (.clk(clk), .ce(ce), .i(sa & sb), .o(sign_exe) );

delay1 u11 (.clk(clk), .ce(ce), .i(over1),  .o(overflow) );

delay1 u11 (.clk(clk), .ce(ce), .i(over1),  .o(overflow) );

Line 203...

Line 231...

endmodule

endmodule

module fpMul_tb();

module fpMul_tb();

reg clk;

reg clk;

wire ce = 1'b1;

wire sgnx1,sgnx2,sgnx3,sgnx4,sgnx5,sgnx6;

wire inf1,inf2,inf3,inf4,inf5,inf6;

wire of1,of2,of3,of4,of5,of6;

wire uf1,uf2,uf3,uf4,uf5,uf6;

wire [57:0] o1,o2,o3,o4,o5,o6;

wire [35:0] o11,o12,o13;

wire [31:0] o21,o22,o23;

initial begin

initial begin

        clk = 0;

        clk = 0;

end

end

always #10 clk <= ~clk;

always #10 clk <= ~clk;

fpMul u1 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o1), .sign_exe(sgnx1), .inf(inf1), .overflow(of1), .underflow(uf1));

fpMul u1 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o1), .sign_exe(sgnx1), .inf(inf1), .overflow(of1), .underflow(uf1));

fpMul u2 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o2), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));

fpMul u2 (.clk(clk), .ce(1'b1), .a(0), .b(0), .o(o1), .sign_exe(sgnx1), .inf(inf1), .overflow(of1), .underflow(uf1));

// 10x10

fpMul u3 (.clk(clk), .ce(1'b1), .a(32'h41200000), .b(32'h41200000), .o(o3), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));

// 21*-17

fpMul u4 (.clk(clk), .ce(1'b1), .a(32'h41a80000), .b(32'hc1880000), .o(o4), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));

// -17*-15

fpMul u5 (.clk(clk), .ce(1'b1), .a(32'hc1880000), .b(32'hc1700000), .o(o5), .sign_exe(sgnx2), .inf(inf2), .overflow(of2), .underflow(uf2));

fpNormalize u11 (clk, ce, 1'b0, o3, o11);

fpNormalize u12 (clk, ce, 1'b0, o4, o12);

fpNormalize u13 (clk, ce, 1'b0, o5, o13);

fpRound u21 (3'd1, o11, o21);         // zero for zero

fpRound u22 (3'd1, o12, o22); //

fpRound u23 (3'd1, o13, o23); //

endmodule

endmodule

 No newline at end of file

 No newline at end of file

Browse

Tools

Subversion Repositories ft816float

[/] [ft816float/] [trunk/] [rtl/] [verilog/] [fpMul.v] - Diff between revs 6 and 8