OpenCores

Rev 14	Rev 26
`timescale 1ns / 1ps	`timescale 1ns / 1ps
`// ============================================================================`	`// ============================================================================`
`// __`	`// __`
`// \\__/ o\ (C) 2006-2018 Robert Finch, Waterloo`	`// \\__/ o\ (C) 2006-2019 Robert Finch, Waterloo`
`// \ __ / All rights reserved.`	`// \ __ / All rights reserved.`
`// \/_// robfinch<remove>@finitron.ca`	`// \/_// robfinch<remove>@finitron.ca`
`// \|\|`	`// \|\|`
`//`	`//`
`// fpDiv.v`	`// fpDiv.v`
`// - floating point divider`	`// - floating point divider`
`// - parameterized width`	`// - parameterized width`
`// - IEEE 754 representation`	`// - IEEE 754 representation`
`//`	`//`
`//`	`//`
`// This source file is free software: you can redistribute it and/or modify`	`// This source file is free software: you can redistribute it and/or modify`
`// it under the terms of the GNU Lesser General Public License as published`	`// it under the terms of the GNU Lesser General Public License as published`
`// by the Free Software Foundation, either version 3 of the License, or`	`// by the Free Software Foundation, either version 3 of the License, or`
`// (at your option) any later version.`	`// (at your option) any later version.`
`//`	`//`
`// This source file is distributed in the hope that it will be useful,`	`// This source file is distributed in the hope that it will be useful,`
`// but WITHOUT ANY WARRANTY; without even the implied warranty of`	`// but WITHOUT ANY WARRANTY; without even the implied warranty of`
`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`	`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
`// GNU General Public License for more details.`	`// GNU General Public License for more details.`
`//`	`//`
`// You should have received a copy of the GNU General Public License`	`// You should have received a copy of the GNU General Public License`
`// along with this program. If not, see <http://www.gnu.org/licenses/>.`	`// along with this program. If not, see <http://www.gnu.org/licenses/>.`
`//`	`//`
`// Floating Point Multiplier / Divider`	`// Floating Point Multiplier / Divider`
`//`	`//`
`//Properties:`	`//Properties:`
`//+-inf * +-inf = -+inf (this is handled by exOver)`	`//+-inf * +-inf = -+inf (this is handled by exOver)`
`//+-inf * 0 = QNaN`	`//+-inf * 0 = QNaN`
`//+-0 / +-0 = QNaN`	`//+-0 / +-0 = QNaN`
`// ============================================================================`	`// ============================================================================`

`include "fp_defines.v"	`include "fp_defines.v"
`define GOLDSCHMIDT 1'b1	//`define GOLDSCHMIDT 1'b1

`module fpDiv(rst, clk, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);`	`module fpDiv(rst, clk, clk4x, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);`

`parameter WID = 128;`	`parameter WID = 128;`
`localparam MSB = WID-1;`	`include "fpSize.sv"
`localparam EMSB = WID==128 ? 14 :`
`WID==96 ? 14 :`
`WID==80 ? 14 :`
`WID==64 ? 10 :`
`WID==52 ? 10 :`
`WID==48 ? 11 :`
`WID==44 ? 10 :`
`WID==42 ? 10 :`
`WID==40 ? 9 :`
`WID==32 ? 7 :`
`WID==24 ? 6 : 4;`
`localparam FMSB = WID==128 ? 111 :`
`WID==96 ? 79 :`
`WID==80 ? 63 :`
`WID==64 ? 51 :`
`WID==52 ? 39 :`
`WID==48 ? 34 :`
`WID==44 ? 31 :`
`WID==42 ? 29 :`
`WID==40 ? 28 :`
`WID==32 ? 22 :`
`WID==24 ? 15 : 9;`
`// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.`	`// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.`
`localparam FADD = WID==128 ? 9 :`	`localparam FADD = WID==128 ? 9 :`
`WID==96 ? 9 :`	`WID==96 ? 9 :`
	`WID==84 ? 9 :`
`WID==80 ? 9 :`	`WID==80 ? 9 :`
`WID==64 ? 13 :`	`WID==64 ? 13 :`
`WID==52 ? 9 :`	`WID==52 ? 9 :`
`WID==48 ? 10 :`	`WID==48 ? 10 :`
`WID==44 ? 9 :`	`WID==44 ? 9 :`
`WID==42 ? 11 :`	`WID==42 ? 11 :`
`WID==40 ? 8 :`	`WID==40 ? 8 :`
`WID==32 ? 10 :`	`WID==32 ? 10 :`
`WID==24 ? 9 : 11;`	`WID==24 ? 9 : 11;`

`localparam FX = (FMSB+2)*2-1; // the MSB of the expanded fraction`
`localparam EX = FX + 1 + EMSB + 1 + 1 - 1;`
`input rst;`	`input rst;`
`input clk;`	`input clk;`
	`input clk4x;`
`input ce;`	`input ce;`
`input ld;`	`input ld;`
`input op;`	`input op;`
`input [MSB:0] a, b;`	`input [MSB:0] a, b;`
`output [EX:0] o;`	`output [EX:0] o;`
`output done;`	`output done;`
`output sign_exe;`	`output sign_exe;`
`output overflow;`	`output overflow;`
`output underflow;`	`output underflow;`

`// registered outputs`	`// registered outputs`
`reg sign_exe=0;`	`reg sign_exe=0;`
`reg inf=0;`	`reg inf=0;`
`reg overflow=0;`	`reg overflow=0;`
`reg underflow=0;`	`reg underflow=0;`

`reg so;`	`reg so;`
`reg [EMSB:0] xo;`	`reg [EMSB:0] xo;`
`reg [FX:0] mo;`	`reg [FX:0] mo;`
`assign o = {so,xo,mo};`	`assign o = {so,xo,mo};`

`// constants`	`// constants`
`wire [EMSB:0] infXp = {EMSB+1{1'b1}}; // infinite / NaN - all ones`	`wire [EMSB:0] infXp = {EMSB+1{1'b1}}; // infinite / NaN - all ones`
`// The following is the value for an exponent of zero, with the offset`	`// The following is the value for an exponent of zero, with the offset`
`// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.`	`// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.`
`wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}}; //2^0 exponent`	`wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}}; //2^0 exponent`
`// The following is a template for a quiet nan. (MSB=1)`	`// The following is a template for a quiet nan. (MSB=1)`
`wire [FMSB:0] qNaN = {1'b1,{FMSB{1'b0}}};`	`wire [FMSB:0] qNaN = {1'b1,{FMSB{1'b0}}};`

`// variables`	`// variables`
`wire [EMSB+2:0] ex1; // sum of exponents`	`wire [EMSB+2:0] ex1; // sum of exponents`
`ifndef GOLDSCHMIDT	`ifndef GOLDSCHMIDT
`wire [(FMSB+FADD)*2-1:0] divo;`	`wire [(FMSB+FADD)*2-1:0] divo;`
`else	`else
`wire [(FMSB+5)*2-1:0] divo;`	`wire [(FMSB+5)*2-1:0] divo;`
`endif	`endif

`// Operands`	`// Operands`
`wire sa, sb; // sign bit`	`wire sa, sb; // sign bit`
`wire [EMSB:0] xa, xb; // exponent bits`	`wire [EMSB:0] xa, xb; // exponent bits`
`wire [FMSB+1:0] fracta, fractb;`	`wire [FMSB+1:0] fracta, fractb;`
`wire a_dn, b_dn; // a/b is denormalized`	`wire a_dn, b_dn; // a/b is denormalized`
`wire az, bz;`	`wire az, bz;`
`wire aInf, bInf;`	`wire aInf, bInf;`
`wire aNan,bNan;`	`wire aNan,bNan;`
`wire done1;`	`wire done1;`
`wire signed [7:0] lzcnt;`	`wire signed [7:0] lzcnt;`

`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// - decode the input operands`	`// - decode the input operands`
`// - derive basic information`	`// - derive basic information`
`// - calculate exponent`	`// - calculate exponent`
`// - calculate fraction`	`// - calculate fraction`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`

`fpDecomp #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf), .nan(aNan) );`	`fpDecomp #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf), .nan(aNan) );`
`fpDecomp #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf), .nan(bNan) );`	`fpDecomp #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf), .nan(bNan) );`

`// Compute the exponent.`	`// Compute the exponent.`
`// - correct the exponent for denormalized operands`	`// - correct the exponent for denormalized operands`
`// - adjust the difference by the bias (add 127)`	`// - adjust the difference by the bias (add 127)`
`// - also factor in the different decimal position for division`	`// - also factor in the different decimal position for division`
`ifndef GOLDSCHMIDT	`ifndef GOLDSCHMIDT
`assign ex1 = (xa\|a_dn) - (xb\|b_dn) + bias + FMSB + (FADD-1) - lzcnt - 8'd1;`	`assign ex1 = (xa\|a_dn) - (xb\|b_dn) + bias + FMSB + (FADD-1) - lzcnt - 8'd1;`
`else	`else
`assign ex1 = (xa\|a_dn) - (xb\|b_dn) + bias + FMSB - lzcnt + 8'd4;`	`assign ex1 = (xa\|a_dn) - (xb\|b_dn) + bias + FMSB - lzcnt + 8'd4;`
`endif	`endif

`// check for exponent underflow/overflow`	`// check for exponent underflow/overflow`
`wire under = ex1[EMSB+2]; // MSB set = negative exponent`	`wire under = ex1[EMSB+2]; // MSB set = negative exponent`
`wire over = (&ex1[EMSB:0] \| ex1[EMSB+1]) & !ex1[EMSB+2];`	`wire over = (&ex1[EMSB:0] \| ex1[EMSB+1]) & !ex1[EMSB+2];`

`// Perform divide`	`// Perform divide`
`// Divider width must be a multiple of four`	`// Divider width must be a multiple of four`
`ifndef GOLDSCHMIDT	`ifndef GOLDSCHMIDT
`fpdivr16 #(FMSB+FADD) u2 (.clk(clk), .ld(ld), .a({3'b0,fracta,8'b0}), .b({3'b0,fractb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));`	`fpdivr16 #(FMSB+FADD) u2 (.clk(clk), .ld(ld), .a({3'b0,fracta,8'b0}), .b({3'b0,fractb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));`
	`//fpdivr2 #(FMSB+FADD) u2 (.clk4x(clk4x), .ld(ld), .a({3'b0,fracta,8'b0}), .b({3'b0,fractb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));`
`wire [(FMSB+FADD)2-1:0] divo1 = divo[(FMSB+FADD)2-1:0] << (lzcnt-2);`	`wire [(FMSB+FADD)2-1:0] divo1 = divo[(FMSB+FADD)2-1:0] << (lzcnt-2);`
`else	`else
`DivGoldschmidt #(.WID(FMSB+6),.WHOLE(1),.POINTS(FMSB+5))`	`DivGoldschmidt #(.WID(FMSB+6),.WHOLE(1),.POINTS(FMSB+5))`
`u2 (.rst(rst), .clk(clk), .ld(ld), .a({fracta,4'b0}), .b({fractb,4'b0}), .q(divo), .done(done1), .lzcnt(lzcnt));`	`u2 (.rst(rst), .clk(clk), .ld(ld), .a({fracta,4'b0}), .b({fractb,4'b0}), .q(divo), .done(done1), .lzcnt(lzcnt));`
`wire [(FMSB+6)*2+1:0] divo1 =`	`wire [(FMSB+6)*2+1:0] divo1 =`
`lzcnt > 8'd5 ? divo << (lzcnt-8'd6) :`	`lzcnt > 8'd5 ? divo << (lzcnt-8'd6) :`
`divo >> (8'd6-lzcnt);`	`divo >> (8'd6-lzcnt);`
`;`	`;`
`endif	`endif
`delay1 #(1) u3 (.clk(clk), .ce(ce), .i(done1), .o(done));`	`delay1 #(1) u3 (.clk(clk), .ce(ce), .i(done1), .o(done));`


`// determine when a NaN is output`	`// determine when a NaN is output`
`wire qNaNOut = (az&bz)\|(aInf&bInf);`	`wire qNaNOut = (az&bz)\|(aInf&bInf);`

`always @(posedge clk)`	`always @(posedge clk)`
`// Simulation likes to see these values reset to zero on reset. Otherwise the`	`// Simulation likes to see these values reset to zero on reset. Otherwise the`
`// values propagate in sim as X's.`	`// values propagate in sim as X's.`
`if (rst) begin`	`if (rst) begin`
`xo <= 1'd0;`	`xo <= 1'd0;`
`mo <= 1'd0;`	`mo <= 1'd0;`
`so <= 1'd0;`	`so <= 1'd0;`
`sign_exe <= 1'd0;`	`sign_exe <= 1'd0;`
`overflow <= 1'd0;`	`overflow <= 1'd0;`
`underflow <= 1'd0;`	`underflow <= 1'd0;`
`end`	`end`
`else if (ce) begin`	`else if (ce) begin`
`if (done1) begin`	`if (done1) begin`
`casez({qNaNOut\|aNan\|bNan,bInf,bz,over,under})`	`casez({qNaNOut\|aNan\|bNan,bInf,bz,over,under})`
`5'b1????: xo <= infXp; // NaN exponent value`	`5'b1????: xo <= infXp; // NaN exponent value`
`5'b01???: xo <= 1'd0; // divide by inf`	`5'b01???: xo <= 1'd0; // divide by inf`
`5'b001??: xo <= infXp; // divide by zero`	`5'b001??: xo <= infXp; // divide by zero`
`5'b0001?: xo <= infXp; // overflow`	`5'b0001?: xo <= infXp; // overflow`
`5'b00001: xo <= 1'd0; // underflow`	`5'b00001: xo <= 1'd0; // underflow`
`default: xo <= ex1; // normal or underflow: passthru neg. exp. for normalization`	`default: xo <= ex1; // normal or underflow: passthru neg. exp. for normalization`
`endcase`	`endcase`

`casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})`	`casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})`
`8'b1???????: mo <= {1'b1,a[FMSB:0],{FMSB+1{1'b0}}};`	`8'b1???????: mo <= {1'b1,a[FMSB:0],{FMSB+1{1'b0}}};`
`8'b01??????: mo <= {1'b1,b[FMSB:0],{FMSB+1{1'b0}}};`	`8'b01??????: mo <= {1'b1,b[FMSB:0],{FMSB+1{1'b0}}};`
`8'b001?????: mo <= {1'b1,qNaN[FMSB:0]\|{aInf,1'b0}\|{az,bz},{FMSB+1{1'b0}}};`	`8'b001?????: mo <= {1'b1,qNaN[FMSB:0]\|{aInf,1'b0}\|{az,bz},{FMSB+1{1'b0}}};`
`8'b0001????: mo <= 1'd0; // div by inf`	`8'b0001????: mo <= 1'd0; // div by inf`
`8'b00001???: mo <= 1'd0; // div by zero`	`8'b00001???: mo <= 1'd0; // div by zero`
`8'b000001??: mo <= 1'd0; // Inf exponent`	`8'b000001??: mo <= 1'd0; // Inf exponent`
8'b0000001?: mo <= {1'b1,qNaN\|`QINFDIV,{FMSB+1{1'b0}}}; // infinity / infinity	8'b0000001?: mo <= {1'b1,qNaN\|`QINFDIV,{FMSB+1{1'b0}}}; // infinity / infinity
8'b00000001: mo <= {1'b1,qNaN\|`QZEROZERO,{FMSB+1{1'b0}}}; // zero / zero	8'b00000001: mo <= {1'b1,qNaN\|`QZEROZERO,{FMSB+1{1'b0}}}; // zero / zero
`ifndef GOLDSCHMIDT	`ifndef GOLDSCHMIDT
`default: mo <= divo1[(FMSB+FADD)2-1:(FADD-2)2-2]; // plain div`	`default: mo <= divo1[(FMSB+FADD)2-1:(FADD-2)2-2]; // plain div`
`else	`else
`default: mo <= divo1[(FMSB+6)*2+1:2]; // plain div`	`default: mo <= divo1[(FMSB+6)*2+1:2]; // plain div`
`endif	`endif
`endcase`	`endcase`

`so <= sa ^ sb;`	`so <= sa ^ sb;`
`sign_exe <= sa & sb;`	`sign_exe <= sa & sb;`
`overflow <= over;`	`overflow <= over;`
`underflow <= under;`	`underflow <= under;`
`end`	`end`
`end`	`end`

`endmodule`	`endmodule`

`module fpDivnr(rst, clk, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);`	`module fpDivnr(rst, clk, clk4x, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);`
`parameter WID=32;`	`parameter WID=32;`
`localparam MSB = WID-1;`	`include "fpSize.sv"
`localparam EMSB = WID==128 ? 14 :`
`WID==96 ? 14 :`
`WID==80 ? 14 :`
`WID==64 ? 10 :`
`WID==52 ? 10 :`
`WID==48 ? 11 :`
`WID==44 ? 10 :`
`WID==42 ? 10 :`
`WID==40 ? 9 :`
`WID==32 ? 7 :`
`WID==24 ? 6 : 4;`
`localparam FMSB = WID==128 ? 111 :`
`WID==96 ? 79 :`
`WID==80 ? 63 :`
`WID==64 ? 51 :`
`WID==52 ? 39 :`
`WID==48 ? 34 :`
`WID==44 ? 31 :`
`WID==42 ? 29 :`
`WID==40 ? 28 :`
`WID==32 ? 22 :`
`WID==24 ? 15 : 9;`

`localparam FX = (FMSB+2)*2-1; // the MSB of the expanded fraction`
`localparam EX = FX + 1 + EMSB + 1 + 1 - 1;`
`input rst;`	`input rst;`
`input clk;`	`input clk;`
	`input clk4x;`
`input ce;`	`input ce;`
`input ld;`	`input ld;`
`input op;`	`input op;`
`input [MSB:0] a, b;`	`input [MSB:0] a, b;`
`output [MSB:0] o;`	`output [MSB:0] o;`
`input [2:0] rm;`	`input [2:0] rm;`
`output sign_exe;`	`output sign_exe;`
`output done;`	`output done;`
`output inf;`	`output inf;`
`output overflow;`	`output overflow;`
`output underflow;`	`output underflow;`

`wire [EX:0] o1;`	`wire [EX:0] o1;`
`wire sign_exe1, inf1, overflow1, underflow1;`	`wire sign_exe1, inf1, overflow1, underflow1;`
`wire [MSB+3:0] fpn0;`	`wire [MSB+3:0] fpn0;`
`wire done1;`	`wire done1;`

`fpDiv #(WID) u1 (rst, clk, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);`	`fpDiv #(WID) u1 (rst, clk, clk4x, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);`
`fpNormalize #(WID) u2(.clk(clk), .ce(ce), .under(underflow1), .i(o1), .o(fpn0) );`	`fpNormalize #(WID) u2(.clk(clk), .ce(ce), .under(underflow1), .i(o1), .o(fpn0) );`
`fpRoundReg #(WID) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );`	`fpRoundReg #(WID) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );`
`delay2 #(1) u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));`	`delay2 #(1) u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));`
`delay2 #(1) u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));`	`delay2 #(1) u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));`
`delay2 #(1) u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));`	`delay2 #(1) u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));`
`delay2 #(1) u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));`	`delay2 #(1) u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));`
`delay2 #(1) u8(.clk(clk), .ce(ce), .i(done1), .o(done));`	`delay2 #(1) u8(.clk(clk), .ce(ce), .i(done1), .o(done));`
`endmodule`	`endmodule`

`timescale 1ns / 1ps

`timescale 1ns / 1ps

// ============================================================================

// ============================================================================

//        __

//        __

//   \\__/ o\    (C) 2006-2018  Robert Finch, Waterloo

//   \\__/ o\    (C) 2006-2019  Robert Finch, Waterloo

//    \  __ /    All rights reserved.

//    \  __ /    All rights reserved.

//     \/_//     robfinch<remove>@finitron.ca

//     \/_//     robfinch<remove>@finitron.ca

//       ||

//       ||

//

//

//      fpDiv.v

//      fpDiv.v

//    - floating point divider

//    - floating point divider

//    - parameterized width

//    - parameterized width

//    - IEEE 754 representation

//    - IEEE 754 representation

//

//

//

//

// This source file is free software: you can redistribute it and/or modify

// This source file is free software: you can redistribute it and/or modify

// it under the terms of the GNU Lesser General Public License as published

// it under the terms of the GNU Lesser General Public License as published

// by the Free Software Foundation, either version 3 of the License, or

// by the Free Software Foundation, either version 3 of the License, or

// (at your option) any later version.

// (at your option) any later version.

//

//

// This source file is distributed in the hope that it will be useful,

// This source file is distributed in the hope that it will be useful,

// but WITHOUT ANY WARRANTY; without even the implied warranty of

// but WITHOUT ANY WARRANTY; without even the implied warranty of

// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

// GNU General Public License for more details.

// GNU General Public License for more details.

//

//

// You should have received a copy of the GNU General Public License

// You should have received a copy of the GNU General Public License

// along with this program.  If not, see <http://www.gnu.org/licenses/>.

// along with this program.  If not, see <http://www.gnu.org/licenses/>.

//

//

//      Floating Point Multiplier / Divider

//      Floating Point Multiplier / Divider

//

//

//Properties:

//Properties:

//+-inf * +-inf = -+inf    (this is handled by exOver)

//+-inf * +-inf = -+inf    (this is handled by exOver)

//+-inf * 0     = QNaN

//+-inf * 0     = QNaN

//+-0 / +-0      = QNaN

//+-0 / +-0      = QNaN

// ============================================================================

// ============================================================================

`include "fp_defines.v"

`include "fp_defines.v"

`define GOLDSCHMIDT     1'b1

//`define GOLDSCHMIDT   1'b1

module fpDiv(rst, clk, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);

module fpDiv(rst, clk, clk4x, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);

parameter WID = 128;

parameter WID = 128;

localparam MSB = WID-1;

`include "fpSize.sv"

localparam EMSB = WID==128 ? 14 :

                  WID==96 ? 14 :

                  WID==80 ? 14 :

                  WID==64 ? 10 :

                                  WID==52 ? 10 :

                                  WID==48 ? 11 :

                                  WID==44 ? 10 :

                                  WID==42 ? 10 :

                                  WID==40 ?  9 :

                                  WID==32 ?  7 :

                                  WID==24 ?  6 : 4;

localparam FMSB = WID==128 ? 111 :

                  WID==96 ? 79 :

                  WID==80 ? 63 :

                  WID==64 ? 51 :

                                  WID==52 ? 39 :

                                  WID==48 ? 34 :

                                  WID==44 ? 31 :

                                  WID==42 ? 29 :

                                  WID==40 ? 28 :

                                  WID==32 ? 22 :

                                  WID==24 ? 15 : 9;

// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.

// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.

localparam FADD = WID==128 ? 9 :

localparam FADD = WID==128 ? 9 :

                                  WID==96 ? 9 :

                                  WID==96 ? 9 :

                                  WID==84 ? 9 :

                                  WID==80 ? 9 :

                                  WID==80 ? 9 :

                                  WID==64 ? 13 :

                                  WID==64 ? 13 :

                                  WID==52 ? 9 :

                                  WID==52 ? 9 :

                                  WID==48 ? 10 :

                                  WID==48 ? 10 :

                                  WID==44 ? 9 :

                                  WID==44 ? 9 :

                                  WID==42 ? 11 :

                                  WID==42 ? 11 :

                                  WID==40 ? 8 :

                                  WID==40 ? 8 :

                                  WID==32 ? 10 :

                                  WID==32 ? 10 :

                                  WID==24 ? 9 : 11;

                                  WID==24 ? 9 : 11;

localparam FX = (FMSB+2)*2-1;   // the MSB of the expanded fraction

localparam EX = FX + 1 + EMSB + 1 + 1 - 1;

input rst;

input rst;

input clk;

input clk;

input clk4x;

input ce;

input ce;

input ld;

input ld;

input op;

input op;

input [MSB:0] a, b;

input [MSB:0] a, b;

output [EX:0] o;

output [EX:0] o;

output done;

output done;

output sign_exe;

output sign_exe;

output overflow;

output overflow;

output underflow;

output underflow;

// registered outputs

// registered outputs

reg sign_exe=0;

reg sign_exe=0;

reg inf=0;

reg inf=0;

reg     overflow=0;

reg     overflow=0;

reg     underflow=0;

reg     underflow=0;

reg so;

reg so;

reg [EMSB:0] xo;

reg [EMSB:0] xo;

reg [FX:0] mo;

reg [FX:0] mo;

assign o = {so,xo,mo};

assign o = {so,xo,mo};

// constants

// constants

wire [EMSB:0] infXp = {EMSB+1{1'b1}};    // infinite / NaN - all ones

wire [EMSB:0] infXp = {EMSB+1{1'b1}};    // infinite / NaN - all ones

// The following is the value for an exponent of zero, with the offset

// The following is the value for an exponent of zero, with the offset

// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.

// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.

wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}};        //2^0 exponent

wire [EMSB:0] bias = {1'b0,{EMSB{1'b1}}};        //2^0 exponent

// The following is a template for a quiet nan. (MSB=1)

// The following is a template for a quiet nan. (MSB=1)

wire [FMSB:0] qNaN  = {1'b1,{FMSB{1'b0}}};

wire [FMSB:0] qNaN  = {1'b1,{FMSB{1'b0}}};

// variables

// variables

wire [EMSB+2:0] ex1;     // sum of exponents

wire [EMSB+2:0] ex1;     // sum of exponents

`ifndef GOLDSCHMIDT

`ifndef GOLDSCHMIDT

wire [(FMSB+FADD)*2-1:0] divo;

wire [(FMSB+FADD)*2-1:0] divo;

`else

`else

wire [(FMSB+5)*2-1:0] divo;

wire [(FMSB+5)*2-1:0] divo;

`endif

`endif

// Operands

// Operands

wire sa, sb;                    // sign bit

wire sa, sb;                    // sign bit

wire [EMSB:0] xa, xb;    // exponent bits

wire [EMSB:0] xa, xb;    // exponent bits

wire [FMSB+1:0] fracta, fractb;

wire [FMSB+1:0] fracta, fractb;

wire a_dn, b_dn;                        // a/b is denormalized

wire a_dn, b_dn;                        // a/b is denormalized

wire az, bz;

wire az, bz;

wire aInf, bInf;

wire aInf, bInf;

wire aNan,bNan;

wire aNan,bNan;

wire done1;

wire done1;

wire signed [7:0] lzcnt;

wire signed [7:0] lzcnt;

// -----------------------------------------------------------

// -----------------------------------------------------------

// - decode the input operands

// - decode the input operands

// - derive basic information

// - derive basic information

// - calculate exponent

// - calculate exponent

// - calculate fraction

// - calculate fraction

// -----------------------------------------------------------

// -----------------------------------------------------------

fpDecomp #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf), .nan(aNan) );

fpDecomp #(WID) u1a (.i(a), .sgn(sa), .exp(xa), .fract(fracta), .xz(a_dn), .vz(az), .inf(aInf), .nan(aNan) );

fpDecomp #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf), .nan(bNan) );

fpDecomp #(WID) u1b (.i(b), .sgn(sb), .exp(xb), .fract(fractb), .xz(b_dn), .vz(bz), .inf(bInf), .nan(bNan) );

// Compute the exponent.

// Compute the exponent.

// - correct the exponent for denormalized operands

// - correct the exponent for denormalized operands

// - adjust the difference by the bias (add 127)

// - adjust the difference by the bias (add 127)

// - also factor in the different decimal position for division

// - also factor in the different decimal position for division

`ifndef GOLDSCHMIDT

`ifndef GOLDSCHMIDT

assign ex1 = (xa|a_dn) - (xb|b_dn) + bias + FMSB + (FADD-1) - lzcnt - 8'd1;

assign ex1 = (xa|a_dn) - (xb|b_dn) + bias + FMSB + (FADD-1) - lzcnt - 8'd1;

`else

`else

assign ex1 = (xa|a_dn) - (xb|b_dn) + bias + FMSB - lzcnt + 8'd4;

assign ex1 = (xa|a_dn) - (xb|b_dn) + bias + FMSB - lzcnt + 8'd4;

`endif

`endif

// check for exponent underflow/overflow

// check for exponent underflow/overflow

wire under = ex1[EMSB+2];       // MSB set = negative exponent

wire under = ex1[EMSB+2];       // MSB set = negative exponent

wire over = (&ex1[EMSB:0] | ex1[EMSB+1]) & !ex1[EMSB+2];

wire over = (&ex1[EMSB:0] | ex1[EMSB+1]) & !ex1[EMSB+2];

// Perform divide

// Perform divide

// Divider width must be a multiple of four

// Divider width must be a multiple of four

`ifndef GOLDSCHMIDT

`ifndef GOLDSCHMIDT

fpdivr16 #(FMSB+FADD) u2 (.clk(clk), .ld(ld), .a({3'b0,fracta,8'b0}), .b({3'b0,fractb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));

fpdivr16 #(FMSB+FADD) u2 (.clk(clk), .ld(ld), .a({3'b0,fracta,8'b0}), .b({3'b0,fractb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));

//fpdivr2 #(FMSB+FADD) u2 (.clk4x(clk4x), .ld(ld), .a({3'b0,fracta,8'b0}), .b({3'b0,fractb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));

wire [(FMSB+FADD)*2-1:0] divo1 = divo[(FMSB+FADD)*2-1:0] << (lzcnt-2);

wire [(FMSB+FADD)*2-1:0] divo1 = divo[(FMSB+FADD)*2-1:0] << (lzcnt-2);

`else

`else

DivGoldschmidt #(.WID(FMSB+6),.WHOLE(1),.POINTS(FMSB+5))

DivGoldschmidt #(.WID(FMSB+6),.WHOLE(1),.POINTS(FMSB+5))

        u2 (.rst(rst), .clk(clk), .ld(ld), .a({fracta,4'b0}), .b({fractb,4'b0}), .q(divo), .done(done1), .lzcnt(lzcnt));

        u2 (.rst(rst), .clk(clk), .ld(ld), .a({fracta,4'b0}), .b({fractb,4'b0}), .q(divo), .done(done1), .lzcnt(lzcnt));

wire [(FMSB+6)*2+1:0] divo1 =

wire [(FMSB+6)*2+1:0] divo1 =

        lzcnt > 8'd5 ? divo << (lzcnt-8'd6) :

        lzcnt > 8'd5 ? divo << (lzcnt-8'd6) :

        divo >> (8'd6-lzcnt);

        divo >> (8'd6-lzcnt);

`endif

`endif

delay1 #(1) u3 (.clk(clk), .ce(ce), .i(done1), .o(done));

delay1 #(1) u3 (.clk(clk), .ce(ce), .i(done1), .o(done));

// determine when a NaN is output

// determine when a NaN is output

wire qNaNOut = (az&bz)|(aInf&bInf);

wire qNaNOut = (az&bz)|(aInf&bInf);

always @(posedge clk)

always @(posedge clk)

// Simulation likes to see these values reset to zero on reset. Otherwise the

// Simulation likes to see these values reset to zero on reset. Otherwise the

// values propagate in sim as X's.

// values propagate in sim as X's.

if (rst) begin

if (rst) begin

        xo <= 1'd0;

        xo <= 1'd0;

        mo <= 1'd0;

        mo <= 1'd0;

        so <= 1'd0;

        so <= 1'd0;

        sign_exe <= 1'd0;

        sign_exe <= 1'd0;

        overflow <= 1'd0;

        overflow <= 1'd0;

        underflow <= 1'd0;

        underflow <= 1'd0;

end

end

else if (ce) begin

else if (ce) begin

                if (done1) begin

                if (done1) begin

                        casez({qNaNOut|aNan|bNan,bInf,bz,over,under})

                        casez({qNaNOut|aNan|bNan,bInf,bz,over,under})

                        5'b1????:               xo <= infXp;    // NaN exponent value

                        5'b1????:               xo <= infXp;    // NaN exponent value

                        5'b01???:               xo <= 1'd0;             // divide by inf

                        5'b01???:               xo <= 1'd0;             // divide by inf

                        5'b001??:               xo <= infXp;    // divide by zero

                        5'b001??:               xo <= infXp;    // divide by zero

                        5'b0001?:               xo <= infXp;    // overflow

                        5'b0001?:               xo <= infXp;    // overflow

                        5'b00001:               xo <= 1'd0;             // underflow

                        5'b00001:               xo <= 1'd0;             // underflow

                        default:                xo <= ex1;      // normal or underflow: passthru neg. exp. for normalization

                        default:                xo <= ex1;      // normal or underflow: passthru neg. exp. for normalization

                        endcase

                        endcase

                        casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})

                        casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})

                        8'b1???????:    mo <= {1'b1,a[FMSB:0],{FMSB+1{1'b0}}};

                        8'b1???????:    mo <= {1'b1,a[FMSB:0],{FMSB+1{1'b0}}};

                        8'b01??????:    mo <= {1'b1,b[FMSB:0],{FMSB+1{1'b0}}};

                        8'b01??????:    mo <= {1'b1,b[FMSB:0],{FMSB+1{1'b0}}};

                        8'b001?????:    mo <= {1'b1,qNaN[FMSB:0]|{aInf,1'b0}|{az,bz},{FMSB+1{1'b0}}};

                        8'b001?????:    mo <= {1'b1,qNaN[FMSB:0]|{aInf,1'b0}|{az,bz},{FMSB+1{1'b0}}};

                        8'b0001????:    mo <= 1'd0;     // div by inf

                        8'b0001????:    mo <= 1'd0;     // div by inf

                        8'b00001???:    mo <= 1'd0;     // div by zero

                        8'b00001???:    mo <= 1'd0;     // div by zero

                        8'b000001??:    mo <= 1'd0;     // Inf exponent

                        8'b000001??:    mo <= 1'd0;     // Inf exponent

                        8'b0000001?:    mo <= {1'b1,qNaN|`QINFDIV,{FMSB+1{1'b0}}};      // infinity / infinity

                        8'b0000001?:    mo <= {1'b1,qNaN|`QINFDIV,{FMSB+1{1'b0}}};      // infinity / infinity

                        8'b00000001:    mo <= {1'b1,qNaN|`QZEROZERO,{FMSB+1{1'b0}}};    // zero / zero

                        8'b00000001:    mo <= {1'b1,qNaN|`QZEROZERO,{FMSB+1{1'b0}}};    // zero / zero

`ifndef GOLDSCHMIDT

`ifndef GOLDSCHMIDT

                        default:                mo <= divo1[(FMSB+FADD)*2-1:(FADD-2)*2-2];      // plain div

                        default:                mo <= divo1[(FMSB+FADD)*2-1:(FADD-2)*2-2];      // plain div

`else

`else

                        default:                mo <= divo1[(FMSB+6)*2+1:2];    // plain div

                        default:                mo <= divo1[(FMSB+6)*2+1:2];    // plain div

`endif

`endif

                        endcase

                        endcase

                        so              <= sa ^ sb;

                        so              <= sa ^ sb;

                        sign_exe        <= sa & sb;

                        sign_exe        <= sa & sb;

                        overflow        <= over;

                        overflow        <= over;

                        underflow       <= under;

                        underflow       <= under;

end

end

end

end

endmodule

endmodule

module fpDivnr(rst, clk, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);

module fpDivnr(rst, clk, clk4x, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);

parameter WID=32;

parameter WID=32;

localparam MSB = WID-1;

`include "fpSize.sv"

localparam EMSB = WID==128 ? 14 :

                  WID==96 ? 14 :

                  WID==80 ? 14 :

                  WID==64 ? 10 :

                                  WID==52 ? 10 :

                                  WID==48 ? 11 :

                                  WID==44 ? 10 :

                                  WID==42 ? 10 :

                                  WID==40 ?  9 :

                                  WID==32 ?  7 :

                                  WID==24 ?  6 : 4;

localparam FMSB = WID==128 ? 111 :

                  WID==96 ? 79 :

                  WID==80 ? 63 :

                  WID==64 ? 51 :

                                  WID==52 ? 39 :

                                  WID==48 ? 34 :

                                  WID==44 ? 31 :

                                  WID==42 ? 29 :

                                  WID==40 ? 28 :

                                  WID==32 ? 22 :

                                  WID==24 ? 15 : 9;

localparam FX = (FMSB+2)*2-1;   // the MSB of the expanded fraction

localparam EX = FX + 1 + EMSB + 1 + 1 - 1;

input rst;

input rst;

input clk;

input clk;

input clk4x;

input ce;

input ce;

input ld;

input ld;

input op;

input op;

input  [MSB:0] a, b;

input  [MSB:0] a, b;

output [MSB:0] o;

output [MSB:0] o;

input [2:0] rm;

input [2:0] rm;

output sign_exe;

output sign_exe;

output done;

output done;

output inf;

output inf;

output overflow;

output overflow;

output underflow;

output underflow;

wire [EX:0] o1;

wire [EX:0] o1;

wire sign_exe1, inf1, overflow1, underflow1;

wire sign_exe1, inf1, overflow1, underflow1;

wire [MSB+3:0] fpn0;

wire [MSB+3:0] fpn0;

wire done1;

wire done1;

fpDiv       #(WID) u1 (rst, clk, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);

fpDiv       #(WID) u1 (rst, clk, clk4x, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);

fpNormalize #(WID) u2(.clk(clk), .ce(ce), .under(underflow1), .i(o1), .o(fpn0) );

fpNormalize #(WID) u2(.clk(clk), .ce(ce), .under(underflow1), .i(o1), .o(fpn0) );

fpRoundReg  #(WID) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );

fpRoundReg  #(WID) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );

delay2      #(1)   u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));

delay2      #(1)   u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));

delay2      #(1)   u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));

delay2      #(1)   u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));

delay2      #(1)   u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));

delay2      #(1)   u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));

delay2      #(1)   u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));

delay2      #(1)   u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));

delay2            #(1)   u8(.clk(clk), .ce(ce), .i(done1), .o(done));

delay2            #(1)   u8(.clk(clk), .ce(ce), .i(done1), .o(done));

endmodule

endmodule

Browse

Tools

Subversion Repositories ft816float

[/] [ft816float/] [trunk/] [rtl/] [verilog/] [fpDiv.v] - Diff between revs 14 and 26