OpenCores

Rev 80	Rev 81
`timescale 1ns / 1ps	`timescale 1ns / 1ps
`// ============================================================================`	`// ============================================================================`
`// __`	`// __`
`// \\__/ o\ (C) 2006-2022 Robert Finch, Waterloo`	`// \\__/ o\ (C) 2006-2022 Robert Finch, Waterloo`
`// \ __ / All rights reserved.`	`// \ __ / All rights reserved.`
`// \/_// robfinch@finitron.ca`	`// \/_// robfinch@finitron.ca`
`// \|\|`	`// \|\|`
`//`	`//`
`// DFPDivide96.sv`	`// DFPDivide96.sv`
`// - decimal floating point divider`	`// - decimal floating point divider`
`// - parameterized width`	`// - parameterized width`
`//`	`//`
`//`	`//`
`// BSD 3-Clause License`	`// BSD 3-Clause License`
`// Redistribution and use in source and binary forms, with or without`	`// Redistribution and use in source and binary forms, with or without`
`// modification, are permitted provided that the following conditions are met:`	`// modification, are permitted provided that the following conditions are met:`
`//`	`//`
`// 1. Redistributions of source code must retain the above copyright notice, this`	`// 1. Redistributions of source code must retain the above copyright notice, this`
`// list of conditions and the following disclaimer.`	`// list of conditions and the following disclaimer.`
`//`	`//`
`// 2. Redistributions in binary form must reproduce the above copyright notice,`	`// 2. Redistributions in binary form must reproduce the above copyright notice,`
`// this list of conditions and the following disclaimer in the documentation`	`// this list of conditions and the following disclaimer in the documentation`
`// and/or other materials provided with the distribution.`	`// and/or other materials provided with the distribution.`
`//`	`//`
`// 3. Neither the name of the copyright holder nor the names of its`	`// 3. Neither the name of the copyright holder nor the names of its`
`// contributors may be used to endorse or promote products derived from`	`// contributors may be used to endorse or promote products derived from`
`// this software without specific prior written permission.`	`// this software without specific prior written permission.`
`//`	`//`
`// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"`	`// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"`
`// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE`	`// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE`
`// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE`	`// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE`
`// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE`	`// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE`
`// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL`	`// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL`
`// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR`	`// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR`
`// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER`	`// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER`
`// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,`	`// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,`
`// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE`	`// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE`
`// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.`	`// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.`
`//`	`//`
`// Floating Point Divider`	`// Floating Point Divider`
`//`	`//`
`//Properties:`	`//Properties:`
`//+-inf * +-inf = -+inf (this is handled by exOver)`	`//+-inf * +-inf = -+inf (this is handled by exOver)`
`//+-inf * 0 = QNaN`	`//+-inf * 0 = QNaN`
`//+-0 / +-0 = QNaN`	`//+-0 / +-0 = QNaN`
`// ============================================================================`	`// ============================================================================`

`import DFPPkg::*;`	`import DFPPkg::*;`

`define QINFDIV 4'd2	`define QINFDIV 4'd2
`define QZEROZERO 4'd3	`define QZEROZERO 4'd3

`module DFPDivide96(rst, clk, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);`	`module DFPDivide96(rst, clk, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);`
`parameter N=25;`	`parameter N=25;`
`// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.`	`// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.`
`input rst;`	`input rst;`
`input clk;`	`input clk;`
`input ce;`	`input ce;`
`input ld;`	`input ld;`
`input op;`	`input op;`
`input DFP96 a, b;`	`input DFP96 a, b;`
`output DFP96UD o;`	`output DFP96UD o;`
`output reg done;`	`output reg done;`
`output sign_exe;`	`output sign_exe;`
`output overflow;`	`output overflow;`
`output underflow;`	`output underflow;`

`// registered outputs`	`// registered outputs`
`reg sign_exe=0;`	`reg sign_exe=0;`
`reg inf=0;`	`reg inf=0;`
`reg overflow=0;`	`reg overflow=0;`
`reg underflow=0;`	`reg underflow=0;`

`reg so, sxo;`	`reg so, sxo;`
`reg [11:0] xo;`	`reg [11:0] xo;`
`reg [(N+1)42-1:0] mo;`	`reg [(N+1)42-1:0] mo;`

`DFP96U au, bu;`	`DFP96U au, bu;`
`DFPUnpack96 u01 (a, au);`	`DFPUnpack96 u01 (a, au);`
`DFPUnpack96 u02 (b, bu);`	`DFPUnpack96 u02 (b, bu);`

`// constants`	`// constants`
`wire [11:0] infXp = 12'hBFF; // infinite / NaN - all ones`	`wire [11:0] infXp = 12'hBFF; // infinite / NaN - all ones`
`wire [11:0] bias = 12'h5FF;`	`wire [11:0] bias = 12'h5FF;`
`// The following is the value for an exponent of zero, with the offset`	`// The following is the value for an exponent of zero, with the offset`
`// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.`	`// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.`
`// The following is a template for a quiet nan. (MSB=1)`	`// The following is a template for a quiet nan. (MSB=1)`
`wire [N4-1:0] qNaN = {4'h1,{(N-1)4{1'b0}}};`	`wire [N4-1:0] qNaN = {4'h1,{(N-1)4{1'b0}}};`

`// variables`	`// variables`
`wire [(N+2)42-1:0] divo;`	`wire [(N+2)42-1:0] divo;`

`// Operands`	`// Operands`
`reg sa, sb; // sign bit`	`reg sa, sb; // sign bit`
`reg [N*4-1:0] siga, sigb;`	`reg [N*4-1:0] siga, sigb;`
`reg az, bz;`	`reg az, bz;`
`reg aInf, bInf;`	`reg aInf, bInf;`
`reg aNan,bNan;`	`reg aNan,bNan;`
`wire done1;`	`wire done1;`
`wire signed [7:0] lzcnt;`	`wire signed [7:0] lzcnt;`

`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// Clock #1`	`// Clock #1`
`// - decode the input operands`	`// - decode the input operands`
`// - derive basic information`	`// - derive basic information`
`// - calculate fraction`	`// - calculate fraction`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`reg ld1;`	`reg ld1;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) sa <= au.sign;`	`if (ce) sa <= au.sign;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) sb <= bu.sign;`	`if (ce) sb <= bu.sign;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) siga <= au.sig;`	`if (ce) siga <= au.sig;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) sigb <= bu.sig;`	`if (ce) sigb <= bu.sig;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) az <= au.exp==12'd0 && au.sig==100'd0;`	`if (ce) az <= au.exp==12'd0 && au.sig==100'd0;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) bz <= bu.exp==12'd0 && bu.sig==100'd0;`	`if (ce) bz <= bu.exp==12'd0 && bu.sig==100'd0;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) aInf <= au.infinity;`	`if (ce) aInf <= au.infinity;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) bInf <= bu.infinity;`	`if (ce) bInf <= bu.infinity;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) aNan <= au.nan;`	`if (ce) aNan <= au.nan;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) bNan <= bu.nan;`	`if (ce) bNan <= bu.nan;`
`ft_delay #(.WID(1), .DEP(1)) udly1 (.clk(clk), .ce(ce), .i(ld), .o(ld1));`	`ft_delay #(.WID(1), .DEP(1)) udly1 (.clk(clk), .ce(ce), .i(ld), .o(ld1));`

`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// Clock #2 to N`	`// Clock #2 to N`
`// - calculate fraction`	`// - calculate fraction`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`wire done3a,done3;`	`wire done3a,done3;`
`// Perform divide`	`// Perform divide`
`dfdiv2 #(N+2) u2 (.clk(clk), .ld(ld1), .a({siga,8'b0}), .b({sigb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));`	`dfdiv2 #(N+2) u2 (.clk(clk), .ld(ld1), .a({siga,8'b0}), .b({sigb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));`
`//wire [7:0] lzcnt_bin = lzcnt[3:0] + (lzcnt[7:4] * 10);`	`//wire [7:0] lzcnt_bin = lzcnt[3:0] + (lzcnt[7:4] * 10);`
`wire [(N+2)42-1:0] divo1 = divo[(N+2)42-1:0] << ({lzcnt-1,2'b0});//WAS FPWID=128?+44`	`wire [(N+2)42-1:0] divo1 = divo[(N+2)42-1:0] << ({lzcnt-1,2'b0});//WAS FPWID=128?+44`
`ft_delay #(.WID(1), .DEP(3)) u3 (.clk(clk), .ce(ce), .i(done1), .o(done3a));`	`ft_delay #(.WID(1), .DEP(3)) u3 (.clk(clk), .ce(ce), .i(done1), .o(done3a));`
`assign done3 = done1&done3a;`	`assign done3 = done1&done3a;`

`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// Clock #N+1`	`// Clock #N+1`
`// - calculate exponent`	`// - calculate exponent`
`// - calculate fraction`	`// - calculate fraction`
`// - determine when a NaN is output`	`// - determine when a NaN is output`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// Compute the exponent.`	`// Compute the exponent.`
`// - correct the exponent for denormalized operands`	`// - correct the exponent for denormalized operands`
`// - adjust the difference by the bias (add 127)`	`// - adjust the difference by the bias (add 127)`
`// - also factor in the different decimal position for division`	`// - also factor in the different decimal position for division`
`reg [13:0] ex1; // sum of exponents`	`reg [13:0] ex1; // sum of exponents`
`reg qNaNOut;`	`reg qNaNOut;`

`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) ex1 <= au.exp - bu.exp + bias - (({lzcnt,2'b00} > N+2) ? lzcnt-(N+2) : 0);`	`if (ce) ex1 <= au.exp - bu.exp + bias - (({lzcnt,2'b00} > N+2) ? lzcnt-(N+2) : 0);`

`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) qNaNOut <= (az&bz)\|(aInf&bInf);`	`if (ce) qNaNOut <= (az&bz)\|(aInf&bInf);`

`wire over = 1'b0;`	`wire over = 1'b0;`
`wire under = &ex1[13:12];`	`wire under = &ex1[13:12];`
`reg [3:0] st;`	`reg [3:0] st;`

`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`// Clock #N+3`	`// Clock #N+3`
`// -----------------------------------------------------------`	`// -----------------------------------------------------------`
`always_ff @(posedge clk)`	`always_ff @(posedge clk)`
`// Simulation likes to see these values reset to zero on reset. Otherwise the`	`// Simulation likes to see these values reset to zero on reset. Otherwise the`
`// values propagate in sim as X's.`	`// values propagate in sim as X's.`
`if (rst) begin`	`if (rst) begin`
`xo <= 1'd0;`	`xo <= 1'd0;`
`mo <= 1'd0;`	`mo <= 1'd0;`
`so <= 1'd0;`	`so <= 1'd0;`
`sign_exe <= 1'd0;`	`sign_exe <= 1'd0;`
`overflow <= 1'd0;`	`overflow <= 1'd0;`
`underflow <= 1'd0;`	`underflow <= 1'd0;`
`done <= 1'b1;`	`done <= 1'b1;`
`end`	`end`
`else if (ce) begin`	`else if (ce) begin`
`done <= 1'b0;`	`done <= 1'b0;`
`if (done3&done1) begin`	`if (done3&done1) begin`
`done <= 1'b1;`	`done <= 1'b1;`

`casez({qNaNOut\|aNan\|bNan,bInf,bz,over,under})`	`casez({qNaNOut\|aNan\|bNan,bInf,bz,over,under})`
`5'b1????: xo <= infXp; // NaN exponent value`	`5'b1????: xo <= infXp; // NaN exponent value`
`5'b01???: xo <= 1'd0; // divide by inf`	`5'b01???: xo <= 1'd0; // divide by inf`
`5'b001??: xo <= infXp; // divide by zero`	`5'b001??: xo <= infXp; // divide by zero`
`5'b0001?: xo <= infXp; // overflow`	`5'b0001?: xo <= infXp; // overflow`
`5'b00001: xo <= 1'd0; // underflow`	`5'b00001: xo <= 1'd0; // underflow`
`default: xo <= ex1; // normal or underflow: passthru neg. exp. for normalization`	`default: xo <= ex1; // normal or underflow: passthru neg. exp. for normalization`
`endcase`	`endcase`

`casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})`	`casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})`
`8'b1???????: begin mo <= {4'h1,au[N4-1:0],{(N+1)4-1{1'b0}}}; st[3] <= 1'b1; end`	`8'b1???????: begin mo <= {4'h1,au[N4-1:0],{(N+1)4-1{1'b0}}}; st[3] <= 1'b1; end`
`8'b01??????: begin mo <= {4'h1,bu[N4-1:0],{(N+1)4-1{1'b0}}}; st[3] <= 1'b1; end`	`8'b01??????: begin mo <= {4'h1,bu[N4-1:0],{(N+1)4-1{1'b0}}}; st[3] <= 1'b1; end`
`8'b001?????: begin mo <= {4'h1,qNaN[N4-1:0]\|{aInf,1'b0}\|{az,bz},{(N+1)4-1{1'b0}}}; st[3] <= 1'b1; end`	`8'b001?????: begin mo <= {4'h1,qNaN[N4-1:0]\|{aInf,1'b0}\|{az,bz},{(N+1)4-1{1'b0}}}; st[3] <= 1'b1; end`
`8'b0001????: begin mo <= {(N+1)42-1{1'd0}}; st[3] <= 1'b0; end // div by inf`	`8'b0001????: begin mo <= {(N+1)42-1{1'd0}}; st[3] <= 1'b0; end // div by inf`
`8'b00001???: begin mo <= {(N+1)42-1{1'd0}}; st[3] <= 1'b0; end // div by zero`	`8'b00001???: begin mo <= {(N+1)42-1{1'd0}}; st[3] <= 1'b0; end // div by zero`
`8'b000001??: begin mo <= {(N+1)42-1{1'd0}}; st[3] <= 1'b0; end // Inf exponent`	`8'b000001??: begin mo <= {(N+1)42-1{1'd0}}; st[3] <= 1'b0; end // Inf exponent`
8'b0000001?: begin mo <= {4'h1,qNaN\|`QINFDIV,{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end // infinity / infinity	8'b0000001?: begin mo <= {4'h1,qNaN\|`QINFDIV,{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end // infinity / infinity
8'b00000001: begin mo <= {4'h1,qNaN\|`QZEROZERO,{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end // zero / zero	8'b00000001: begin mo <= {4'h1,qNaN\|`QZEROZERO,{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end // zero / zero
`default: begin mo <= divo1[(N+2)42-1:8]; st[3] <= 1'b0; end // plain div`	`default: begin mo <= divo1[(N+2)42-1:8]; st[3] <= 1'b0; end // plain div`
`endcase`	`endcase`

`sign_exe <= sa & sb;`	`sign_exe <= sa & sb;`
`overflow <= over;`	`overflow <= over;`
`underflow <= under;`	`underflow <= under;`

`o.nan <= aNan\|bNan\|qNaNOut;`	`o.nan <= aNan\|bNan\|qNaNOut;`
`o.snan <= aNan\|bNan\|qNaNOut;`	`o.snan <= aNan\|bNan\|qNaNOut;`
`o.qnan <= 1'b0;`	`o.qnan <= 1'b0;`
`o.infinity <= over\|aInf;`	`o.infinity <= over\|aInf;`
`o.sign <= sa ^ sb;`	`o.sign <= sa ^ sb;`
`o.exp <= xo;`	`o.exp <= xo;`
`o.sig <= mo;`	`o.sig <= mo;`
`end`	`end`
`end`	`end`

`endmodule`	`endmodule`

`module DFPDivide96nr(rst, clk, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);`	`module DFPDivide96nr(rst, clk, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);`
`parameter N=25;`	`parameter N=25;`
`input rst;`	`input rst;`
`input clk;`	`input clk;`
`input ce;`	`input ce;`
`input ld;`	`input ld;`
`input op;`	`input op;`
`input DFP96 a, b;`	`input DFP96 a, b;`
`output DFP96 o;`	`output DFP96 o;`
`input [2:0] rm;`	`input [2:0] rm;`
`output sign_exe;`	`output sign_exe;`
`output done;`	`output done;`
`output inf;`	`output inf;`
`output overflow;`	`output overflow;`
`output underflow;`	`output underflow;`

`DFP96UD o1;`	`DFP96UD o1;`
`wire sign_exe1, inf1, overflow1, underflow1;`	`wire sign_exe1, inf1, overflow1, underflow1;`
`DFP96UN fpn0;`	`DFP96UN fpn0;`
`wire done1, done1a;`	`wire done1, done1a;`

`DFPDivide96 #(.N(N)) u1 (rst, clk, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);`	`DFPDivide96 #(.N(N)) u1 (rst, clk, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);`
`DFPNormalize96 #(.N(N)) u2(.clk(clk), .ce(ce), .under_i(underflow1), .i(o1), .o(fpn0) );`	`DFPNormalize96 #(.N(N)) u2(.clk(clk), .ce(ce), .under_i(underflow1), .i(o1), .o(fpn0) );`
`DFPRound96 #(.N(N)) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );`	`DFPRound96 #(.N(N)) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );`
`delay2 #(1) u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));`	`delay2 #(1) u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));`
`delay2 #(1) u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));`	`delay2 #(1) u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));`
`delay2 #(1) u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));`	`delay2 #(1) u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));`
`delay2 #(1) u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));`	`delay2 #(1) u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));`
`ft_delay #(.WID(1),.DEP(11)) u8(.clk(clk), .ce(ce), .i(done1), .o(done1a));`	`ft_delay #(.WID(1),.DEP(14)) u8(.clk(clk), .ce(ce), .i(done1), .o(done1a));`
`assign done = done1&done1a;`	`assign done = done1&done1a;`

`endmodule`	`endmodule`

`timescale 1ns / 1ps

`timescale 1ns / 1ps

// ============================================================================

// ============================================================================

//        __

//        __

//   \\__/ o\    (C) 2006-2022  Robert Finch, Waterloo

//   \\__/ o\    (C) 2006-2022  Robert Finch, Waterloo

//    \  __ /    All rights reserved.

//    \  __ /    All rights reserved.

//     \/_//     robfinch@finitron.ca

//     \/_//     robfinch@finitron.ca

//       ||

//       ||

//

//

//      DFPDivide96.sv

//      DFPDivide96.sv

//    - decimal floating point divider

//    - decimal floating point divider

//    - parameterized width

//    - parameterized width

//

//

//

//

// BSD 3-Clause License

// BSD 3-Clause License

// Redistribution and use in source and binary forms, with or without

// Redistribution and use in source and binary forms, with or without

// modification, are permitted provided that the following conditions are met:

// modification, are permitted provided that the following conditions are met:

//

//

// 1. Redistributions of source code must retain the above copyright notice, this

// 1. Redistributions of source code must retain the above copyright notice, this

//    list of conditions and the following disclaimer.

//    list of conditions and the following disclaimer.

//

//

// 2. Redistributions in binary form must reproduce the above copyright notice,

// 2. Redistributions in binary form must reproduce the above copyright notice,

//    this list of conditions and the following disclaimer in the documentation

//    this list of conditions and the following disclaimer in the documentation

//    and/or other materials provided with the distribution.

//    and/or other materials provided with the distribution.

//

//

// 3. Neither the name of the copyright holder nor the names of its

// 3. Neither the name of the copyright holder nor the names of its

//    contributors may be used to endorse or promote products derived from

//    contributors may be used to endorse or promote products derived from

//    this software without specific prior written permission.

//    this software without specific prior written permission.

//

//

// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE

// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE

// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL

// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL

// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR

// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR

// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER

// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,

// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,

// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

//

//

//      Floating Point Divider

//      Floating Point Divider

//

//

//Properties:

//Properties:

//+-inf * +-inf = -+inf    (this is handled by exOver)

//+-inf * +-inf = -+inf    (this is handled by exOver)

//+-inf * 0     = QNaN

//+-inf * 0     = QNaN

//+-0 / +-0      = QNaN

//+-0 / +-0      = QNaN

// ============================================================================

// ============================================================================

import DFPPkg::*;

import DFPPkg::*;

`define QINFDIV         4'd2

`define QINFDIV         4'd2

`define QZEROZERO       4'd3

`define QZEROZERO       4'd3

module DFPDivide96(rst, clk, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);

module DFPDivide96(rst, clk, ce, ld, op, a, b, o, done, sign_exe, overflow, underflow);

parameter N=25;

parameter N=25;

// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.

// FADD is a constant that makes the divider width a multiple of four and includes eight extra bits.

input rst;

input rst;

input clk;

input clk;

input ce;

input ce;

input ld;

input ld;

input op;

input op;

input  DFP96 a, b;

input  DFP96 a, b;

output DFP96UD o;

output DFP96UD o;

output reg done;

output reg done;

output sign_exe;

output sign_exe;

output overflow;

output overflow;

output underflow;

output underflow;

// registered outputs

// registered outputs

reg sign_exe=0;

reg sign_exe=0;

reg inf=0;

reg inf=0;

reg     overflow=0;

reg     overflow=0;

reg     underflow=0;

reg     underflow=0;

reg so, sxo;

reg so, sxo;

reg [11:0] xo;

reg [11:0] xo;

reg [(N+1)*4*2-1:0] mo;

reg [(N+1)*4*2-1:0] mo;

DFP96U au, bu;

DFP96U au, bu;

DFPUnpack96 u01 (a, au);

DFPUnpack96 u01 (a, au);

DFPUnpack96 u02 (b, bu);

DFPUnpack96 u02 (b, bu);

// constants

// constants

wire [11:0] infXp = 12'hBFF;    // infinite / NaN - all ones

wire [11:0] infXp = 12'hBFF;    // infinite / NaN - all ones

wire [11:0] bias = 12'h5FF;

wire [11:0] bias = 12'h5FF;

// The following is the value for an exponent of zero, with the offset

// The following is the value for an exponent of zero, with the offset

// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.

// eg. 8'h7f for eight bit exponent, 11'h7ff for eleven bit exponent, etc.

// The following is a template for a quiet nan. (MSB=1)

// The following is a template for a quiet nan. (MSB=1)

wire [N*4-1:0] qNaN  = {4'h1,{(N-1)*4{1'b0}}};

wire [N*4-1:0] qNaN  = {4'h1,{(N-1)*4{1'b0}}};

// variables

// variables

wire [(N+2)*4*2-1:0] divo;

wire [(N+2)*4*2-1:0] divo;

// Operands

// Operands

reg sa, sb;                     // sign bit

reg sa, sb;                     // sign bit

reg [N*4-1:0] siga, sigb;

reg [N*4-1:0] siga, sigb;

reg az, bz;

reg az, bz;

reg aInf, bInf;

reg aInf, bInf;

reg aNan,bNan;

reg aNan,bNan;

wire done1;

wire done1;

wire signed [7:0] lzcnt;

wire signed [7:0] lzcnt;

// -----------------------------------------------------------

// -----------------------------------------------------------

// Clock #1

// Clock #1

// - decode the input operands

// - decode the input operands

// - derive basic information

// - derive basic information

// - calculate fraction

// - calculate fraction

// -----------------------------------------------------------

// -----------------------------------------------------------

reg ld1;

reg ld1;

always @(posedge clk)

always @(posedge clk)

        if (ce) sa <= au.sign;

        if (ce) sa <= au.sign;

always @(posedge clk)

always @(posedge clk)

        if (ce) sb <= bu.sign;

        if (ce) sb <= bu.sign;

always @(posedge clk)

always @(posedge clk)

        if (ce) siga <= au.sig;

        if (ce) siga <= au.sig;

always @(posedge clk)

always @(posedge clk)

        if (ce) sigb <= bu.sig;

        if (ce) sigb <= bu.sig;

always @(posedge clk)

always @(posedge clk)

        if (ce) az <= au.exp==12'd0 && au.sig==100'd0;

        if (ce) az <= au.exp==12'd0 && au.sig==100'd0;

always @(posedge clk)

always @(posedge clk)

        if (ce) bz <= bu.exp==12'd0 && bu.sig==100'd0;

        if (ce) bz <= bu.exp==12'd0 && bu.sig==100'd0;

always @(posedge clk)

always @(posedge clk)

        if (ce) aInf <= au.infinity;

        if (ce) aInf <= au.infinity;

always @(posedge clk)

always @(posedge clk)

        if (ce) bInf <= bu.infinity;

        if (ce) bInf <= bu.infinity;

always @(posedge clk)

always @(posedge clk)

        if (ce) aNan <= au.nan;

        if (ce) aNan <= au.nan;

always @(posedge clk)

always @(posedge clk)

        if (ce) bNan <= bu.nan;

        if (ce) bNan <= bu.nan;

ft_delay #(.WID(1), .DEP(1)) udly1 (.clk(clk), .ce(ce), .i(ld), .o(ld1));

ft_delay #(.WID(1), .DEP(1)) udly1 (.clk(clk), .ce(ce), .i(ld), .o(ld1));

// -----------------------------------------------------------

// -----------------------------------------------------------

// Clock #2 to N

// Clock #2 to N

// - calculate fraction

// - calculate fraction

// -----------------------------------------------------------

// -----------------------------------------------------------

wire done3a,done3;

wire done3a,done3;

// Perform divide

// Perform divide

dfdiv2 #(N+2) u2 (.clk(clk), .ld(ld1), .a({siga,8'b0}), .b({sigb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));

dfdiv2 #(N+2) u2 (.clk(clk), .ld(ld1), .a({siga,8'b0}), .b({sigb,8'b0}), .q(divo), .r(), .done(done1), .lzcnt(lzcnt));

//wire [7:0] lzcnt_bin = lzcnt[3:0] + (lzcnt[7:4] * 10);

//wire [7:0] lzcnt_bin = lzcnt[3:0] + (lzcnt[7:4] * 10);

wire [(N+2)*4*2-1:0] divo1 = divo[(N+2)*4*2-1:0] << ({lzcnt-1,2'b0});//WAS FPWID=128?+44

wire [(N+2)*4*2-1:0] divo1 = divo[(N+2)*4*2-1:0] << ({lzcnt-1,2'b0});//WAS FPWID=128?+44

ft_delay #(.WID(1), .DEP(3)) u3 (.clk(clk), .ce(ce), .i(done1), .o(done3a));

ft_delay #(.WID(1), .DEP(3)) u3 (.clk(clk), .ce(ce), .i(done1), .o(done3a));

assign done3 = done1&done3a;

assign done3 = done1&done3a;

// -----------------------------------------------------------

// -----------------------------------------------------------

// Clock #N+1

// Clock #N+1

// - calculate exponent

// - calculate exponent

// - calculate fraction

// - calculate fraction

// - determine when a NaN is output

// - determine when a NaN is output

// -----------------------------------------------------------

// -----------------------------------------------------------

// Compute the exponent.

// Compute the exponent.

// - correct the exponent for denormalized operands

// - correct the exponent for denormalized operands

// - adjust the difference by the bias (add 127)

// - adjust the difference by the bias (add 127)

// - also factor in the different decimal position for division

// - also factor in the different decimal position for division

reg [13:0] ex1; // sum of exponents

reg [13:0] ex1; // sum of exponents

reg qNaNOut;

reg qNaNOut;

always @(posedge clk)

always @(posedge clk)

  if (ce) ex1 <= au.exp - bu.exp + bias - (({lzcnt,2'b00} > N+2) ? lzcnt-(N+2) : 0);

  if (ce) ex1 <= au.exp - bu.exp + bias - (({lzcnt,2'b00} > N+2) ? lzcnt-(N+2) : 0);

always @(posedge clk)

always @(posedge clk)

  if (ce) qNaNOut <= (az&bz)|(aInf&bInf);

  if (ce) qNaNOut <= (az&bz)|(aInf&bInf);

wire over = 1'b0;

wire over = 1'b0;

wire under = &ex1[13:12];

wire under = &ex1[13:12];

reg [3:0] st;

reg [3:0] st;

// -----------------------------------------------------------

// -----------------------------------------------------------

// Clock #N+3

// Clock #N+3

// -----------------------------------------------------------

// -----------------------------------------------------------

always_ff @(posedge clk)

always_ff @(posedge clk)

// Simulation likes to see these values reset to zero on reset. Otherwise the

// Simulation likes to see these values reset to zero on reset. Otherwise the

// values propagate in sim as X's.

// values propagate in sim as X's.

if (rst) begin

if (rst) begin

        xo <= 1'd0;

        xo <= 1'd0;

        mo <= 1'd0;

        mo <= 1'd0;

        so <= 1'd0;

        so <= 1'd0;

        sign_exe <= 1'd0;

        sign_exe <= 1'd0;

        overflow <= 1'd0;

        overflow <= 1'd0;

        underflow <= 1'd0;

        underflow <= 1'd0;

        done <= 1'b1;

        done <= 1'b1;

end

end

else if (ce) begin

else if (ce) begin

  done <= 1'b0;

  done <= 1'b0;

        if (done3&done1) begin

        if (done3&done1) begin

          done <= 1'b1;

          done <= 1'b1;

                casez({qNaNOut|aNan|bNan,bInf,bz,over,under})

                casez({qNaNOut|aNan|bNan,bInf,bz,over,under})

                5'b1????:               xo <= infXp;    // NaN exponent value

                5'b1????:               xo <= infXp;    // NaN exponent value

                5'b01???:               xo <= 1'd0;             // divide by inf

                5'b01???:               xo <= 1'd0;             // divide by inf

                5'b001??:               xo <= infXp;    // divide by zero

                5'b001??:               xo <= infXp;    // divide by zero

                5'b0001?:               xo <= infXp;    // overflow

                5'b0001?:               xo <= infXp;    // overflow

                5'b00001:               xo <= 1'd0;             // underflow

                5'b00001:               xo <= 1'd0;             // underflow

                default:                xo <= ex1;      // normal or underflow: passthru neg. exp. for normalization

                default:                xo <= ex1;      // normal or underflow: passthru neg. exp. for normalization

                endcase

                endcase

                casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})

                casez({aNan,bNan,qNaNOut,bInf,bz,over,aInf&bInf,az&bz})

                8'b1???????:  begin mo <= {4'h1,au[N*4-1:0],{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end

                8'b1???????:  begin mo <= {4'h1,au[N*4-1:0],{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end

                8'b01??????:  begin mo <= {4'h1,bu[N*4-1:0],{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end

                8'b01??????:  begin mo <= {4'h1,bu[N*4-1:0],{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end

                8'b001?????:    begin mo <= {4'h1,qNaN[N*4-1:0]|{aInf,1'b0}|{az,bz},{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end

                8'b001?????:    begin mo <= {4'h1,qNaN[N*4-1:0]|{aInf,1'b0}|{az,bz},{(N+1)*4-1{1'b0}}}; st[3] <= 1'b1; end

                8'b0001????:    begin mo <= {(N+1)*4*2-1{1'd0}};        st[3] <= 1'b0; end      // div by inf

                8'b0001????:    begin mo <= {(N+1)*4*2-1{1'd0}};        st[3] <= 1'b0; end      // div by inf

                8'b00001???:    begin mo <= {(N+1)*4*2-1{1'd0}};        st[3] <= 1'b0; end      // div by zero

                8'b00001???:    begin mo <= {(N+1)*4*2-1{1'd0}};        st[3] <= 1'b0; end      // div by zero

                8'b000001??:    begin mo <= {(N+1)*4*2-1{1'd0}};        st[3] <= 1'b0; end      // Inf exponent

                8'b000001??:    begin mo <= {(N+1)*4*2-1{1'd0}};        st[3] <= 1'b0; end      // Inf exponent

                8'b0000001?:    begin mo <= {4'h1,qNaN|`QINFDIV,{(N+1)*4-1{1'b0}}};     st[3] <= 1'b1; end      // infinity / infinity

                8'b0000001?:    begin mo <= {4'h1,qNaN|`QINFDIV,{(N+1)*4-1{1'b0}}};     st[3] <= 1'b1; end      // infinity / infinity

                8'b00000001:    begin mo <= {4'h1,qNaN|`QZEROZERO,{(N+1)*4-1{1'b0}}};   st[3] <= 1'b1; end      // zero / zero

                8'b00000001:    begin mo <= {4'h1,qNaN|`QZEROZERO,{(N+1)*4-1{1'b0}}};   st[3] <= 1'b1; end      // zero / zero

                default:                begin mo <= divo1[(N+2)*4*2-1:8];       st[3] <= 1'b0; end      // plain div

                default:                begin mo <= divo1[(N+2)*4*2-1:8];       st[3] <= 1'b0; end      // plain div

                endcase

                endcase

                sign_exe        <= sa & sb;

                sign_exe        <= sa & sb;

                overflow        <= over;

                overflow        <= over;

                underflow       <= under;

                underflow       <= under;

                o.nan <= aNan|bNan|qNaNOut;

                o.nan <= aNan|bNan|qNaNOut;

                o.snan <= aNan|bNan|qNaNOut;

                o.snan <= aNan|bNan|qNaNOut;

                o.qnan <= 1'b0;

                o.qnan <= 1'b0;

                o.infinity <= over|aInf;

                o.infinity <= over|aInf;

                o.sign <= sa ^ sb;

                o.sign <= sa ^ sb;

                o.exp <= xo;

                o.exp <= xo;

                o.sig <= mo;

                o.sig <= mo;

end

end

end

end

endmodule

endmodule

module DFPDivide96nr(rst, clk, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);

module DFPDivide96nr(rst, clk, ce, ld, op, a, b, o, rm, done, sign_exe, inf, overflow, underflow);

parameter N=25;

parameter N=25;

input rst;

input rst;

input clk;

input clk;

input ce;

input ce;

input ld;

input ld;

input op;

input op;

input  DFP96 a, b;

input  DFP96 a, b;

output DFP96 o;

output DFP96 o;

input [2:0] rm;

input [2:0] rm;

output sign_exe;

output sign_exe;

output done;

output done;

output inf;

output inf;

output overflow;

output overflow;

output underflow;

output underflow;

DFP96UD o1;

DFP96UD o1;

wire sign_exe1, inf1, overflow1, underflow1;

wire sign_exe1, inf1, overflow1, underflow1;

DFP96UN fpn0;

DFP96UN fpn0;

wire done1, done1a;

wire done1, done1a;

DFPDivide96    #(.N(N)) u1 (rst, clk, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);

DFPDivide96    #(.N(N)) u1 (rst, clk, ce, ld, op, a, b, o1, done1, sign_exe1, overflow1, underflow1);

DFPNormalize96 #(.N(N)) u2(.clk(clk), .ce(ce), .under_i(underflow1), .i(o1), .o(fpn0) );

DFPNormalize96 #(.N(N)) u2(.clk(clk), .ce(ce), .under_i(underflow1), .i(o1), .o(fpn0) );

DFPRound96     #(.N(N)) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );

DFPRound96     #(.N(N)) u3(.clk(clk), .ce(ce), .rm(rm), .i(fpn0), .o(o) );

delay2      #(1)   u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));

delay2      #(1)   u4(.clk(clk), .ce(ce), .i(sign_exe1), .o(sign_exe));

delay2      #(1)   u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));

delay2      #(1)   u5(.clk(clk), .ce(ce), .i(inf1), .o(inf));

delay2      #(1)   u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));

delay2      #(1)   u6(.clk(clk), .ce(ce), .i(overflow1), .o(overflow));

delay2      #(1)   u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));

delay2      #(1)   u7(.clk(clk), .ce(ce), .i(underflow1), .o(underflow));

ft_delay        #(.WID(1),.DEP(11))   u8(.clk(clk), .ce(ce), .i(done1), .o(done1a));

ft_delay        #(.WID(1),.DEP(14))   u8(.clk(clk), .ce(ce), .i(done1), .o(done1a));

assign done = done1&done1a;

assign done = done1&done1a;

endmodule

endmodule

Browse

Tools

Subversion Repositories ft816float

[/] [ft816float/] [trunk/] [rtl/] [verilog2/] [DFPDivide96.sv] - Diff between revs 80 and 81