OpenCores

Rev 18	Rev 26
`// ============================================================================`	`// ============================================================================`
`// __`	`// __`
`// \\__/ o\ (C) 2017-2019 Robert Finch, Waterloo`	`// \\__/ o\ (C) 2017-2019 Robert Finch, Waterloo`
`// \ __ / All rights reserved.`	`// \ __ / All rights reserved.`
`// \/_// robfinch<remove>@finitron.ca`	`// \/_// robfinch<remove>@finitron.ca`
`// \|\|`	`// \|\|`
`//`	`//`
`// sigmoid.v`	`// sigmoid.v`
`// - perform sigmoid function`	`// - perform sigmoid function`
`//`	`//`
`//`	`//`
`// This source file is free software: you can redistribute it and/or modify`	`// This source file is free software: you can redistribute it and/or modify`
`// it under the terms of the GNU Lesser General Public License as published`	`// it under the terms of the GNU Lesser General Public License as published`
`// by the Free Software Foundation, either version 3 of the License, or`	`// by the Free Software Foundation, either version 3 of the License, or`
`// (at your option) any later version.`	`// (at your option) any later version.`
`//`	`//`
`// This source file is distributed in the hope that it will be useful,`	`// This source file is distributed in the hope that it will be useful,`
`// but WITHOUT ANY WARRANTY; without even the implied warranty of`	`// but WITHOUT ANY WARRANTY; without even the implied warranty of`
`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`	`// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
`// GNU General Public License for more details.`	`// GNU General Public License for more details.`
`//`	`//`
`// You should have received a copy of the GNU General Public License`	`// You should have received a copy of the GNU General Public License`
`// along with this program. If not, see <http://www.gnu.org/licenses/>.`	`// along with this program. If not, see <http://www.gnu.org/licenses/>.`
`//`	`//`
`//`	`//`
`// This module returns the sigmoid of a number using a lookup table.`	`// This module returns the sigmoid of a number using a lookup table.`
`// 0.0 or +1.0 is returned for entries outside of the range -8.0 to +8.0`	`// 0.0 or +1.0 is returned for entries outside of the range -8.0 to +8.0`
`//`	`//`
`// ToDo: check pipelining of values`	`// ToDo: check pipelining of values`
`// ============================================================================`	`// ============================================================================`

`define ONE80 80'h3FFF0000000000000000	`define ONE80 80'h3FFF0000000000000000
`define EIGHT80 80'h40020000000000000000	`define EIGHT80 80'h40020000000000000000
`define FIVETWELVE80 80'h40080000000000000000	`define FIVETWELVE80 80'h40080000000000000000
`define ONE64 64'h3FF0000000000000	`define ONE64 64'h3FF0000000000000
`define EIGHT64 64'h4020000000000000	`define EIGHT64 64'h4020000000000000
`define FIVETWELVE64 64'h4080000000000000	`define FIVETWELVE64 64'h4080000000000000
`define ONE40 40'h3FE0000000	`define ONE40 40'h3FE0000000
`define EIGHT40 40'h4040000000	`define EIGHT40 40'h4040000000
`define ONE32 32'h7F000000	`define ONE32 32'h7F000000
`define EIGHT32 32'h42000000	`define EIGHT32 32'h42000000
`define FIVETWELVE32 32'h48000000	`define FIVETWELVE32 32'h48000000

`module fpSigmoid(clk, ce, a, o);`	`module fpSigmoid(clk, ce, a, o);`
`parameter WID = 128;`	`parameter WID = 128;`
`localparam MSB = WID-1;`	`include "fpSize.sv"
`localparam EMSB = WID==128 ? 14 :`
`WID==96 ? 14 :`
`WID==80 ? 14 :`
`WID==64 ? 10 :`
`WID==52 ? 10 :`
`WID==48 ? 11 :`
`WID==44 ? 10 :`
`WID==42 ? 10 :`
`WID==40 ? 9 :`
`WID==32 ? 7 :`
`WID==24 ? 6 : 4;`
`localparam FMSB = WID==128 ? 111 :`
`WID==96 ? 79 :`
`WID==80 ? 63 :`
`WID==64 ? 51 :`
`WID==52 ? 39 :`
`WID==48 ? 34 :`
`WID==44 ? 31 :`
`WID==42 ? 29 :`
`WID==40 ? 28 :`
`WID==32 ? 22 :`
`WID==24 ? 15 : 9;`
`input clk;`	`input clk;`
`input ce;`	`input ce;`
`input [WID-1:0] a;`	`input [WID-1:0] a;`
`output reg [WID-1:0] o;`	`output reg [WID-1:0] o;`

`wire [4:0] cmp1_o;`	`wire [4:0] cmp1_o;`
`reg [4:0] cmp2_o;`	`reg [4:0] cmp2_o;`

`// Just the mantissa is stored in the table to economize on the storage.`	`// Just the mantissa is stored in the table to economize on the storage.`
`// The exponent is always the same value (0x3ff). Only the top 32 bits of`	`// The exponent is always the same value (0x3ff). Only the top 32 bits of`
`// the mantissa are stored.`	`// the mantissa are stored.`
`(* ram_style="block" *)`	`(* ram_style="block" *)`
`reg [31:0] SigmoidLUT [0:1023];`	`reg [31:0] SigmoidLUT [0:1023];`

`// Check if the input is in the range (-8 to +8)`	`// Check if the input is in the range (-8 to +8)`
`// We take the absolute value by trimming off the sign bit.`	`// We take the absolute value by trimming off the sign bit.`
`generate begin : ext`	`generate begin : ext`
`if (WID==80)`	`if (WID==80)`
fp_cmp_unit #(WID) u1 (.a(a & 80'h7FFFFFFFFFFFFFFFFFFF), .b(`EIGHT80), .o(cmp1_o), .nanx() );	fp_cmp_unit #(WID) u1 (.a(a & 80'h7FFFFFFFFFFFFFFFFFFF), .b(`EIGHT80), .o(cmp1_o), .nanx() );
`else if (WID==64)`	`else if (WID==64)`
fp_cmp_unit #(WID) u1 (.a(a & 64'h7FFFFFFFFFFFFFFF), .b(`EIGHT64), .o(cmp1_o), .nanx() );	fp_cmp_unit #(WID) u1 (.a(a & 64'h7FFFFFFFFFFFFFFF), .b(`EIGHT64), .o(cmp1_o), .nanx() );
`else if (WID==40)`	`else if (WID==40)`
fp_cmp_unit #(WID) u1 (.a(a & 40'h7FFFFFFFFF), .b(`EIGHT40), .o(cmp1_o), .nanx() );	fp_cmp_unit #(WID) u1 (.a(a & 40'h7FFFFFFFFF), .b(`EIGHT40), .o(cmp1_o), .nanx() );
`else if (WID==32)`	`else if (WID==32)`
fp_cmp_unit #(WID) u1 (.a(a & 32'h7FFFFFFF), .b(`EIGHT32), .o(cmp1_o), .nanx() );	fp_cmp_unit #(WID) u1 (.a(a & 32'h7FFFFFFF), .b(`EIGHT32), .o(cmp1_o), .nanx() );
`else begin`	`else begin`
`always @*`	`always @*`
`begin`	`begin`
`$display("Sigmoid: unsupported width.");`	`$display("Sigmoid: unsupported width.");`
`$stop;`	`$stop;`
`end`	`end`
`end`	`end`
`end`	`end`
`endgenerate`	`endgenerate`

`initial begin`	`initial begin`
`include "D:\Cores6\rtfItanium\v1\rtl\fpUnit\SigTbl.ver"	`include "D:\Cores6\nvio\v1\rtl\fpUnit\SigTbl.ver"
`end`	`end`

`// Quickly multiply number by 64 (it is in range -8 to 8) then convert to integer to get`	`// Quickly multiply number by 64 (it is in range -8 to 8) then convert to integer to get`
`// table index = add 6 to exponent then convert to integer`	`// table index = add 6 to exponent then convert to integer`
`wire sa;`	`wire sa;`
`wire [EMSB:0] xa;`	`wire [EMSB:0] xa;`
`wire [FMSB:0] ma;`	`wire [FMSB:0] ma;`
`fpDecomp #(WID) u1 (.i(a), .sgn(sa), .exp(xa), .man(ma), .fract(), .xz(), .vz(), .xinf(), .inf(), .nan() );`	`fpDecomp #(WID) u1 (.i(a), .sgn(sa), .exp(xa), .man(ma), .fract(), .xz(), .vz(), .xinf(), .inf(), .nan() );`

`reg [9:0] lutadr;`	`reg [9:0] lutadr;`
`wire [5:0] lzcnt;`	`wire [5:0] lzcnt;`
`wire [WID-1:0] a1;`	`wire [WID-1:0] a1;`
`wire [WID-1:0] i1, i2;`	`wire [WID-1:0] i1, i2;`
`wire [EMSB:0] xa1 = xa + 4'd6;`	`wire [EMSB:0] xa1 = xa + 4'd6;`
`assign a1 = {sa,xa1,ma}; // we know the exponent won't overflow`	`assign a1 = {sa,xa1,ma}; // we know the exponent won't overflow`
`wire [31:0] man32a = SigmoidLUT[lutadr];`	`wire [31:0] man32a = SigmoidLUT[lutadr];`
`wire [31:0] man32b = lutadr==10'h3ff ? man32a : SigmoidLUT[lutadr+1];`	`wire [31:0] man32b = lutadr==10'h3ff ? man32a : SigmoidLUT[lutadr+1];`
`wire [31:0] man32;`	`wire [31:0] man32;`
`wire [79:0] sig80;`	`wire [79:0] sig80;`
`generate begin : la`	`generate begin : la`
`if (WID >= 40) begin`	`if (WID >= 40) begin`
`wire [15:0] eps = ma[FMSB-10:FMSB-10-15];`	`wire [15:0] eps = ma[FMSB-10:FMSB-10-15];`
`wire [47:0] p = (man32b - man32a) * eps;`	`wire [47:0] p = (man32b - man32a) * eps;`
`assign man32 = man32a + (p >> 26);`	`assign man32 = man32a + (p >> 26);`
`cntlz32 u3 (man32,lzcnt);`	`cntlz32 u3 (man32,lzcnt);`
`end`	`end`
`else if (WID==32) begin`	`else if (WID==32) begin`
`wire [12:0] eps = ma[FMSB-10:0];`	`wire [12:0] eps = ma[FMSB-10:0];`
`wire [43:0] p = (man32b - man32a) * eps;`	`wire [43:0] p = (man32b - man32a) * eps;`
`assign man32 = man32a + (p >> 26);`	`assign man32 = man32a + (p >> 26);`
`cntlz32 u3 (man32,lzcnt);`	`cntlz32 u3 (man32,lzcnt);`
`end`	`end`
`end`	`end`
`endgenerate`	`endgenerate`

`wire [31:0] man32s = man32 << (lzcnt + 2'd1); // +1 to hide leading one`	`wire [31:0] man32s = man32 << (lzcnt + 2'd1); // +1 to hide leading one`

`// Convert to integer`	`// Convert to integer`
`f2i #(WID) u2`	`f2i #(WID) u2`
`(`	`(`
`.clk(clk),`	`.clk(clk),`
`.ce(1'b1),`	`.ce(1'b1),`
`.i(a1),`	`.i(a1),`
`.o(i2)`	`.o(i2)`
`);`	`);`
`assign i1 = i2 + 512;`	`assign i1 = i2 + 512;`

`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) cmp2_o <= cmp1_o;`	`if (ce) cmp2_o <= cmp1_o;`

`// We know the integer is in range 0 to 1023`	`// We know the integer is in range 0 to 1023`
`always @(posedge clk)`	`always @(posedge clk)`
`if(ce) lutadr <= i1[9:0];`	`if(ce) lutadr <= i1[9:0];`
`reg sa1,sa2;`	`reg sa1,sa2;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) sa1 <= a[WID-1];`	`if (ce) sa1 <= a[WID-1];`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) sa2 <= sa1;`	`if (ce) sa2 <= sa1;`

`generate begin : ooo`	`generate begin : ooo`
`if (WID==80) begin`	`if (WID==80) begin`
`wire [14:0] ex1 = 15'h3ffe - lzcnt;`	`wire [14:0] ex1 = 15'h3ffe - lzcnt;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) begin`	`if (ce) begin`
`if (cmp2_o[1]) // abs(a) less than 8 ?`	`if (cmp2_o[1]) // abs(a) less than 8 ?`
`o <= {1'b0,ex1,man32s[31:0],32'd0};`	`o <= {1'b0,ex1,man32s[31:0],32'd0};`
`else`	`else`
o <= sa1 ? 80'h0 : `ONE80;	o <= sa1 ? 80'h0 : `ONE80;
`end`	`end`
`end`	`end`
`else if (WID==64) begin`	`else if (WID==64) begin`
`wire [10:0] ex1 = 11'h3fe - lzcnt;`	`wire [10:0] ex1 = 11'h3fe - lzcnt;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) begin`	`if (ce) begin`
`if (cmp2_o[1]) // abs(a) less than 8 ?`	`if (cmp2_o[1]) // abs(a) less than 8 ?`
`o <= {1'b0,ex1,man32s[31:0],20'd0};`	`o <= {1'b0,ex1,man32s[31:0],20'd0};`
`else`	`else`
o <= sa1 ? 64'h0 : `ONE64;	o <= sa1 ? 64'h0 : `ONE64;
`end`	`end`
`end`	`end`
`else if (WID==40) begin`	`else if (WID==40) begin`
`wire [9:0] ex1 = 10'h1fe - lzcnt;`	`wire [9:0] ex1 = 10'h1fe - lzcnt;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) begin`	`if (ce) begin`
`if (cmp2_o[1]) // abs(a) less than 8 ?`	`if (cmp2_o[1]) // abs(a) less than 8 ?`
`o <= {1'b0,ex1,man32s[31:3]};`	`o <= {1'b0,ex1,man32s[31:3]};`
`else`	`else`
o <= sa1 ? 40'h0 : `ONE40;	o <= sa1 ? 40'h0 : `ONE40;
`end`	`end`
`end`	`end`
`else if (WID==32) begin`	`else if (WID==32) begin`
`wire [7:0] ex1 = 8'h7e - lzcnt;`	`wire [7:0] ex1 = 8'h7e - lzcnt;`
`always @(posedge clk)`	`always @(posedge clk)`
`if (ce) begin`	`if (ce) begin`
`if (cmp2_o[1]) // abs(a) less than 8 ?`	`if (cmp2_o[1]) // abs(a) less than 8 ?`
`o <= {1'b0,ex1,man32s[31:9]};`	`o <= {1'b0,ex1,man32s[31:9]};`
`else`	`else`
o <= sa1 ? 32'h0 : `ONE32;	o <= sa1 ? 32'h0 : `ONE32;
`end`	`end`
`end`	`end`
`end`	`end`
`endgenerate`	`endgenerate`

`endmodule`	`endmodule`

// ============================================================================

// ============================================================================

//        __

//        __

//   \\__/ o\    (C) 2017-2019  Robert Finch, Waterloo

//   \\__/ o\    (C) 2017-2019  Robert Finch, Waterloo

//    \  __ /    All rights reserved.

//    \  __ /    All rights reserved.

//     \/_//     robfinch<remove>@finitron.ca

//     \/_//     robfinch<remove>@finitron.ca

//       ||

//       ||

//

//

//      sigmoid.v

//      sigmoid.v

//              - perform sigmoid function

//              - perform sigmoid function

//

//

//

//

// This source file is free software: you can redistribute it and/or modify

// This source file is free software: you can redistribute it and/or modify

// it under the terms of the GNU Lesser General Public License as published

// it under the terms of the GNU Lesser General Public License as published

// by the Free Software Foundation, either version 3 of the License, or

// by the Free Software Foundation, either version 3 of the License, or

// (at your option) any later version.

// (at your option) any later version.

//

//

// This source file is distributed in the hope that it will be useful,

// This source file is distributed in the hope that it will be useful,

// but WITHOUT ANY WARRANTY; without even the implied warranty of

// but WITHOUT ANY WARRANTY; without even the implied warranty of

// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

// GNU General Public License for more details.

// GNU General Public License for more details.

//

//

// You should have received a copy of the GNU General Public License

// You should have received a copy of the GNU General Public License

// along with this program.  If not, see <http://www.gnu.org/licenses/>.

// along with this program.  If not, see <http://www.gnu.org/licenses/>.

//

//

//

//

// This module returns the sigmoid of a number using a lookup table.

// This module returns the sigmoid of a number using a lookup table.

// 0.0 or +1.0 is returned for entries outside of the range -8.0 to +8.0

// 0.0 or +1.0 is returned for entries outside of the range -8.0 to +8.0

//

//

// ToDo: check pipelining of values

// ToDo: check pipelining of values

// ============================================================================

// ============================================================================

`define ONE80                                   80'h3FFF0000000000000000

`define ONE80                                   80'h3FFF0000000000000000

`define EIGHT80                         80'h40020000000000000000

`define EIGHT80                         80'h40020000000000000000

`define FIVETWELVE80    80'h40080000000000000000

`define FIVETWELVE80    80'h40080000000000000000

`define ONE64                                   64'h3FF0000000000000

`define ONE64                                   64'h3FF0000000000000

`define EIGHT64                         64'h4020000000000000

`define EIGHT64                         64'h4020000000000000

`define FIVETWELVE64    64'h4080000000000000

`define FIVETWELVE64    64'h4080000000000000

`define ONE40                                   40'h3FE0000000

`define ONE40                                   40'h3FE0000000

`define EIGHT40                         40'h4040000000

`define EIGHT40                         40'h4040000000

`define ONE32                                   32'h7F000000

`define ONE32                                   32'h7F000000

`define EIGHT32                         32'h42000000

`define EIGHT32                         32'h42000000

`define FIVETWELVE32    32'h48000000

`define FIVETWELVE32    32'h48000000

module fpSigmoid(clk, ce, a, o);

module fpSigmoid(clk, ce, a, o);

parameter WID = 128;

parameter WID = 128;

localparam MSB = WID-1;

`include "fpSize.sv"

localparam EMSB = WID==128 ? 14 :

                  WID==96 ? 14 :

                  WID==80 ? 14 :

                  WID==64 ? 10 :

                                  WID==52 ? 10 :

                                  WID==48 ? 11 :

                                  WID==44 ? 10 :

                                  WID==42 ? 10 :

                                  WID==40 ?  9 :

                                  WID==32 ?  7 :

                                  WID==24 ?  6 : 4;

localparam FMSB = WID==128 ? 111 :

                  WID==96 ? 79 :

                  WID==80 ? 63 :

                  WID==64 ? 51 :

                                  WID==52 ? 39 :

                                  WID==48 ? 34 :

                                  WID==44 ? 31 :

                                  WID==42 ? 29 :

                                  WID==40 ? 28 :

                                  WID==32 ? 22 :

                                  WID==24 ? 15 : 9;

input clk;

input clk;

input ce;

input ce;

input [WID-1:0] a;

input [WID-1:0] a;

output reg [WID-1:0] o;

output reg [WID-1:0] o;

wire [4:0] cmp1_o;

wire [4:0] cmp1_o;

reg [4:0] cmp2_o;

reg [4:0] cmp2_o;

// Just the mantissa is stored in the table to economize on the storage.

// Just the mantissa is stored in the table to economize on the storage.

// The exponent is always the same value (0x3ff). Only the top 32 bits of

// The exponent is always the same value (0x3ff). Only the top 32 bits of

// the mantissa are stored.

// the mantissa are stored.

(* ram_style="block" *)

(* ram_style="block" *)

reg [31:0] SigmoidLUT [0:1023];

reg [31:0] SigmoidLUT [0:1023];

// Check if the input is in the range (-8 to +8)

// Check if the input is in the range (-8 to +8)

// We take the absolute value by trimming off the sign bit.

// We take the absolute value by trimming off the sign bit.

generate begin : ext

generate begin : ext

if (WID==80)

if (WID==80)

fp_cmp_unit #(WID) u1 (.a(a & 80'h7FFFFFFFFFFFFFFFFFFF), .b(`EIGHT80), .o(cmp1_o), .nanx() );

fp_cmp_unit #(WID) u1 (.a(a & 80'h7FFFFFFFFFFFFFFFFFFF), .b(`EIGHT80), .o(cmp1_o), .nanx() );

else if (WID==64)

else if (WID==64)

fp_cmp_unit #(WID) u1 (.a(a & 64'h7FFFFFFFFFFFFFFF), .b(`EIGHT64), .o(cmp1_o), .nanx() );

fp_cmp_unit #(WID) u1 (.a(a & 64'h7FFFFFFFFFFFFFFF), .b(`EIGHT64), .o(cmp1_o), .nanx() );

else if (WID==40)

else if (WID==40)

fp_cmp_unit #(WID) u1 (.a(a & 40'h7FFFFFFFFF), .b(`EIGHT40), .o(cmp1_o), .nanx() );

fp_cmp_unit #(WID) u1 (.a(a & 40'h7FFFFFFFFF), .b(`EIGHT40), .o(cmp1_o), .nanx() );

else if (WID==32)

else if (WID==32)

fp_cmp_unit #(WID) u1 (.a(a & 32'h7FFFFFFF), .b(`EIGHT32), .o(cmp1_o), .nanx() );

fp_cmp_unit #(WID) u1 (.a(a & 32'h7FFFFFFF), .b(`EIGHT32), .o(cmp1_o), .nanx() );

else begin

else begin

        always @*

        always @*

        begin

        begin

                $display("Sigmoid: unsupported width.");

                $display("Sigmoid: unsupported width.");

                $stop;

                $stop;

end

end

end

end

end

end

endgenerate

endgenerate

initial begin

initial begin

`include "D:\Cores6\rtfItanium\v1\rtl\fpUnit\SigTbl.ver"

`include "D:\Cores6\nvio\v1\rtl\fpUnit\SigTbl.ver"

end

end

// Quickly multiply number by 64 (it is in range -8 to 8) then convert to integer to get

// Quickly multiply number by 64 (it is in range -8 to 8) then convert to integer to get

// table index = add 6 to exponent then convert to integer

// table index = add 6 to exponent then convert to integer

wire sa;

wire sa;

wire [EMSB:0] xa;

wire [EMSB:0] xa;

wire [FMSB:0] ma;

wire [FMSB:0] ma;

fpDecomp #(WID) u1 (.i(a), .sgn(sa), .exp(xa), .man(ma), .fract(), .xz(), .vz(), .xinf(), .inf(), .nan() );

fpDecomp #(WID) u1 (.i(a), .sgn(sa), .exp(xa), .man(ma), .fract(), .xz(), .vz(), .xinf(), .inf(), .nan() );

reg [9:0] lutadr;

reg [9:0] lutadr;

wire [5:0] lzcnt;

wire [5:0] lzcnt;

wire [WID-1:0] a1;

wire [WID-1:0] a1;

wire [WID-1:0] i1, i2;

wire [WID-1:0] i1, i2;

wire [EMSB:0] xa1 = xa + 4'd6;

wire [EMSB:0] xa1 = xa + 4'd6;

assign a1 = {sa,xa1,ma};        // we know the exponent won't overflow

assign a1 = {sa,xa1,ma};        // we know the exponent won't overflow

wire [31:0] man32a = SigmoidLUT[lutadr];

wire [31:0] man32a = SigmoidLUT[lutadr];

wire [31:0] man32b = lutadr==10'h3ff ? man32a : SigmoidLUT[lutadr+1];

wire [31:0] man32b = lutadr==10'h3ff ? man32a : SigmoidLUT[lutadr+1];

wire [31:0] man32;

wire [31:0] man32;

wire [79:0] sig80;

wire [79:0] sig80;

generate begin : la

generate begin : la

if (WID >= 40) begin

if (WID >= 40) begin

wire [15:0] eps = ma[FMSB-10:FMSB-10-15];

wire [15:0] eps = ma[FMSB-10:FMSB-10-15];

wire [47:0] p = (man32b - man32a) * eps;

wire [47:0] p = (man32b - man32a) * eps;

assign man32 = man32a + (p >> 26);

assign man32 = man32a + (p >> 26);

cntlz32 u3 (man32,lzcnt);

cntlz32 u3 (man32,lzcnt);

end

end

else if (WID==32) begin

else if (WID==32) begin

wire [12:0] eps = ma[FMSB-10:0];

wire [12:0] eps = ma[FMSB-10:0];

wire [43:0] p = (man32b - man32a) * eps;

wire [43:0] p = (man32b - man32a) * eps;

assign man32 = man32a + (p >> 26);

assign man32 = man32a + (p >> 26);

cntlz32 u3 (man32,lzcnt);

cntlz32 u3 (man32,lzcnt);

end

end

end

end

endgenerate

endgenerate

wire [31:0] man32s = man32 << (lzcnt + 2'd1);    // +1 to hide leading one

wire [31:0] man32s = man32 << (lzcnt + 2'd1);    // +1 to hide leading one

// Convert to integer

// Convert to integer

f2i #(WID) u2

f2i #(WID) u2

  .clk(clk),

  .clk(clk),

  .ce(1'b1),

  .ce(1'b1),

  .i(a1),

  .i(a1),

  .o(i2)

  .o(i2)

);

);

assign i1 = i2 + 512;

assign i1 = i2 + 512;

always @(posedge clk)

always @(posedge clk)

  if (ce) cmp2_o <= cmp1_o;

  if (ce) cmp2_o <= cmp1_o;

// We know the integer is in range 0 to 1023

// We know the integer is in range 0 to 1023

always @(posedge clk)

always @(posedge clk)

  if(ce) lutadr <= i1[9:0];

  if(ce) lutadr <= i1[9:0];

reg sa1,sa2;

reg sa1,sa2;

always @(posedge clk)

always @(posedge clk)

if (ce) sa1 <= a[WID-1];

if (ce) sa1 <= a[WID-1];

always @(posedge clk)

always @(posedge clk)

if (ce) sa2 <= sa1;

if (ce) sa2 <= sa1;

generate begin : ooo

generate begin : ooo

if (WID==80) begin

if (WID==80) begin

wire [14:0] ex1 = 15'h3ffe - lzcnt;

wire [14:0] ex1 = 15'h3ffe - lzcnt;

always @(posedge clk)

always @(posedge clk)

if (ce) begin

if (ce) begin

        if (cmp2_o[1])  // abs(a) less than 8 ?

        if (cmp2_o[1])  // abs(a) less than 8 ?

          o <= {1'b0,ex1,man32s[31:0],32'd0};

          o <= {1'b0,ex1,man32s[31:0],32'd0};

        else

        else

          o <= sa1 ? 80'h0 : `ONE80;

          o <= sa1 ? 80'h0 : `ONE80;

end

end

end

end

else if (WID==64) begin

else if (WID==64) begin

wire [10:0] ex1 = 11'h3fe - lzcnt;

wire [10:0] ex1 = 11'h3fe - lzcnt;

always @(posedge clk)

always @(posedge clk)

if (ce) begin

if (ce) begin

        if (cmp2_o[1])  // abs(a) less than 8 ?

        if (cmp2_o[1])  // abs(a) less than 8 ?

          o <= {1'b0,ex1,man32s[31:0],20'd0};

          o <= {1'b0,ex1,man32s[31:0],20'd0};

        else

        else

          o <= sa1 ? 64'h0 : `ONE64;

          o <= sa1 ? 64'h0 : `ONE64;

end

end

end

end

else if (WID==40) begin

else if (WID==40) begin

wire [9:0] ex1 = 10'h1fe - lzcnt;

wire [9:0] ex1 = 10'h1fe - lzcnt;

always @(posedge clk)

always @(posedge clk)

if (ce) begin

if (ce) begin

        if (cmp2_o[1])  // abs(a) less than 8 ?

        if (cmp2_o[1])  // abs(a) less than 8 ?

          o <= {1'b0,ex1,man32s[31:3]};

          o <= {1'b0,ex1,man32s[31:3]};

        else

        else

          o <= sa1 ? 40'h0 : `ONE40;

          o <= sa1 ? 40'h0 : `ONE40;

end

end

end

end

else if (WID==32) begin

else if (WID==32) begin

wire [7:0] ex1 = 8'h7e - lzcnt;

wire [7:0] ex1 = 8'h7e - lzcnt;

always @(posedge clk)

always @(posedge clk)

if (ce) begin

if (ce) begin

        if (cmp2_o[1])  // abs(a) less than 8 ?

        if (cmp2_o[1])  // abs(a) less than 8 ?

          o <= {1'b0,ex1,man32s[31:9]};

          o <= {1'b0,ex1,man32s[31:9]};

        else

        else

          o <= sa1 ? 32'h0 : `ONE32;

          o <= sa1 ? 32'h0 : `ONE32;

end

end

end

end

end

end

endgenerate

endgenerate

endmodule

endmodule

Browse

Tools

Subversion Repositories ft816float

[/] [ft816float/] [trunk/] [rtl/] [verilog/] [fpSigmoid.v] - Diff between revs 18 and 26