OpenCores

-- #################################################################################################

-- #################################################################################################

-- # << NEORV32 - CPU Co-Processor: Single-Prec. Floating Point Unit (RISC-V "Zfinx" Extension) >> #

-- # << NEORV32 - CPU Co-Processor: Single-Prec. Floating Point Unit (RISC-V "Zfinx" Extension) >> #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # The Zfinx floating-point extension uses the integer register file (x) for all FP operations.  #

-- # The Zfinx floating-point extension uses the integer register file (x) for all FP operations.  #

-- # See the official RISC-V specs (https://github.com/riscv/riscv-zfinx) for more information.    #

-- # See the official RISC-V specs (https://github.com/riscv/riscv-zfinx) for more information.    #

-- #                                                                                               #

-- #                                                                                               #

-- # Design Notes:                                                                                 #

-- # Design Notes:                                                                                 #

-- # * This FPU is based on a multi-cycle architecture and is NOT suited for pipelined operations. #

-- # * This FPU is based on a multi-cycle architecture and is NOT suited for pipelined operations. #

-- # * The hardware design goal was SIZE (performance comes second). All shift operations are done #

-- # * The hardware design goal was SIZE (performance comes second). All shift operations are done #

-- #   using an iterative approach (one bit per clock cycle, no barrel shifters!).                 #

-- #   using an iterative approach (one bit per clock cycle, no barrel shifters!).                 #

-- # * Multiplication (FMUL instruction) will infer DSP blocks (if available).                     #

-- # * Multiplication (FMUL instruction) will infer DSP blocks (if available).                     #

-- # * Subnormal numbers are not supported yet - they are "flushed to zero" before entering the    #

-- # * Subnormal numbers are not supported yet - they are "flushed to zero" before entering the    #

-- #   actual FPU core.                                                                            #

-- #   actual FPU core.                                                                            #

-- # * Division and sqare root operations (FDIV, FSQRT) and fused multiply-accumulate operations   #

-- # * Division and sqare root operations (FDIV, FSQRT) and fused multiply-accumulate operations   #

-- #   (F[N]MADD) are not supported yet - they will raise an illegal instruction exception.        #

-- #   (F[N]MADD) are not supported yet - they will raise an illegal instruction exception.        #

-- # * Rounding mode <100> ("round to nearest, ties to max magnitude") is not supported yet.       #

-- # * Rounding mode <100> ("round to nearest, ties to max magnitude") is not supported yet.       #

-- # * Signaling NaNs (sNaN) will not be generated by the hardware at all. However, if inserted by #

-- # * Signaling NaNs (sNaN) will not be generated by the hardware at all. However, if inserted by #

-- #   the programmer they are handled correctly.                                                  #

-- #   the programmer they are handled correctly.                                                  #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # BSD 3-Clause License                                                                          #

-- # BSD 3-Clause License                                                                          #

-- #                                                                                               #

-- #                                                                                               #

-- # Copyright (c) 2022, Stephan Nolting. All rights reserved.                                     #

-- # Copyright (c) 2022, Stephan Nolting. All rights reserved.                                     #

-- #                                                                                               #

-- #                                                                                               #

-- # Redistribution and use in source and binary forms, with or without modification, are          #

-- # Redistribution and use in source and binary forms, with or without modification, are          #

-- # permitted provided that the following conditions are met:                                     #

-- # permitted provided that the following conditions are met:                                     #

-- #                                                                                               #

-- #                                                                                               #

-- # 1. Redistributions of source code must retain the above copyright notice, this list of        #

-- # 1. Redistributions of source code must retain the above copyright notice, this list of        #

-- #    conditions and the following disclaimer.                                                   #

-- #    conditions and the following disclaimer.                                                   #

-- #                                                                                               #

-- #                                                                                               #

-- # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #

-- # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #

-- #    conditions and the following disclaimer in the documentation and/or other materials        #

-- #    conditions and the following disclaimer in the documentation and/or other materials        #

-- #    provided with the distribution.                                                            #

-- #    provided with the distribution.                                                            #

-- #                                                                                               #

-- #                                                                                               #

-- # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #

-- # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #

-- #    endorse or promote products derived from this software without specific prior written      #

-- #    endorse or promote products derived from this software without specific prior written      #

-- #    permission.                                                                                #

-- #    permission.                                                                                #

-- #                                                                                               #

-- #                                                                                               #

-- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #

-- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #

-- # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #

-- # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #

-- # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #

-- # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #

-- # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #

-- # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #

-- # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #

-- # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #

-- # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #

-- # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #

-- # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #

-- # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #

-- # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #

-- # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #

-- # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #

-- # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #

-- # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #

-- #################################################################################################

-- #################################################################################################

library ieee;

library ieee;

use ieee.std_logic_1164.all;

use ieee.std_logic_1164.all;

use ieee.numeric_std.all;

use ieee.numeric_std.all;

library neorv32;

library neorv32;

use neorv32.neorv32_package.all;

use neorv32.neorv32_package.all;

entity neorv32_cpu_cp_fpu is

entity neorv32_cpu_cp_fpu is

  port (

  port (

    -- global control --

    -- global control --

    clk_i    : in  std_ulogic; -- global clock, rising edge

    clk_i    : in  std_ulogic; -- global clock, rising edge

    rstn_i   : in  std_ulogic; -- global reset, low-active, async

    rstn_i   : in  std_ulogic; -- global reset, low-active, async

    ctrl_i   : in  std_ulogic_vector(ctrl_width_c-1 downto 0); -- main control bus

    ctrl_i   : in  std_ulogic_vector(ctrl_width_c-1 downto 0); -- main control bus

    start_i  : in  std_ulogic; -- trigger operation

    start_i  : in  std_ulogic; -- trigger operation

    -- data input --

    -- data input --

    cmp_i    : in  std_ulogic_vector(1 downto 0); -- comparator status

    cmp_i    : in  std_ulogic_vector(1 downto 0); -- comparator status

    rs1_i    : in  std_ulogic_vector(data_width_c-1 downto 0); -- rf source 1

    rs1_i    : in  std_ulogic_vector(data_width_c-1 downto 0); -- rf source 1

    rs2_i    : in  std_ulogic_vector(data_width_c-1 downto 0); -- rf source 2

    rs2_i    : in  std_ulogic_vector(data_width_c-1 downto 0); -- rf source 2

    -- result and status --

    -- result and status --

    res_o    : out std_ulogic_vector(data_width_c-1 downto 0); -- operation result

    res_o    : out std_ulogic_vector(data_width_c-1 downto 0); -- operation result

    fflags_o : out std_ulogic_vector(4 downto 0); -- exception flags

    fflags_o : out std_ulogic_vector(4 downto 0); -- exception flags

    valid_o  : out std_ulogic -- data output valid

    valid_o  : out std_ulogic -- data output valid

);

);

end neorv32_cpu_cp_fpu;

end neorv32_cpu_cp_fpu;

architecture neorv32_cpu_cp_fpu_rtl of neorv32_cpu_cp_fpu is

architecture neorv32_cpu_cp_fpu_rtl of neorv32_cpu_cp_fpu is

  -- FPU core functions --

  -- FPU core functions --

  constant op_class_c  : std_ulogic_vector(2 downto 0) := "000";

  constant op_class_c  : std_ulogic_vector(2 downto 0) := "000";

  constant op_comp_c   : std_ulogic_vector(2 downto 0) := "001";

  constant op_comp_c   : std_ulogic_vector(2 downto 0) := "001";

  constant op_i2f_c    : std_ulogic_vector(2 downto 0) := "010";

  constant op_i2f_c    : std_ulogic_vector(2 downto 0) := "010";

  constant op_f2i_c    : std_ulogic_vector(2 downto 0) := "011";

  constant op_f2i_c    : std_ulogic_vector(2 downto 0) := "011";

  constant op_sgnj_c   : std_ulogic_vector(2 downto 0) := "100";

  constant op_sgnj_c   : std_ulogic_vector(2 downto 0) := "100";

  constant op_minmax_c : std_ulogic_vector(2 downto 0) := "101";

  constant op_minmax_c : std_ulogic_vector(2 downto 0) := "101";

  constant op_addsub_c : std_ulogic_vector(2 downto 0) := "110";

  constant op_addsub_c : std_ulogic_vector(2 downto 0) := "110";

  constant op_mul_c    : std_ulogic_vector(2 downto 0) := "111";

  constant op_mul_c    : std_ulogic_vector(2 downto 0) := "111";

  -- float-to-integer unit --

  -- float-to-integer unit --

  component neorv32_cpu_cp_fpu_f2i

  component neorv32_cpu_cp_fpu_f2i

  port (

  port (

    -- control --

    -- control --

    clk_i      : in  std_ulogic; -- global clock, rising edge

    clk_i      : in  std_ulogic; -- global clock, rising edge

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    start_i    : in  std_ulogic; -- trigger operation

    start_i    : in  std_ulogic; -- trigger operation

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    funct_i    : in  std_ulogic; -- 0=signed, 1=unsigned

    funct_i    : in  std_ulogic; -- 0=signed, 1=unsigned

    -- input --

    -- input --

    sign_i     : in  std_ulogic; -- sign

    sign_i     : in  std_ulogic; -- sign

    exponent_i : in  std_ulogic_vector(07 downto 0); -- exponent

    exponent_i : in  std_ulogic_vector(07 downto 0); -- exponent

    mantissa_i : in  std_ulogic_vector(22 downto 0); -- mantissa

    mantissa_i : in  std_ulogic_vector(22 downto 0); -- mantissa

    class_i    : in  std_ulogic_vector(09 downto 0); -- operand class

    class_i    : in  std_ulogic_vector(09 downto 0); -- operand class

    -- output --

    -- output --

    result_o   : out std_ulogic_vector(31 downto 0); -- integer result

    result_o   : out std_ulogic_vector(31 downto 0); -- integer result

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags

    done_o     : out std_ulogic -- operation done

    done_o     : out std_ulogic -- operation done

);

);

  end component;

  end component;

  -- normalizer + rounding unit --

  -- normalizer + rounding unit --

  component neorv32_cpu_cp_fpu_normalizer

  component neorv32_cpu_cp_fpu_normalizer

  port (

  port (

    -- control --

    -- control --

    clk_i      : in  std_ulogic; -- global clock, rising edge

    clk_i      : in  std_ulogic; -- global clock, rising edge

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    start_i    : in  std_ulogic; -- trigger operation

    start_i    : in  std_ulogic; -- trigger operation

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    funct_i    : in  std_ulogic; -- operating mode (0=norm&round, 1=int-to-float)

    funct_i    : in  std_ulogic; -- operating mode (0=norm&round, 1=int-to-float)

    -- input --

    -- input --

    sign_i     : in  std_ulogic; -- sign

    sign_i     : in  std_ulogic; -- sign

    exponent_i : in  std_ulogic_vector(08 downto 0); -- extended exponent

    exponent_i : in  std_ulogic_vector(08 downto 0); -- extended exponent

    mantissa_i : in  std_ulogic_vector(47 downto 0); -- extended mantissa

    mantissa_i : in  std_ulogic_vector(47 downto 0); -- extended mantissa

    integer_i  : in  std_ulogic_vector(31 downto 0); -- integer input

    integer_i  : in  std_ulogic_vector(31 downto 0); -- integer input

    class_i    : in  std_ulogic_vector(09 downto 0); -- input number class

    class_i    : in  std_ulogic_vector(09 downto 0); -- input number class

    flags_i    : in  std_ulogic_vector(04 downto 0); -- exception flags input

    flags_i    : in  std_ulogic_vector(04 downto 0); -- exception flags input

    -- output --

    -- output --

    result_o   : out std_ulogic_vector(31 downto 0); -- result (float or int)

    result_o   : out std_ulogic_vector(31 downto 0); -- result (float or int)

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags

    done_o     : out std_ulogic -- operation done

    done_o     : out std_ulogic -- operation done

);

);

  end component;

  end component;

  -- commands (one-hot) --

  -- commands (one-hot) --

  type cmd_t is record

  type cmd_t is record

    instr_class  : std_ulogic;

    instr_class  : std_ulogic;

    instr_sgnj   : std_ulogic;

    instr_sgnj   : std_ulogic;

    instr_comp   : std_ulogic;

    instr_comp   : std_ulogic;

    instr_i2f    : std_ulogic;

    instr_i2f    : std_ulogic;

    instr_f2i    : std_ulogic;

    instr_f2i    : std_ulogic;

    instr_minmax : std_ulogic;

    instr_minmax : std_ulogic;

    instr_addsub : std_ulogic;

    instr_addsub : std_ulogic;

    instr_mul    : std_ulogic;

    instr_mul    : std_ulogic;

    funct        : std_ulogic_vector(2 downto 0);

    funct        : std_ulogic_vector(2 downto 0);

  end record;

  end record;

  signal cmd : cmd_t;

  signal cmd : cmd_t;

  signal funct_ff : std_ulogic_vector(2 downto 0);

  signal funct_ff : std_ulogic_vector(2 downto 0);

  -- co-processor control engine --

  -- co-processor control engine --

  type ctrl_state_t is (S_IDLE, S_BUSY);

  type ctrl_state_t is (S_IDLE, S_BUSY);

  type ctrl_engine_t is record

  type ctrl_engine_t is record

    state : ctrl_state_t;

    state : ctrl_state_t;

    start : std_ulogic;

    start : std_ulogic;

    valid : std_ulogic;

    valid : std_ulogic;

  end record;

  end record;

  signal ctrl_engine : ctrl_engine_t;

  signal ctrl_engine : ctrl_engine_t;

  -- floating-point operands --

  -- floating-point operands --

  type op_data_t  is array (0 to 1) of std_ulogic_vector(31 downto 0);

  type op_data_t  is array (0 to 1) of std_ulogic_vector(31 downto 0);

  type op_class_t is array (0 to 1) of std_ulogic_vector(09 downto 0);

  type op_class_t is array (0 to 1) of std_ulogic_vector(09 downto 0);

  type fpu_operands_t is record

  type fpu_operands_t is record

    rs1       : std_ulogic_vector(31 downto 0); -- operand 1

    rs1       : std_ulogic_vector(31 downto 0); -- operand 1

    rs1_class : std_ulogic_vector(09 downto 0); -- operand 1 number class

    rs1_class : std_ulogic_vector(09 downto 0); -- operand 1 number class

    rs2       : std_ulogic_vector(31 downto 0); -- operand 2

    rs2       : std_ulogic_vector(31 downto 0); -- operand 2

    rs2_class : std_ulogic_vector(09 downto 0); -- operand 2 number class

    rs2_class : std_ulogic_vector(09 downto 0); -- operand 2 number class

    frm       : std_ulogic_vector(02 downto 0); -- rounding mode

    frm       : std_ulogic_vector(02 downto 0); -- rounding mode

  end record;

  end record;

  signal op_data      : op_data_t;

  signal op_data      : op_data_t;

  signal op_class     : op_class_t;

  signal op_class     : op_class_t;

  signal fpu_operands : fpu_operands_t;

  signal fpu_operands : fpu_operands_t;

  -- floating-point comparator --

  -- floating-point comparator --

  signal cmp_ff        : std_ulogic_vector(01 downto 0);

  signal cmp_ff        : std_ulogic_vector(01 downto 0);

  signal comp_equal_ff : std_ulogic;

  signal comp_equal_ff : std_ulogic;

  signal comp_less_ff  : std_ulogic;

  signal comp_less_ff  : std_ulogic;

  -- functional units interface --

  -- functional units interface --

  type fu_interface_t is record

  type fu_interface_t is record

    result : std_ulogic_vector(31 downto 0);

    result : std_ulogic_vector(31 downto 0);

    flags  : std_ulogic_vector(04 downto 0);

    flags  : std_ulogic_vector(04 downto 0);

    start  : std_ulogic;

    start  : std_ulogic;

    done   : std_ulogic;

    done   : std_ulogic;

  end record;

  end record;

  signal fu_classify    : fu_interface_t;

  signal fu_classify    : fu_interface_t;

  signal fu_compare     : fu_interface_t;

  signal fu_compare     : fu_interface_t;

  signal fu_sign_inject : fu_interface_t;

  signal fu_sign_inject : fu_interface_t;

  signal fu_min_max     : fu_interface_t;

  signal fu_min_max     : fu_interface_t;

  signal fu_conv_f2i    : fu_interface_t;

  signal fu_conv_f2i    : fu_interface_t;

  signal fu_addsub      : fu_interface_t;

  signal fu_addsub      : fu_interface_t;

  signal fu_mul         : fu_interface_t;

  signal fu_mul         : fu_interface_t;

  signal fu_core_done   : std_ulogic; -- FU operation completed

  signal fu_core_done   : std_ulogic; -- FU operation completed

  -- integer-to-float --

  -- integer-to-float --

  type fu_i2f_interface_t is record

  type fu_i2f_interface_t is record

    result : std_ulogic_vector(31 downto 0);

    result : std_ulogic_vector(31 downto 0);

    sign   : std_ulogic;

    sign   : std_ulogic;

    start  : std_ulogic;

    start  : std_ulogic;

    done   : std_ulogic;

    done   : std_ulogic;

  end record;

  end record;

  signal fu_conv_i2f : fu_i2f_interface_t; -- float result

  signal fu_conv_i2f : fu_i2f_interface_t; -- float result

  -- multiplier unit --

  -- multiplier unit --

  type multiplier_t is record

  type multiplier_t is record

    opa       : unsigned(23 downto 0); -- mantissa A plus hidden one

    opa       : unsigned(23 downto 0); -- mantissa A plus hidden one

    opb       : unsigned(23 downto 0); -- mantissa B plus hidden one

    opb       : unsigned(23 downto 0); -- mantissa B plus hidden one

    buf_ff    : unsigned(47 downto 0); -- product buffer

    buf_ff    : unsigned(47 downto 0); -- product buffer

    sign      : std_ulogic; -- resulting sign

    sign      : std_ulogic; -- resulting sign

    product   : std_ulogic_vector(47 downto 0); -- product

    product   : std_ulogic_vector(47 downto 0); -- product

    exp_sum   : std_ulogic_vector(08 downto 0); -- incl 1x overflow/underflow bit

    exp_sum   : std_ulogic_vector(08 downto 0); -- incl 1x overflow/underflow bit

    exp_res   : std_ulogic_vector(09 downto 0); -- resulting exponent incl 2x overflow/underflow bit

    exp_res   : std_ulogic_vector(09 downto 0); -- resulting exponent incl 2x overflow/underflow bit

--

--

    res_class : std_ulogic_vector(09 downto 0);

    res_class : std_ulogic_vector(09 downto 0);

    flags     : std_ulogic_vector(04 downto 0); -- exception flags

    flags     : std_ulogic_vector(04 downto 0); -- exception flags

--

--

    start     : std_ulogic;

    start     : std_ulogic;

    latency   : std_ulogic_vector(02 downto 0); -- unit latency

    latency   : std_ulogic_vector(02 downto 0); -- unit latency

    done      : std_ulogic;

    done      : std_ulogic;

  end record;

  end record;

  signal multiplier : multiplier_t;

  signal multiplier : multiplier_t;

  -- adder/subtractor unit --

  -- adder/subtractor unit --

  type addsub_t is record

  type addsub_t is record

    -- input comparison --

    -- input comparison --

    exp_comp  : std_ulogic_vector(01 downto 0); -- equal & less

    exp_comp  : std_ulogic_vector(01 downto 0); -- equal & less

    small_exp : std_ulogic_vector(07 downto 0);

    small_exp : std_ulogic_vector(07 downto 0);

    small_man : std_ulogic_vector(23 downto 0); -- mantissa + hiden one

    small_man : std_ulogic_vector(23 downto 0); -- mantissa + hiden one

    large_exp : std_ulogic_vector(07 downto 0);

    large_exp : std_ulogic_vector(07 downto 0);

    large_man : std_ulogic_vector(23 downto 0); -- mantissa + hiden one

    large_man : std_ulogic_vector(23 downto 0); -- mantissa + hiden one

    -- smaller mantissa alginment --

    -- smaller mantissa alginment --

    man_sreg  : std_ulogic_vector(23 downto 0); -- mantissa + hidden one

    man_sreg  : std_ulogic_vector(23 downto 0); -- mantissa + hidden one

    man_g_ext : std_ulogic;

    man_g_ext : std_ulogic;

    man_r_ext : std_ulogic;

    man_r_ext : std_ulogic;

    man_s_ext : std_ulogic;

    man_s_ext : std_ulogic;

    exp_cnt   : std_ulogic_vector(08 downto 0);

    exp_cnt   : std_ulogic_vector(08 downto 0);

    -- adder/subtractor stage --

    -- adder/subtractor stage --

    man_comp  : std_ulogic;

    man_comp  : std_ulogic;

    man_s     : std_ulogic_vector(26 downto 0); -- mantissa + hiden one + GRS

    man_s     : std_ulogic_vector(26 downto 0); -- mantissa + hiden one + GRS

    man_l     : std_ulogic_vector(26 downto 0); -- mantissa + hiden one + GRS

    man_l     : std_ulogic_vector(26 downto 0); -- mantissa + hiden one + GRS

    add_stage : std_ulogic_vector(27 downto 0); -- adder result incl. overflow

    add_stage : std_ulogic_vector(27 downto 0); -- adder result incl. overflow

    -- result --

    -- result --

    res_sign  : std_ulogic;

    res_sign  : std_ulogic;

    res_sum   : std_ulogic_vector(27 downto 0); -- mantissa sum (+1 bit) + GRS bits (for rounding)

    res_sum   : std_ulogic_vector(27 downto 0); -- mantissa sum (+1 bit) + GRS bits (for rounding)

    res_class : std_ulogic_vector(09 downto 0);

    res_class : std_ulogic_vector(09 downto 0);

    flags     : std_ulogic_vector(04 downto 0); -- exception flags

    flags     : std_ulogic_vector(04 downto 0); -- exception flags

    -- arbitration --

    -- arbitration --

    start     : std_ulogic;

    start     : std_ulogic;

    latency   : std_ulogic_vector(04 downto 0); -- unit latency

    latency   : std_ulogic_vector(04 downto 0); -- unit latency

    done      : std_ulogic;

    done      : std_ulogic;

  end record;

  end record;

  signal addsub : addsub_t;

  signal addsub : addsub_t;

  -- normalizer interface (normalization & rounding and int-to-float) --

  -- normalizer interface (normalization & rounding and int-to-float) --

  type normalizer_t is record

  type normalizer_t is record

    start     : std_ulogic;

    start     : std_ulogic;

    mode      : std_ulogic;

    mode      : std_ulogic;

    sign      : std_ulogic;

    sign      : std_ulogic;

    xexp      : std_ulogic_vector(08 downto 0);

    xexp      : std_ulogic_vector(08 downto 0);

    xmantissa : std_ulogic_vector(47 downto 0);

    xmantissa : std_ulogic_vector(47 downto 0);

    result    : std_ulogic_vector(31 downto 0);

    result    : std_ulogic_vector(31 downto 0);

    class     : std_ulogic_vector(09 downto 0);

    class     : std_ulogic_vector(09 downto 0);

    flags_in  : std_ulogic_vector(04 downto 0);

    flags_in  : std_ulogic_vector(04 downto 0);

    flags_out : std_ulogic_vector(04 downto 0);

    flags_out : std_ulogic_vector(04 downto 0);

    done      : std_ulogic;

    done      : std_ulogic;

  end record;

  end record;

  signal normalizer : normalizer_t;

  signal normalizer : normalizer_t;

begin

begin

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

-- Control

-- Control

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

  -- Instruction Decoding -------------------------------------------------------------------

  -- Instruction Decoding -------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- one-hot re-encoding --

  -- one-hot re-encoding --

  cmd.instr_class  <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "11100") else '0';

  cmd.instr_class  <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "11100") else '0';

  cmd.instr_comp   <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "10100") else '0';

  cmd.instr_comp   <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "10100") else '0';

  cmd.instr_i2f    <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "11010") else '0';

  cmd.instr_i2f    <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "11010") else '0';

  cmd.instr_f2i    <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "11000") else '0';

  cmd.instr_f2i    <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "11000") else '0';

  cmd.instr_sgnj   <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "00100") else '0';

  cmd.instr_sgnj   <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "00100") else '0';

  cmd.instr_minmax <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "00101") else '0';

  cmd.instr_minmax <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "00101") else '0';

  cmd.instr_addsub <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_8_c) = "0000")  else '0';

  cmd.instr_addsub <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_8_c) = "0000")  else '0';

  cmd.instr_mul    <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "00010") else '0';

  cmd.instr_mul    <= '1' when (ctrl_i(ctrl_ir_funct12_11_c downto ctrl_ir_funct12_7_c) = "00010") else '0';

  -- binary re-encoding --

  -- binary re-encoding --

  cmd.funct <= op_mul_c     when (cmd.instr_mul    = '1') else

  cmd.funct <= op_mul_c     when (cmd.instr_mul    = '1') else

               op_addsub_c  when (cmd.instr_addsub = '1') else

               op_addsub_c  when (cmd.instr_addsub = '1') else

               op_minmax_c  when (cmd.instr_minmax = '1') else

               op_minmax_c  when (cmd.instr_minmax = '1') else

               op_sgnj_c    when (cmd.instr_sgnj   = '1') else

               op_sgnj_c    when (cmd.instr_sgnj   = '1') else

               op_f2i_c     when (cmd.instr_f2i    = '1') else

               op_f2i_c     when (cmd.instr_f2i    = '1') else

               op_i2f_c     when (cmd.instr_i2f    = '1') else

               op_i2f_c     when (cmd.instr_i2f    = '1') else

               op_comp_c    when (cmd.instr_comp   = '1') else

               op_comp_c    when (cmd.instr_comp   = '1') else

               op_class_c;--when (cmd.instr_class  = '1') else (others => '-');

               op_class_c;--when (cmd.instr_class  = '1') else (others => '-');

  -- Input Operands: Check for subnormal numbers (flush to zero) ----------------------------

  -- Input Operands: Check for subnormal numbers (flush to zero) ----------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- Subnormal numbers are not supported and are "flushed to zero"! FIXME / TODO

  -- Subnormal numbers are not supported and are "flushed to zero"! FIXME / TODO

  -- rs1 --

  -- rs1 --

  op_data(0)(31)           <= rs1_i(31);

  op_data(0)(31)           <= rs1_i(31);

  op_data(0)(30 downto 23) <= rs1_i(30 downto 23);

  op_data(0)(30 downto 23) <= rs1_i(30 downto 23);

  op_data(0)(22 downto 00) <= (others => '0') when (rs1_i(30 downto 23) = "00000000") else rs1_i(22 downto 0); -- flush mantissa to zero if subnormal

  op_data(0)(22 downto 00) <= (others => '0') when (rs1_i(30 downto 23) = "00000000") else rs1_i(22 downto 0); -- flush mantissa to zero if subnormal

  -- rs2 --

  -- rs2 --

  op_data(1)(31)           <= rs2_i(31);

  op_data(1)(31)           <= rs2_i(31);

  op_data(1)(30 downto 23) <= rs2_i(30 downto 23);

  op_data(1)(30 downto 23) <= rs2_i(30 downto 23);

  op_data(1)(22 downto 00) <= (others => '0') when (rs2_i(30 downto 23) = "00000000") else rs2_i(22 downto 0); -- flush mantissa to zero if subnormal

  op_data(1)(22 downto 00) <= (others => '0') when (rs2_i(30 downto 23) = "00000000") else rs2_i(22 downto 0); -- flush mantissa to zero if subnormal

  -- Number Classifier ----------------------------------------------------------------------

  -- Number Classifier ----------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  number_classifier: process(op_data)

  number_classifier: process(op_data)

    variable op_m_all_zero_v, op_e_all_zero_v, op_e_all_one_v       : std_ulogic;

    variable op_m_all_zero_v, op_e_all_zero_v, op_e_all_one_v       : std_ulogic;

    variable op_is_zero_v, op_is_inf_v, op_is_denorm_v, op_is_nan_v : std_ulogic;

    variable op_is_zero_v, op_is_inf_v, op_is_denorm_v, op_is_nan_v : std_ulogic;

  begin

  begin

    for i in 0 to 1 loop -- for rs1 and rs2 inputs

    for i in 0 to 1 loop -- for rs1 and rs2 inputs

      -- check for all-zero/all-one --

      -- check for all-zero/all-one --

      op_m_all_zero_v := not or_reduce_f(op_data(i)(22 downto 00));

      op_m_all_zero_v := '0';

      op_e_all_zero_v := not or_reduce_f(op_data(i)(30 downto 23));

      op_e_all_zero_v := '0';

      op_e_all_one_v  := and_reduce_f(op_data(i)(30 downto 23));

      op_e_all_one_v  := '0';

      if (or_reduce_f(op_data(i)(22 downto 00)) = '0') then

        op_m_all_zero_v := '1';

      end if;

      if (or_reduce_f(op_data(i)(30 downto 23)) = '0') then

        op_e_all_zero_v := '1';

      end if;

      if (and_reduce_f(op_data(i)(30 downto 23)) = '1') then

        op_e_all_one_v  := '1';

      end if;

      -- check special cases --

      -- check special cases --

      op_is_zero_v   := op_e_all_zero_v and      op_m_all_zero_v;  -- zero

      op_is_zero_v   := op_e_all_zero_v and      op_m_all_zero_v;  -- zero

      op_is_inf_v    := op_e_all_one_v  and      op_m_all_zero_v;  -- infinity

      op_is_inf_v    := op_e_all_one_v  and      op_m_all_zero_v;  -- infinity

      op_is_denorm_v := '0'; -- FIXME / TODO -- op_e_all_zero_v and (not op_m_all_zero_v); -- subnormal

      op_is_denorm_v := '0'; -- FIXME / TODO -- op_e_all_zero_v and (not op_m_all_zero_v); -- subnormal

      op_is_nan_v    := op_e_all_one_v  and (not op_m_all_zero_v); -- NaN

      op_is_nan_v    := op_e_all_one_v  and (not op_m_all_zero_v); -- NaN

      -- actual attributes --

      -- actual attributes --

      op_class(i)(fp_class_neg_inf_c)    <= op_data(i)(31) and op_is_inf_v; -- negative infinity

      op_class(i)(fp_class_neg_inf_c)    <= op_data(i)(31) and op_is_inf_v; -- negative infinity

      op_class(i)(fp_class_neg_norm_c)   <= op_data(i)(31) and (not op_is_denorm_v) and (not op_is_nan_v) and (not op_is_inf_v) and (not op_is_zero_v); -- negative normal number

      op_class(i)(fp_class_neg_norm_c)   <= op_data(i)(31) and (not op_is_denorm_v) and (not op_is_nan_v) and (not op_is_inf_v) and (not op_is_zero_v); -- negative normal number

      op_class(i)(fp_class_neg_denorm_c) <= op_data(i)(31) and op_is_denorm_v; -- negative subnormal number

      op_class(i)(fp_class_neg_denorm_c) <= op_data(i)(31) and op_is_denorm_v; -- negative subnormal number

      op_class(i)(fp_class_neg_zero_c)   <= op_data(i)(31) and op_is_zero_v; -- negative zero

      op_class(i)(fp_class_neg_zero_c)   <= op_data(i)(31) and op_is_zero_v; -- negative zero

      op_class(i)(fp_class_pos_zero_c)   <= (not op_data(i)(31)) and op_is_zero_v; -- positive zero

      op_class(i)(fp_class_pos_zero_c)   <= (not op_data(i)(31)) and op_is_zero_v; -- positive zero

      op_class(i)(fp_class_pos_denorm_c) <= (not op_data(i)(31)) and op_is_denorm_v; -- positive subnormal number

      op_class(i)(fp_class_pos_denorm_c) <= (not op_data(i)(31)) and op_is_denorm_v; -- positive subnormal number

      op_class(i)(fp_class_pos_norm_c)   <= (not op_data(i)(31)) and (not op_is_denorm_v) and (not op_is_nan_v) and (not op_is_inf_v) and (not op_is_zero_v); -- positive normal number

      op_class(i)(fp_class_pos_norm_c)   <= (not op_data(i)(31)) and (not op_is_denorm_v) and (not op_is_nan_v) and (not op_is_inf_v) and (not op_is_zero_v); -- positive normal number

      op_class(i)(fp_class_pos_inf_c)    <= (not op_data(i)(31)) and op_is_inf_v; -- positive infinity

      op_class(i)(fp_class_pos_inf_c)    <= (not op_data(i)(31)) and op_is_inf_v; -- positive infinity

      op_class(i)(fp_class_snan_c)       <= op_is_nan_v and (not op_data(i)(22)); -- signaling NaN

      op_class(i)(fp_class_snan_c)       <= op_is_nan_v and (not op_data(i)(22)); -- signaling NaN

      op_class(i)(fp_class_qnan_c)       <= op_is_nan_v and (    op_data(i)(22)); -- quiet NaN

      op_class(i)(fp_class_qnan_c)       <= op_is_nan_v and (    op_data(i)(22)); -- quiet NaN

    end loop; -- i

    end loop; -- i

  end process number_classifier;

  end process number_classifier;

  -- Co-Processor Control Engine ------------------------------------------------------------

  -- Co-Processor Control Engine ------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  control_engine_fsm: process(rstn_i, clk_i)

  control_engine_fsm: process(rstn_i, clk_i)

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      ctrl_engine.state      <= S_IDLE;

      ctrl_engine.state      <= S_IDLE;

      ctrl_engine.valid      <= '0';

      ctrl_engine.start      <= '0';

      ctrl_engine.start      <= '0';

      fpu_operands.frm       <= (others => def_rst_val_c);

      fpu_operands.frm       <= (others => def_rst_val_c);

      fpu_operands.rs1       <= (others => def_rst_val_c);

      fpu_operands.rs1       <= (others => def_rst_val_c);

      fpu_operands.rs1_class <= (others => def_rst_val_c);

      fpu_operands.rs1_class <= (others => def_rst_val_c);

      fpu_operands.rs2       <= (others => def_rst_val_c);

      fpu_operands.rs2       <= (others => def_rst_val_c);

      fpu_operands.rs2_class <= (others => def_rst_val_c);

      fpu_operands.rs2_class <= (others => def_rst_val_c);

      funct_ff               <= (others => def_rst_val_c);

      funct_ff               <= (others => def_rst_val_c);

      cmp_ff                 <= (others => def_rst_val_c);

      cmp_ff                 <= (others => def_rst_val_c);

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- arbiter defaults --

      -- arbiter defaults --

      ctrl_engine.valid <= '0';

      ctrl_engine.valid <= '0';

      ctrl_engine.start <= '0';

      ctrl_engine.start <= '0';

      -- state machine --

      -- state machine --

      case ctrl_engine.state is

      case ctrl_engine.state is

        when S_IDLE => -- waiting for operation trigger

        when S_IDLE => -- waiting for operation trigger

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          funct_ff <= cmd.funct; -- actual operation to execute

          funct_ff <= cmd.funct; -- actual operation to execute

          cmp_ff   <= cmp_i; -- main ALU comparator

          cmp_ff   <= cmp_i; -- main ALU comparator

          -- rounding mode --

          -- rounding mode --

          -- TODO / FIXME "round to nearest, ties to max magnitude" (0b100) is not supported yet

          -- TODO / FIXME "round to nearest, ties to max magnitude" (0b100) is not supported yet

          if (ctrl_i(ctrl_ir_funct3_2_c downto ctrl_ir_funct3_0_c) = "111") then

          if (ctrl_i(ctrl_ir_funct3_2_c downto ctrl_ir_funct3_0_c) = "111") then

            fpu_operands.frm <= '0' & ctrl_i(ctrl_alu_frm1_c downto ctrl_alu_frm0_c);

            fpu_operands.frm <= '0' & ctrl_i(ctrl_alu_frm1_c downto ctrl_alu_frm0_c);

          else

          else

            fpu_operands.frm <= '0' & ctrl_i(ctrl_ir_funct3_1_c downto ctrl_ir_funct3_0_c);

            fpu_operands.frm <= '0' & ctrl_i(ctrl_ir_funct3_1_c downto ctrl_ir_funct3_0_c);

          end if;

          end if;

--

--

          if (start_i = '1') then

          if (start_i = '1') then

            -- operand data --

            -- operand data --

            fpu_operands.rs1       <= op_data(0);

            fpu_operands.rs1       <= op_data(0);

            fpu_operands.rs1_class <= op_class(0);

            fpu_operands.rs1_class <= op_class(0);

            fpu_operands.rs2       <= op_data(1);

            fpu_operands.rs2       <= op_data(1);

            fpu_operands.rs2_class <= op_class(1);

            fpu_operands.rs2_class <= op_class(1);

            -- execute! --

            -- execute! --

            ctrl_engine.start <= '1';

            ctrl_engine.start <= '1';

            ctrl_engine.state <= S_BUSY;

            ctrl_engine.state <= S_BUSY;

          end if;

          end if;

        when S_BUSY => -- operation in progress (multi-cycle)

        when S_BUSY => -- operation in progress (multi-cycle)

        -- -----------------------------------------------------------

        -- -----------------------------------------------------------

          if (fu_core_done = '1') or (ctrl_i(ctrl_trap_c) = '1') then -- processing done? abort if trap

          if (fu_core_done = '1') or (ctrl_i(ctrl_trap_c) = '1') then -- processing done? abort if trap

            ctrl_engine.valid <= '1';

            ctrl_engine.valid <= '1';

            ctrl_engine.state <= S_IDLE;

            ctrl_engine.state <= S_IDLE;

          end if;

          end if;

        when others => -- undefined

        when others => -- undefined

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl_engine.state <= S_IDLE;

          ctrl_engine.state <= S_IDLE;

      end case;

      end case;

    end if;

    end if;

  end process control_engine_fsm;

  end process control_engine_fsm;

  -- operation done / valid output --

  -- operation done / valid output --

  valid_o <= ctrl_engine.valid;

  valid_o <= ctrl_engine.valid;

  -- Functional Unit Interface (operation-start trigger) ------------------------------------

  -- Functional Unit Interface (operation-start trigger) ------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  fu_classify.start    <= ctrl_engine.start and cmd.instr_class;

  fu_classify.start    <= ctrl_engine.start and cmd.instr_class;

  fu_compare.start     <= ctrl_engine.start and cmd.instr_comp;

  fu_compare.start     <= ctrl_engine.start and cmd.instr_comp;

  fu_sign_inject.start <= ctrl_engine.start and cmd.instr_sgnj;

  fu_sign_inject.start <= ctrl_engine.start and cmd.instr_sgnj;

  fu_min_max.start     <= ctrl_engine.start and cmd.instr_minmax;

  fu_min_max.start     <= ctrl_engine.start and cmd.instr_minmax;

  fu_conv_i2f.start    <= ctrl_engine.start and cmd.instr_i2f;

  fu_conv_i2f.start    <= ctrl_engine.start and cmd.instr_i2f;

  fu_conv_f2i.start    <= ctrl_engine.start and cmd.instr_f2i;

  fu_conv_f2i.start    <= ctrl_engine.start and cmd.instr_f2i;

  fu_addsub.start      <= ctrl_engine.start and cmd.instr_addsub;

  fu_addsub.start      <= ctrl_engine.start and cmd.instr_addsub;

  fu_mul.start         <= ctrl_engine.start and cmd.instr_mul;

  fu_mul.start         <= ctrl_engine.start and cmd.instr_mul;

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

-- FPU Core - Functional Units

-- FPU Core - Functional Units

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

  -- Number Classifier (FCLASS) -------------------------------------------------------------

  -- Number Classifier (FCLASS) -------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  fu_classify.flags <= (others => '0'); -- does not generate flags at all

  fu_classify.flags <= (others => '0'); -- does not generate flags at all

  fu_classify.result(31 downto 10) <= (others => '0');

  fu_classify.result(31 downto 10) <= (others => '0');

  fu_classify.result(09 downto 00) <= fpu_operands.rs1_class;

  fu_classify.result(09 downto 00) <= fpu_operands.rs1_class;

  fu_classify.done <= fu_classify.start;

  fu_classify.done <= fu_classify.start;

  -- Floating-Point Comparator --------------------------------------------------------------

  -- Floating-Point Comparator --------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  float_comparator: process(rstn_i, clk_i)

  float_comparator: process(rstn_i, clk_i)

    variable cond_v : std_ulogic_vector(1 downto 0);

    variable cond_v : std_ulogic_vector(1 downto 0);

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      comp_equal_ff   <= def_rst_val_c;

      comp_equal_ff   <= def_rst_val_c;

      comp_less_ff    <= def_rst_val_c;

      comp_less_ff    <= def_rst_val_c;

      fu_compare.done <= def_rst_val_c;

      fu_compare.done <= def_rst_val_c;

      fu_min_max.done <= def_rst_val_c;

      fu_min_max.done <= def_rst_val_c;

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- equal --

      -- equal --

      if ((fpu_operands.rs1_class(fp_class_pos_inf_c)   = '1') and (fpu_operands.rs2_class(fp_class_pos_inf_c) = '1')) or -- +inf == +inf

      if ((fpu_operands.rs1_class(fp_class_pos_inf_c)   = '1') and (fpu_operands.rs2_class(fp_class_pos_inf_c) = '1')) or -- +inf == +inf

         ((fpu_operands.rs1_class(fp_class_neg_inf_c)   = '1') and (fpu_operands.rs2_class(fp_class_neg_inf_c) = '1')) or -- -inf == -inf

         ((fpu_operands.rs1_class(fp_class_neg_inf_c)   = '1') and (fpu_operands.rs2_class(fp_class_neg_inf_c) = '1')) or -- -inf == -inf

         (((fpu_operands.rs1_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs1_class(fp_class_neg_zero_c) = '1')) and

         (((fpu_operands.rs1_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs1_class(fp_class_neg_zero_c) = '1')) and

          ((fpu_operands.rs2_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs2_class(fp_class_neg_zero_c) = '1'))) or  -- +/-zero == +/-zero

          ((fpu_operands.rs2_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs2_class(fp_class_neg_zero_c) = '1'))) or  -- +/-zero == +/-zero

         (cmp_ff(cmp_equal_c) = '1') then -- identical in every way (comparator result from main ALU)

         (cmp_ff(cmp_equal_c) = '1') then -- identical in every way (comparator result from main ALU)

        comp_equal_ff <= '1';

        comp_equal_ff <= '1';

      else

      else

        comp_equal_ff <= '0';

        comp_equal_ff <= '0';

      end if;

      end if;

      -- less than --

      -- less than --

      if ((fpu_operands.rs1_class(fp_class_pos_inf_c)  = '1') and (fpu_operands.rs2_class(fp_class_pos_inf_c) = '1')) or -- +inf !< +inf

      if ((fpu_operands.rs1_class(fp_class_pos_inf_c)  = '1') and (fpu_operands.rs2_class(fp_class_pos_inf_c) = '1')) or -- +inf !< +inf

         ((fpu_operands.rs1_class(fp_class_neg_inf_c)  = '1') and (fpu_operands.rs2_class(fp_class_neg_inf_c) = '1')) or -- -inf !< -inf

         ((fpu_operands.rs1_class(fp_class_neg_inf_c)  = '1') and (fpu_operands.rs2_class(fp_class_neg_inf_c) = '1')) or -- -inf !< -inf

         (((fpu_operands.rs1_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs1_class(fp_class_neg_zero_c) = '1')) and

         (((fpu_operands.rs1_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs1_class(fp_class_neg_zero_c) = '1')) and

          ((fpu_operands.rs2_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs2_class(fp_class_neg_zero_c) = '1'))) then  -- +/-zero !< +/-zero

          ((fpu_operands.rs2_class(fp_class_pos_zero_c) = '1') or (fpu_operands.rs2_class(fp_class_neg_zero_c) = '1'))) then  -- +/-zero !< +/-zero

        comp_less_ff <= '0';

        comp_less_ff <= '0';

      else

      else

        cond_v := fpu_operands.rs1(31) & fpu_operands.rs2(31);

        cond_v := fpu_operands.rs1(31) & fpu_operands.rs2(31);

        case cond_v is

        case cond_v is

          when "10"   => comp_less_ff <= '1'; -- rs1 negative, rs2 positive

          when "10"   => comp_less_ff <= '1'; -- rs1 negative, rs2 positive

          when "01"   => comp_less_ff <= '0'; -- rs1 positive, rs2 negative

          when "01"   => comp_less_ff <= '0'; -- rs1 positive, rs2 negative

          when "00"   => comp_less_ff <= cmp_ff(cmp_less_c); -- both positive (comparator result from main ALU)

          when "00"   => comp_less_ff <= cmp_ff(cmp_less_c); -- both positive (comparator result from main ALU)

          when "11"   => comp_less_ff <= not cmp_ff(cmp_less_c); -- both negative (comparator result from main ALU)

          when "11"   => comp_less_ff <= not cmp_ff(cmp_less_c); -- both negative (comparator result from main ALU)

          when others => comp_less_ff <= '0'; -- undefined

          when others => comp_less_ff <= '0'; -- undefined

        end case;

        end case;

      end if;

      end if;

      -- comparator latency --

      -- comparator latency --

      fu_compare.done <= fu_compare.start; -- for actual comparison operation

      fu_compare.done <= fu_compare.start; -- for actual comparison operation

      fu_min_max.done <= fu_min_max.start; -- for min/max operations

      fu_min_max.done <= fu_min_max.start; -- for min/max operations

    end if;

    end if;

  end process float_comparator;

  end process float_comparator;

  -- Comparison (FEQ/FLT/FLE) ---------------------------------------------------------------

  -- Comparison (FEQ/FLT/FLE) ---------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  float_comparison: process(fpu_operands, ctrl_i, comp_equal_ff, comp_less_ff)

  float_comparison: process(fpu_operands, ctrl_i, comp_equal_ff, comp_less_ff)

    variable snan_v : std_ulogic; -- at least one input is sNaN

    variable snan_v : std_ulogic; -- at least one input is sNaN

    variable qnan_v : std_ulogic; -- at least one input is qNaN

    variable qnan_v : std_ulogic; -- at least one input is qNaN

  begin

  begin

    -- check for NaN --

    -- check for NaN --

    snan_v := fpu_operands.rs1_class(fp_class_snan_c) or fpu_operands.rs2_class(fp_class_snan_c);

    snan_v := fpu_operands.rs1_class(fp_class_snan_c) or fpu_operands.rs2_class(fp_class_snan_c);

    qnan_v := fpu_operands.rs1_class(fp_class_qnan_c) or fpu_operands.rs2_class(fp_class_qnan_c);

    qnan_v := fpu_operands.rs1_class(fp_class_qnan_c) or fpu_operands.rs2_class(fp_class_qnan_c);

    -- condition evaluation --

    -- condition evaluation --

    fu_compare.result <= (others => '0');

    fu_compare.result <= (others => '0');

    case ctrl_i(ctrl_ir_funct3_1_c downto ctrl_ir_funct3_0_c) is

    case ctrl_i(ctrl_ir_funct3_1_c downto ctrl_ir_funct3_0_c) is

      when "00" => -- FLE: less than or equal

      when "00" => -- FLE: less than or equal

        fu_compare.result(0) <= (comp_less_ff or comp_equal_ff) and (not (snan_v or qnan_v)); -- result is zero if either input is NaN

        fu_compare.result(0) <= (comp_less_ff or comp_equal_ff) and (not (snan_v or qnan_v)); -- result is zero if either input is NaN

      when "01" => -- FLT: less than

      when "01" => -- FLT: less than

        fu_compare.result(0) <= comp_less_ff and (not (snan_v or qnan_v)); -- result is zero if either input is NaN

        fu_compare.result(0) <= comp_less_ff and (not (snan_v or qnan_v)); -- result is zero if either input is NaN

      when "10" => -- FEQ: equal

      when "10" => -- FEQ: equal

        fu_compare.result(0) <= comp_equal_ff and (not (snan_v or qnan_v)); -- result is zero if either input is NaN

        fu_compare.result(0) <= comp_equal_ff and (not (snan_v or qnan_v)); -- result is zero if either input is NaN

      when others => -- undefined

      when others => -- undefined

        fu_compare.result(0) <= '0';

        fu_compare.result(0) <= '0';

    end case;

    end case;

  end process float_comparison;

  end process float_comparison;

  -- latency --

  -- latency --

  -- -> done in "float_comparator"

  -- -> done in "float_comparator"

  -- exceptions --

  -- exceptions --

  fu_compare.flags <= (others => '0'); -- does not generate exceptions here, but normalizer can generate exceptions

  fu_compare.flags <= (others => '0'); -- does not generate exceptions here, but normalizer can generate exceptions

  -- Min/Max Select (FMIN/FMAX) -------------------------------------------------------------

  -- Min/Max Select (FMIN/FMAX) -------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  min_max_select: process(fpu_operands, comp_less_ff, fu_compare, ctrl_i)

  min_max_select: process(fpu_operands, comp_less_ff, fu_compare, ctrl_i)

    variable cond_v : std_ulogic_vector(2 downto 0);

    variable cond_v : std_ulogic_vector(2 downto 0);

  begin

  begin

    -- comparison result - check for special cases: -0 is less than +0

    -- comparison result - check for special cases: -0 is less than +0

    if ((fpu_operands.rs1_class(fp_class_neg_zero_c) = '1') and (fpu_operands.rs2_class(fp_class_pos_zero_c) = '1')) then

    if ((fpu_operands.rs1_class(fp_class_neg_zero_c) = '1') and (fpu_operands.rs2_class(fp_class_pos_zero_c) = '1')) then

      cond_v(0) := ctrl_i(ctrl_ir_funct3_0_c);

      cond_v(0) := ctrl_i(ctrl_ir_funct3_0_c);

    elsif ((fpu_operands.rs1_class(fp_class_pos_zero_c) = '1') and (fpu_operands.rs2_class(fp_class_neg_zero_c) = '1')) then

    elsif ((fpu_operands.rs1_class(fp_class_pos_zero_c) = '1') and (fpu_operands.rs2_class(fp_class_neg_zero_c) = '1')) then

      cond_v(0) := not ctrl_i(ctrl_ir_funct3_0_c);

      cond_v(0) := not ctrl_i(ctrl_ir_funct3_0_c);

    else -- "normal= comparison

    else -- "normal= comparison

      cond_v(0) := comp_less_ff xnor ctrl_i(ctrl_ir_funct3_0_c); -- min/max select

      cond_v(0) := comp_less_ff xnor ctrl_i(ctrl_ir_funct3_0_c); -- min/max select

    end if;

    end if;

    -- number NaN check --

    -- number NaN check --

    cond_v(2) := fpu_operands.rs1_class(fp_class_snan_c) or fpu_operands.rs1_class(fp_class_qnan_c);

    cond_v(2) := fpu_operands.rs1_class(fp_class_snan_c) or fpu_operands.rs1_class(fp_class_qnan_c);

    cond_v(1) := fpu_operands.rs2_class(fp_class_snan_c) or fpu_operands.rs2_class(fp_class_qnan_c);

    cond_v(1) := fpu_operands.rs2_class(fp_class_snan_c) or fpu_operands.rs2_class(fp_class_qnan_c);

    -- data output --

    -- data output --

    case cond_v is

    case cond_v is

      when "000"         => fu_min_max.result <= fpu_operands.rs1;

      when "000"         => fu_min_max.result <= fpu_operands.rs1;

      when "001"         => fu_min_max.result <= fpu_operands.rs2;

      when "001"         => fu_min_max.result <= fpu_operands.rs2;

      when "010" | "011" => fu_min_max.result <= fpu_operands.rs1; -- if one input is NaN output the non-NaN one

      when "010" | "011" => fu_min_max.result <= fpu_operands.rs1; -- if one input is NaN output the non-NaN one

      when "100" | "101" => fu_min_max.result <= fpu_operands.rs2; -- if one input is NaN output the non-NaN one

      when "100" | "101" => fu_min_max.result <= fpu_operands.rs2; -- if one input is NaN output the non-NaN one

      when others        => fu_min_max.result <= fp_single_qnan_c; -- output quiet NaN if both inputs are NaN

      when others        => fu_min_max.result <= fp_single_qnan_c; -- output quiet NaN if both inputs are NaN

    end case;

    end case;

  end process min_max_select;

  end process min_max_select;

  -- latency --

  -- latency --

  -- -> done in "float_comparator"

  -- -> done in "float_comparator"

  -- exceptions --

  -- exceptions --

  fu_min_max.flags <= (others => '0'); -- does not generate exceptions here, but normalizer can generate exceptions

  fu_min_max.flags <= (others => '0'); -- does not generate exceptions here, but normalizer can generate exceptions

  -- Convert: Float to [unsigned] Integer (FCVT.S.W) ----------------------------------------

  -- Convert: Float to [unsigned] Integer (FCVT.S.W) ----------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  neorv32_cpu_cp_fpu_f2i_inst: neorv32_cpu_cp_fpu_f2i

  neorv32_cpu_cp_fpu_f2i_inst: neorv32_cpu_cp_fpu_f2i

  port map (

  port map (

    -- control --

    -- control --

    clk_i      => clk_i,                          -- global clock, rising edge

    clk_i      => clk_i,                          -- global clock, rising edge

    rstn_i     => rstn_i,                         -- global reset, low-active, async

    rstn_i     => rstn_i,                         -- global reset, low-active, async

    start_i    => fu_conv_f2i.start,              -- trigger operation

    start_i    => fu_conv_f2i.start,              -- trigger operation

    rmode_i    => fpu_operands.frm,               -- rounding mode

    rmode_i    => fpu_operands.frm,               -- rounding mode

    funct_i    => ctrl_i(ctrl_ir_funct12_0_c),    -- 0=signed, 1=unsigned

    funct_i    => ctrl_i(ctrl_ir_funct12_0_c),    -- 0=signed, 1=unsigned

    -- input --

    -- input --

    sign_i     => fpu_operands.rs1(31),           -- sign

    sign_i     => fpu_operands.rs1(31),           -- sign

    exponent_i => fpu_operands.rs1(30 downto 23), -- exponent

    exponent_i => fpu_operands.rs1(30 downto 23), -- exponent

    mantissa_i => fpu_operands.rs1(22 downto 00), -- mantissa

    mantissa_i => fpu_operands.rs1(22 downto 00), -- mantissa

    class_i    => fpu_operands.rs1_class,         -- operand class

    class_i    => fpu_operands.rs1_class,         -- operand class

    -- output --

    -- output --

    result_o   => fu_conv_f2i.result,             -- integer result

    result_o   => fu_conv_f2i.result,             -- integer result

    flags_o    => fu_conv_f2i.flags,              -- exception flags

    flags_o    => fu_conv_f2i.flags,              -- exception flags

    done_o     => fu_conv_f2i.done                -- operation done

    done_o     => fu_conv_f2i.done                -- operation done

);

);

  -- Sign-Injection (FSGNJ) -----------------------------------------------------------------

  -- Sign-Injection (FSGNJ) -----------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  sign_injector: process(ctrl_i, fpu_operands)

  sign_injector: process(ctrl_i, fpu_operands)

  begin

  begin

    case ctrl_i(ctrl_ir_funct3_1_c downto ctrl_ir_funct3_0_c) is

    case ctrl_i(ctrl_ir_funct3_1_c downto ctrl_ir_funct3_0_c) is

      when "00"   => fu_sign_inject.result(31) <= fpu_operands.rs2(31); -- FSGNJ

      when "00"   => fu_sign_inject.result(31) <= fpu_operands.rs2(31); -- FSGNJ

      when "01"   => fu_sign_inject.result(31) <= not fpu_operands.rs2(31); -- FSGNJN

      when "01"   => fu_sign_inject.result(31) <= not fpu_operands.rs2(31); -- FSGNJN

      when "10"   => fu_sign_inject.result(31) <= fpu_operands.rs1(31) xor fpu_operands.rs2(31); -- FSGNJX

      when "10"   => fu_sign_inject.result(31) <= fpu_operands.rs1(31) xor fpu_operands.rs2(31); -- FSGNJX

      when others => fu_sign_inject.result(31) <= fpu_operands.rs2(31); -- undefined

      when others => fu_sign_inject.result(31) <= fpu_operands.rs2(31); -- undefined

    end case;

    end case;

    fu_sign_inject.result(30 downto 0) <= fpu_operands.rs1(30 downto 0);

    fu_sign_inject.result(30 downto 0) <= fpu_operands.rs1(30 downto 0);

    fu_sign_inject.flags <= (others => '0'); -- does not generate flags

    fu_sign_inject.flags <= (others => '0'); -- does not generate flags

  end process sign_injector;

  end process sign_injector;

  -- latency --

  -- latency --

  fu_sign_inject.done <= fu_sign_inject.start;

  fu_sign_inject.done <= fu_sign_inject.start;

  -- Convert: [unsigned] Integer to Float (FCVT.W.S) ----------------------------------------

  -- Convert: [unsigned] Integer to Float (FCVT.W.S) ----------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  convert_i2f: process(rstn_i, clk_i)

  convert_i2f: process(rstn_i, clk_i)

  begin

  begin

    -- this process only computes the absolute input value

    -- this process only computes the absolute input value

    -- the actual conversion is done by the normalizer

    -- the actual conversion is done by the normalizer

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      fu_conv_i2f.result <= (others => def_rst_val_c);

      fu_conv_i2f.result <= (others => def_rst_val_c);

      fu_conv_i2f.sign   <= def_rst_val_c;

      fu_conv_i2f.sign   <= def_rst_val_c;

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      if (ctrl_i(ctrl_ir_funct12_0_c) = '0') and (rs1_i(31) = '1') then -- convert signed integer

      if (ctrl_i(ctrl_ir_funct12_0_c) = '0') and (rs1_i(31) = '1') then -- convert signed integer

        fu_conv_i2f.result <= std_ulogic_vector(0 - unsigned(rs1_i));

        fu_conv_i2f.result <= std_ulogic_vector(0 - unsigned(rs1_i));

        fu_conv_i2f.sign   <= rs1_i(31); -- original sign

        fu_conv_i2f.sign   <= rs1_i(31); -- original sign

      else -- convert unsigned integer

      else -- convert unsigned integer

        fu_conv_i2f.result <= rs1_i;

        fu_conv_i2f.result <= rs1_i;

        fu_conv_i2f.sign   <= '0';

        fu_conv_i2f.sign   <= '0';

      end if;

      end if;

      fu_conv_i2f.done <= fu_conv_i2f.start; -- actual conversion is done by the normalizer unit

      fu_conv_i2f.done <= fu_conv_i2f.start; -- actual conversion is done by the normalizer unit

    end if;

    end if;

  end process convert_i2f;

  end process convert_i2f;

  -- Multiplier Core (FMUL) -----------------------------------------------------------------

  -- Multiplier Core (FMUL) -----------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  multiplier_core: process(rstn_i, clk_i)

  multiplier_core: process(rstn_i, clk_i)

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      multiplier.opa                <= (others => '-'); -- these might be DSP regs!

      multiplier.opa                <= (others => '-'); -- these might be DSP regs!

      multiplier.opb                <= (others => '-'); -- these might be DSP regs!

      multiplier.opb                <= (others => '-'); -- these might be DSP regs!

      multiplier.buf_ff             <= (others => '-'); -- these might be DSP regs!

      multiplier.buf_ff             <= (others => '-'); -- these might be DSP regs!

      multiplier.product            <= (others => '-'); -- these might be DSP regs!

      multiplier.product            <= (others => '-'); -- these might be DSP regs!

      multiplier.sign               <= def_rst_val_c;

      multiplier.sign               <= def_rst_val_c;

      multiplier.exp_res            <= (others => def_rst_val_c);

      multiplier.exp_res            <= (others => def_rst_val_c);

      multiplier.flags(fp_exc_of_c) <= def_rst_val_c;

      multiplier.flags(fp_exc_of_c) <= def_rst_val_c;

      multiplier.flags(fp_exc_uf_c) <= def_rst_val_c;

      multiplier.flags(fp_exc_uf_c) <= def_rst_val_c;

      multiplier.flags(fp_exc_nv_c) <= def_rst_val_c;

      multiplier.flags(fp_exc_nv_c) <= def_rst_val_c;

      multiplier.latency            <= (others => def_rst_val_c);

      multiplier.latency            <= (others => def_rst_val_c);

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- multiplier core --

      -- multiplier core --

      if (multiplier.start = '1') then -- FIXME / TODO remove buffer?

      if (multiplier.start = '1') then -- FIXME / TODO remove buffer?

        multiplier.opa <= unsigned('1' & fpu_operands.rs1(22 downto 0)); -- append hidden one

        multiplier.opa <= unsigned('1' & fpu_operands.rs1(22 downto 0)); -- append hidden one

        multiplier.opb <= unsigned('1' & fpu_operands.rs2(22 downto 0)); -- append hidden one

        multiplier.opb <= unsigned('1' & fpu_operands.rs2(22 downto 0)); -- append hidden one

      end if;

      end if;

      multiplier.buf_ff  <= multiplier.opa * multiplier.opb;

      multiplier.buf_ff  <= multiplier.opa * multiplier.opb;

      multiplier.product <= std_ulogic_vector(multiplier.buf_ff(47 downto 0)); -- let the register balancing do the magic here

      multiplier.product <= std_ulogic_vector(multiplier.buf_ff(47 downto 0)); -- let the register balancing do the magic here

      multiplier.sign    <= fpu_operands.rs1(31) xor fpu_operands.rs2(31); -- resulting sign

      multiplier.sign    <= fpu_operands.rs1(31) xor fpu_operands.rs2(31); -- resulting sign

      -- exponent computation --

      -- exponent computation --

      multiplier.exp_res <= std_ulogic_vector(unsigned('0' & multiplier.exp_sum) - 127);

      multiplier.exp_res <= std_ulogic_vector(unsigned('0' & multiplier.exp_sum) - 127);

      if (multiplier.exp_res(multiplier.exp_res'left) = '1') then -- underflow (exp_res is "negative")

      if (multiplier.exp_res(multiplier.exp_res'left) = '1') then -- underflow (exp_res is "negative")

        multiplier.flags(fp_exc_of_c) <= '0';

        multiplier.flags(fp_exc_of_c) <= '0';

        multiplier.flags(fp_exc_uf_c) <= '1';

        multiplier.flags(fp_exc_uf_c) <= '1';

      elsif (multiplier.exp_res(multiplier.exp_res'left-1) = '1') then -- overflow

      elsif (multiplier.exp_res(multiplier.exp_res'left-1) = '1') then -- overflow

        multiplier.flags(fp_exc_of_c) <= '1';

        multiplier.flags(fp_exc_of_c) <= '1';

        multiplier.flags(fp_exc_uf_c) <= '0';

        multiplier.flags(fp_exc_uf_c) <= '0';

      else

      else

        multiplier.flags(fp_exc_of_c) <= '0';

        multiplier.flags(fp_exc_of_c) <= '0';

        multiplier.flags(fp_exc_uf_c) <= '0';

        multiplier.flags(fp_exc_uf_c) <= '0';

      end if;

      end if;

      -- invalid operation --

      -- invalid operation --

      multiplier.flags(fp_exc_nv_c) <=

      multiplier.flags(fp_exc_nv_c) <=

        ((fpu_operands.rs1_class(fp_class_pos_zero_c) or fpu_operands.rs1_class(fp_class_neg_zero_c)) and

        ((fpu_operands.rs1_class(fp_class_pos_zero_c) or fpu_operands.rs1_class(fp_class_neg_zero_c)) and

         (fpu_operands.rs2_class(fp_class_pos_inf_c)  or fpu_operands.rs2_class(fp_class_neg_inf_c))) or -- mul(+/-zero, +/-inf)

         (fpu_operands.rs2_class(fp_class_pos_inf_c)  or fpu_operands.rs2_class(fp_class_neg_inf_c))) or -- mul(+/-zero, +/-inf)

        ((fpu_operands.rs1_class(fp_class_pos_inf_c)  or fpu_operands.rs1_class(fp_class_neg_inf_c)) and

        ((fpu_operands.rs1_class(fp_class_pos_inf_c)  or fpu_operands.rs1_class(fp_class_neg_inf_c)) and

         (fpu_operands.rs2_class(fp_class_pos_zero_c) or fpu_operands.rs2_class(fp_class_neg_zero_c))); -- mul(+/-inf, +/-zero)

         (fpu_operands.rs2_class(fp_class_pos_zero_c) or fpu_operands.rs2_class(fp_class_neg_zero_c))); -- mul(+/-inf, +/-zero)

      -- latency shift register --

      -- latency shift register --

      multiplier.latency <= multiplier.latency(multiplier.latency'left-1 downto 0) & multiplier.start;

      multiplier.latency <= multiplier.latency(multiplier.latency'left-1 downto 0) & multiplier.start;

    end if;

    end if;

  end process multiplier_core;

  end process multiplier_core;

  -- exponent sum --

  -- exponent sum --

  multiplier.exp_sum <= std_ulogic_vector(unsigned('0' & fpu_operands.rs1(30 downto 23)) + unsigned('0' & fpu_operands.rs2(30 downto 23)));

  multiplier.exp_sum <= std_ulogic_vector(unsigned('0' & fpu_operands.rs1(30 downto 23)) + unsigned('0' & fpu_operands.rs2(30 downto 23)));

  -- latency --

  -- latency --

  multiplier.start <= fu_mul.start;

  multiplier.start <= fu_mul.start;

  multiplier.done  <= multiplier.latency(multiplier.latency'left);

  multiplier.done  <= multiplier.latency(multiplier.latency'left);

  fu_mul.done      <= multiplier.done;

  fu_mul.done      <= multiplier.done;

  -- unused exception flags --

  -- unused exception flags --

  multiplier.flags(fp_exc_dz_c) <= '0'; -- division by zero: not possible here

  multiplier.flags(fp_exc_dz_c) <= '0'; -- division by zero: not possible here

  multiplier.flags(fp_exc_nx_c) <= '0'; -- inexcat: not possible here

  multiplier.flags(fp_exc_nx_c) <= '0'; -- inexcat: not possible here

  -- result class --

  -- result class --

  multiplier_class_core: process(rstn_i, clk_i)

  multiplier_class_core: process(rstn_i, clk_i)

    variable a_pos_norm_v, a_neg_norm_v, b_pos_norm_v, b_neg_norm_v : std_ulogic;

    variable a_pos_norm_v, a_neg_norm_v, b_pos_norm_v, b_neg_norm_v : std_ulogic;

    variable a_pos_subn_v, a_neg_subn_v, b_pos_subn_v, b_neg_subn_v : std_ulogic;

    variable a_pos_subn_v, a_neg_subn_v, b_pos_subn_v, b_neg_subn_v : std_ulogic;

    variable a_pos_zero_v, a_neg_zero_v, b_pos_zero_v, b_neg_zero_v : std_ulogic;

    variable a_pos_zero_v, a_neg_zero_v, b_pos_zero_v, b_neg_zero_v : std_ulogic;

    variable a_pos_inf_v,  a_neg_inf_v,  b_pos_inf_v,  b_neg_inf_v  : std_ulogic;

    variable a_pos_inf_v,  a_neg_inf_v,  b_pos_inf_v,  b_neg_inf_v  : std_ulogic;

    variable a_snan_v,     a_qnan_v,     b_snan_v,     b_qnan_v     : std_ulogic;

    variable a_snan_v,     a_qnan_v,     b_snan_v,     b_qnan_v     : std_ulogic;

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      multiplier.res_class(fp_class_pos_norm_c) <= def_rst_val_c;

      multiplier.res_class <= (others => def_rst_val_c);

      multiplier.res_class(fp_class_neg_norm_c) <= def_rst_val_c;

      multiplier.res_class(fp_class_pos_inf_c)  <= def_rst_val_c;

      multiplier.res_class(fp_class_neg_inf_c)  <= def_rst_val_c;

      multiplier.res_class(fp_class_pos_zero_c) <= def_rst_val_c;

      multiplier.res_class(fp_class_neg_zero_c) <= def_rst_val_c;

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- minions --

      -- minions --

      a_pos_norm_v := fpu_operands.rs1_class(fp_class_pos_norm_c);    b_pos_norm_v := fpu_operands.rs2_class(fp_class_pos_norm_c);

      a_pos_norm_v := fpu_operands.rs1_class(fp_class_pos_norm_c);    b_pos_norm_v := fpu_operands.rs2_class(fp_class_pos_norm_c);

      a_neg_norm_v := fpu_operands.rs1_class(fp_class_neg_norm_c);    b_neg_norm_v := fpu_operands.rs2_class(fp_class_neg_norm_c);

      a_neg_norm_v := fpu_operands.rs1_class(fp_class_neg_norm_c);    b_neg_norm_v := fpu_operands.rs2_class(fp_class_neg_norm_c);

      a_pos_subn_v := fpu_operands.rs1_class(fp_class_pos_denorm_c);  b_pos_subn_v := fpu_operands.rs2_class(fp_class_pos_denorm_c);

      a_pos_subn_v := fpu_operands.rs1_class(fp_class_pos_denorm_c);  b_pos_subn_v := fpu_operands.rs2_class(fp_class_pos_denorm_c);

      a_neg_subn_v := fpu_operands.rs1_class(fp_class_neg_denorm_c);  b_neg_subn_v := fpu_operands.rs2_class(fp_class_neg_denorm_c);

      a_neg_subn_v := fpu_operands.rs1_class(fp_class_neg_denorm_c);  b_neg_subn_v := fpu_operands.rs2_class(fp_class_neg_denorm_c);

      a_pos_zero_v := fpu_operands.rs1_class(fp_class_pos_zero_c);    b_pos_zero_v := fpu_operands.rs2_class(fp_class_pos_zero_c);

      a_pos_zero_v := fpu_operands.rs1_class(fp_class_pos_zero_c);    b_pos_zero_v := fpu_operands.rs2_class(fp_class_pos_zero_c);

      a_neg_zero_v := fpu_operands.rs1_class(fp_class_neg_zero_c);    b_neg_zero_v := fpu_operands.rs2_class(fp_class_neg_zero_c);

      a_neg_zero_v := fpu_operands.rs1_class(fp_class_neg_zero_c);    b_neg_zero_v := fpu_operands.rs2_class(fp_class_neg_zero_c);

      a_pos_inf_v  := fpu_operands.rs1_class(fp_class_pos_inf_c);     b_pos_inf_v  := fpu_operands.rs2_class(fp_class_pos_inf_c);

      a_pos_inf_v  := fpu_operands.rs1_class(fp_class_pos_inf_c);     b_pos_inf_v  := fpu_operands.rs2_class(fp_class_pos_inf_c);

      a_neg_inf_v  := fpu_operands.rs1_class(fp_class_neg_inf_c);     b_neg_inf_v  := fpu_operands.rs2_class(fp_class_neg_inf_c);

      a_neg_inf_v  := fpu_operands.rs1_class(fp_class_neg_inf_c);     b_neg_inf_v  := fpu_operands.rs2_class(fp_class_neg_inf_c);

      a_snan_v     := fpu_operands.rs1_class(fp_class_snan_c);        b_snan_v     := fpu_operands.rs2_class(fp_class_snan_c);

      a_snan_v     := fpu_operands.rs1_class(fp_class_snan_c);        b_snan_v     := fpu_operands.rs2_class(fp_class_snan_c);

      a_qnan_v     := fpu_operands.rs1_class(fp_class_qnan_c);        b_qnan_v     := fpu_operands.rs2_class(fp_class_qnan_c);

      a_qnan_v     := fpu_operands.rs1_class(fp_class_qnan_c);        b_qnan_v     := fpu_operands.rs2_class(fp_class_qnan_c);

      -- +normal --

      -- +normal --

      multiplier.res_class(fp_class_pos_norm_c) <=

      multiplier.res_class(fp_class_pos_norm_c) <=

        (a_pos_norm_v and b_pos_norm_v) or -- +norm * +norm

        (a_pos_norm_v and b_pos_norm_v) or -- +norm * +norm

        (a_neg_norm_v and b_neg_norm_v);   -- -norm * -norm

        (a_neg_norm_v and b_neg_norm_v);   -- -norm * -norm

      -- -normal --

      -- -normal --

      multiplier.res_class(fp_class_neg_norm_c) <=

      multiplier.res_class(fp_class_neg_norm_c) <=

        (a_pos_norm_v and b_neg_norm_v) or -- +norm * -norm

        (a_pos_norm_v and b_neg_norm_v) or -- +norm * -norm

        (a_neg_norm_v and b_pos_norm_v);   -- -norm * +norm

        (a_neg_norm_v and b_pos_norm_v);   -- -norm * +norm

      -- +infinity --

      -- +infinity --

      multiplier.res_class(fp_class_pos_inf_c) <=

      multiplier.res_class(fp_class_pos_inf_c) <=

        (a_pos_inf_v  and b_pos_inf_v)  or -- +inf    * +inf

        (a_pos_inf_v  and b_pos_inf_v)  or -- +inf    * +inf

        (a_neg_inf_v  and b_neg_inf_v)  or -- -inf    * -inf

        (a_neg_inf_v  and b_neg_inf_v)  or -- -inf    * -inf

        (a_pos_norm_v and b_pos_inf_v)  or -- +norm   * +inf

        (a_pos_norm_v and b_pos_inf_v)  or -- +norm   * +inf

        (a_pos_inf_v  and b_pos_norm_v) or -- +inf    * +norm

        (a_pos_inf_v  and b_pos_norm_v) or -- +inf    * +norm

        (a_neg_norm_v and b_neg_inf_v)  or -- -norm   * -inf

        (a_neg_norm_v and b_neg_inf_v)  or -- -norm   * -inf

        (a_neg_inf_v  and b_neg_norm_v) or -- -inf    * -norm

        (a_neg_inf_v  and b_neg_norm_v) or -- -inf    * -norm

        (a_neg_subn_v and b_neg_inf_v)  or -- -denorm * -inf

        (a_neg_subn_v and b_neg_inf_v)  or -- -denorm * -inf

        (a_neg_inf_v  and b_neg_subn_v);   -- -inf    * -denorm

        (a_neg_inf_v  and b_neg_subn_v);   -- -inf    * -denorm

      -- -infinity --

      -- -infinity --

      multiplier.res_class(fp_class_neg_inf_c) <=

      multiplier.res_class(fp_class_neg_inf_c) <=

        (a_pos_inf_v  and b_neg_inf_v)  or -- +inf    * -inf

        (a_pos_inf_v  and b_neg_inf_v)  or -- +inf    * -inf

        (a_neg_inf_v  and b_pos_inf_v)  or -- -inf    * +inf

        (a_neg_inf_v  and b_pos_inf_v)  or -- -inf    * +inf

        (a_pos_norm_v and b_neg_inf_v)  or -- +norm   * -inf

        (a_pos_norm_v and b_neg_inf_v)  or -- +norm   * -inf

        (a_neg_inf_v  and b_pos_norm_v) or -- -inf    * +norm

        (a_neg_inf_v  and b_pos_norm_v) or -- -inf    * +norm

        (a_neg_norm_v and b_pos_inf_v)  or -- -norm   * +inf

        (a_neg_norm_v and b_pos_inf_v)  or -- -norm   * +inf

        (a_pos_inf_v  and b_neg_norm_v) or -- +inf    * -norm

        (a_pos_inf_v  and b_neg_norm_v) or -- +inf    * -norm

        (a_pos_subn_v and b_neg_inf_v)  or -- +denorm * -inf

        (a_pos_subn_v and b_neg_inf_v)  or -- +denorm * -inf

        (a_neg_inf_v  and b_pos_subn_v) or -- -inf    * +de-norm

        (a_neg_inf_v  and b_pos_subn_v) or -- -inf    * +de-norm

        (a_neg_subn_v and b_pos_inf_v)  or -- -denorm * +inf

        (a_neg_subn_v and b_pos_inf_v)  or -- -denorm * +inf

        (a_pos_inf_v  and b_neg_subn_v);   -- +inf    * -de-norm

        (a_pos_inf_v  and b_neg_subn_v);   -- +inf    * -de-norm

      -- +zero --

      -- +zero --

      multiplier.res_class(fp_class_pos_zero_c) <=

      multiplier.res_class(fp_class_pos_zero_c) <=

        (a_pos_zero_v and b_pos_zero_v) or -- +zero   * +zero

        (a_pos_zero_v and b_pos_zero_v) or -- +zero   * +zero

        (a_pos_zero_v and b_pos_norm_v) or -- +zero   * +norm

        (a_pos_zero_v and b_pos_norm_v) or -- +zero   * +norm

        (a_pos_zero_v and b_pos_subn_v) or -- +zero   * +denorm

        (a_pos_zero_v and b_pos_subn_v) or -- +zero   * +denorm

        (a_neg_zero_v and b_neg_zero_v) or -- -zero   * -zero

        (a_neg_zero_v and b_neg_zero_v) or -- -zero   * -zero

        (a_neg_zero_v and b_neg_norm_v) or -- -zero   * -norm

        (a_neg_zero_v and b_neg_norm_v) or -- -zero   * -norm

        (a_neg_zero_v and b_neg_subn_v) or -- -zero   * -denorm

        (a_neg_zero_v and b_neg_subn_v) or -- -zero   * -denorm

        (a_pos_norm_v and b_pos_zero_v) or -- +norm   * +zero

        (a_pos_norm_v and b_pos_zero_v) or -- +norm   * +zero

        (a_pos_subn_v and b_pos_zero_v) or -- +denorm * +zero

        (a_pos_subn_v and b_pos_zero_v) or -- +denorm * +zero

        (a_neg_norm_v and b_neg_zero_v) or -- -norm   * -zero

        (a_neg_norm_v and b_neg_zero_v) or -- -norm   * -zero

        (a_neg_subn_v and b_neg_zero_v);   -- -denorm * -zero

        (a_neg_subn_v and b_neg_zero_v);   -- -denorm * -zero

      -- -zero --

      -- -zero --

      multiplier.res_class(fp_class_neg_zero_c) <=

      multiplier.res_class(fp_class_neg_zero_c) <=

        (a_pos_zero_v and b_neg_zero_v) or -- +zero   * -zero

        (a_pos_zero_v and b_neg_zero_v) or -- +zero   * -zero

        (a_pos_zero_v and b_neg_norm_v) or -- +zero   * -norm

        (a_pos_zero_v and b_neg_norm_v) or -- +zero   * -norm

        (a_pos_zero_v and b_neg_subn_v) or -- +zero   * -denorm

        (a_pos_zero_v and b_neg_subn_v) or -- +zero   * -denorm

        (a_neg_zero_v and b_pos_zero_v) or -- -zero   * +zero

        (a_neg_zero_v and b_pos_zero_v) or -- -zero   * +zero

        (a_neg_zero_v and b_pos_norm_v) or -- -zero   * +norm

        (a_neg_zero_v and b_pos_norm_v) or -- -zero   * +norm

        (a_neg_zero_v and b_pos_subn_v) or -- -zero   * +denorm

        (a_neg_zero_v and b_pos_subn_v) or -- -zero   * +denorm

        (a_neg_norm_v and b_pos_zero_v) or -- -norm   * +zero

        (a_neg_norm_v and b_pos_zero_v) or -- -norm   * +zero

        (a_neg_subn_v and b_pos_zero_v) or -- -denorm * +zero

        (a_neg_subn_v and b_pos_zero_v) or -- -denorm * +zero

        (a_pos_norm_v and b_neg_zero_v) or -- +norm   * -zero

        (a_pos_norm_v and b_neg_zero_v) or -- +norm   * -zero

        (a_pos_subn_v and b_neg_zero_v);   -- +denorm * -zero

        (a_pos_subn_v and b_neg_zero_v);   -- +denorm * -zero

      -- sNaN --

      -- sNaN --

      multiplier.res_class(fp_class_snan_c) <= (a_snan_v or b_snan_v); -- any input is sNaN

      multiplier.res_class(fp_class_snan_c) <= (a_snan_v or b_snan_v); -- any input is sNaN

      -- qNaN --

      -- qNaN --

      multiplier.res_class(fp_class_qnan_c) <=

      multiplier.res_class(fp_class_qnan_c) <=

        (a_snan_v or b_snan_v) or -- any input is sNaN

        (a_snan_v or b_snan_v) or -- any input is sNaN

        (a_qnan_v or b_qnan_v) or -- nay input is qNaN

        (a_qnan_v or b_qnan_v) or -- nay input is qNaN

        ((a_pos_inf_v  or a_neg_inf_v)  and (b_pos_zero_v or b_neg_zero_v)) or -- +/-inf * +/-zero

        ((a_pos_inf_v  or a_neg_inf_v)  and (b_pos_zero_v or b_neg_zero_v)) or -- +/-inf * +/-zero

        ((a_pos_zero_v or a_neg_zero_v) and (b_pos_inf_v  or b_neg_inf_v));    -- +/-zero * +/-inf

        ((a_pos_zero_v or a_neg_zero_v) and (b_pos_inf_v  or b_neg_inf_v));    -- +/-zero * +/-inf

    end if;

  end process multiplier_class_core;

  -- subnormal result --

      -- subnormal result --

  multiplier.res_class(fp_class_pos_denorm_c) <= '0'; -- is evaluated by the normalizer

      multiplier.res_class(fp_class_pos_denorm_c) <= '0'; -- is evaluated by the normalizer

  multiplier.res_class(fp_class_neg_denorm_c) <= '0'; -- is evaluated by the normalizer

  multiplier.res_class(fp_class_neg_denorm_c) <= '0'; -- is evaluated by the normalizer

    end if;

  end process multiplier_class_core;

  -- unused --

  -- unused --

  fu_mul.result <= (others => '0');

  fu_mul.result <= (others => '0');

  fu_mul.flags  <= (others => '0');

  fu_mul.flags  <= (others => '0');

  -- Adder/Subtractor Core (FADD, FSUB) -----------------------------------------------------

  -- Adder/Subtractor Core (FADD, FSUB) -----------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  adder_subtractor_core: process(rstn_i, clk_i)

  adder_subtractor_core: process(rstn_i, clk_i)

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      addsub.latency   <= (others => def_rst_val_c);

      addsub.latency   <= (others => def_rst_val_c);

      addsub.exp_comp  <= (others => def_rst_val_c);

      addsub.exp_comp  <= (others => def_rst_val_c);

      addsub.man_sreg  <= (others => def_rst_val_c);

      addsub.man_sreg  <= (others => def_rst_val_c);

      addsub.exp_cnt   <= (others => def_rst_val_c);

      addsub.exp_cnt   <= (others => def_rst_val_c);

      addsub.man_g_ext <= def_rst_val_c;

      addsub.man_g_ext <= def_rst_val_c;

      addsub.man_r_ext <= def_rst_val_c;

      addsub.man_r_ext <= def_rst_val_c;

      addsub.man_s_ext <= def_rst_val_c;

      addsub.man_s_ext <= def_rst_val_c;

      addsub.man_comp  <= def_rst_val_c;

      addsub.man_comp  <= def_rst_val_c;

      addsub.add_stage <= (others => def_rst_val_c);

      addsub.add_stage <= (others => def_rst_val_c);

      addsub.res_sign  <= def_rst_val_c;

      addsub.res_sign  <= def_rst_val_c;

      addsub.flags(fp_exc_nv_c) <= def_rst_val_c;

      addsub.flags(fp_exc_nv_c) <= def_rst_val_c;

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- arbitration / latency --

      -- arbitration / latency --

      if (ctrl_engine.state = S_IDLE) then -- hacky "reset"

      if (ctrl_engine.state = S_IDLE) then -- hacky "reset"

        addsub.latency <= (others => '0');

        addsub.latency <= (others => '0');

      else

      else

        addsub.latency(0) <= addsub.start; -- input comparator delay

        addsub.latency(0) <= addsub.start; -- input comparator delay

        if (addsub.latency(0) = '1') then

        if (addsub.latency(0) = '1') then

          addsub.latency(1) <= '1';

          addsub.latency(1) <= '1';

          addsub.latency(2) <= '0';

          addsub.latency(2) <= '0';

        elsif (addsub.exp_cnt(7 downto 0) = addsub.large_exp) then -- radix point not yet aligned

        elsif (addsub.exp_cnt(7 downto 0) = addsub.large_exp) then -- radix point not yet aligned

          addsub.latency(1) <= '0';

          addsub.latency(1) <= '0';

          addsub.latency(2) <= addsub.latency(1) and (not addsub.latency(0)); -- "shift done"

          addsub.latency(2) <= addsub.latency(1) and (not addsub.latency(0)); -- "shift done"

        end if;

        end if;

        addsub.latency(3) <= addsub.latency(2); -- adder stage

        addsub.latency(3) <= addsub.latency(2); -- adder stage

        addsub.latency(4) <= addsub.latency(3); -- final stage

        addsub.latency(4) <= addsub.latency(3); -- final stage

      end if;

      end if;

      -- exponent check: find smaller number (radix-offset-only) --

      -- exponent check: find smaller number (radix-offset-only) --

      if (unsigned(fpu_operands.rs1(30 downto 23)) < unsigned(fpu_operands.rs2(30 downto 23))) then

      if (unsigned(fpu_operands.rs1(30 downto 23)) < unsigned(fpu_operands.rs2(30 downto 23))) then

        addsub.exp_comp(0) <= '1'; -- rs1 < rs2

        addsub.exp_comp(0) <= '1'; -- rs1 < rs2

      else

      else

        addsub.exp_comp(0) <= '0'; -- rs1 >= rs2

        addsub.exp_comp(0) <= '0'; -- rs1 >= rs2

      end if;

      end if;

      if (unsigned(fpu_operands.rs1(30 downto 23)) = unsigned(fpu_operands.rs2(30 downto 23))) then

      if (unsigned(fpu_operands.rs1(30 downto 23)) = unsigned(fpu_operands.rs2(30 downto 23))) then

        addsub.exp_comp(1) <= '1'; -- rs1 == rs2

        addsub.exp_comp(1) <= '1'; -- rs1 == rs2

      else -- rs1 != rs2

      else -- rs1 != rs2

        addsub.exp_comp(1) <= '0';

        addsub.exp_comp(1) <= '0';

      end if;

      end if;

      -- shift right small mantissa to align radix point --

      -- shift right small mantissa to align radix point --

      if (addsub.latency(0) = '1') then

      if (addsub.latency(0) = '1') then

        if ((fpu_operands.rs1_class(fp_class_pos_zero_c) or fpu_operands.rs2_class(fp_class_pos_zero_c) or

        if ((fpu_operands.rs1_class(fp_class_pos_zero_c) or fpu_operands.rs2_class(fp_class_pos_zero_c) or

             fpu_operands.rs1_class(fp_class_neg_zero_c) or fpu_operands.rs2_class(fp_class_neg_zero_c)) = '0') then -- no input is zero

             fpu_operands.rs1_class(fp_class_neg_zero_c) or fpu_operands.rs2_class(fp_class_neg_zero_c)) = '0') then -- no input is zero

          addsub.man_sreg <= addsub.small_man;

          addsub.man_sreg <= addsub.small_man;

        else

        else

          addsub.man_sreg <= (others => '0');

          addsub.man_sreg <= (others => '0');

        end if;

        end if;

        addsub.exp_cnt   <= '0' & addsub.small_exp;

        addsub.exp_cnt   <= '0' & addsub.small_exp;

        addsub.man_g_ext <= '0';

        addsub.man_g_ext <= '0';

        addsub.man_r_ext <= '0';

        addsub.man_r_ext <= '0';

        addsub.man_s_ext <= '0';

        addsub.man_s_ext <= '0';

      elsif (addsub.exp_cnt(7 downto 0) /= addsub.large_exp) then -- shift right until same magnitude

      elsif (addsub.exp_cnt(7 downto 0) /= addsub.large_exp) then -- shift right until same magnitude

        addsub.man_sreg  <= '0' & addsub.man_sreg(addsub.man_sreg'left downto 1);

        addsub.man_sreg  <= '0' & addsub.man_sreg(addsub.man_sreg'left downto 1);

        addsub.man_g_ext <= addsub.man_sreg(0);

        addsub.man_g_ext <= addsub.man_sreg(0);

        addsub.man_r_ext <= addsub.man_g_ext;

        addsub.man_r_ext <= addsub.man_g_ext;

        addsub.man_s_ext <= addsub.man_s_ext or addsub.man_r_ext; -- sticky bit

        addsub.man_s_ext <= addsub.man_s_ext or addsub.man_r_ext; -- sticky bit

        addsub.exp_cnt   <= std_ulogic_vector(unsigned(addsub.exp_cnt) + 1);

        addsub.exp_cnt   <= std_ulogic_vector(unsigned(addsub.exp_cnt) + 1);

      end if;

      end if;

      -- mantissa check: find smaller number (magnitude-only) --

      -- mantissa check: find smaller number (magnitude-only) --

      if (unsigned(addsub.man_sreg) <= unsigned(addsub.large_man)) then

      if (unsigned(addsub.man_sreg) <= unsigned(addsub.large_man)) then

        addsub.man_comp <= '1';

        addsub.man_comp <= '1';

      else

      else

        addsub.man_comp <= '0';

        addsub.man_comp <= '0';

      end if;

      end if;

      -- actual addition/subtraction (incl. overflow) --

      -- actual addition/subtraction (incl. overflow) --

      if ((ctrl_i(ctrl_ir_funct12_7_c) xor (fpu_operands.rs1(31) xor fpu_operands.rs2(31))) = '0') then -- add

      if ((ctrl_i(ctrl_ir_funct12_7_c) xor (fpu_operands.rs1(31) xor fpu_operands.rs2(31))) = '0') then -- add

        addsub.add_stage <= std_ulogic_vector(unsigned('0' & addsub.man_l) + unsigned('0' & addsub.man_s));

        addsub.add_stage <= std_ulogic_vector(unsigned('0' & addsub.man_l) + unsigned('0' & addsub.man_s));

      else -- sub

      else -- sub

        addsub.add_stage <= std_ulogic_vector(unsigned('0' & addsub.man_l) - unsigned('0' & addsub.man_s));

        addsub.add_stage <= std_ulogic_vector(unsigned('0' & addsub.man_l) - unsigned('0' & addsub.man_s));

      end if;

      end if;

      -- result sign --

      -- result sign --

      if (ctrl_i(ctrl_ir_funct12_7_c) = '0') then -- add

      if (ctrl_i(ctrl_ir_funct12_7_c) = '0') then -- add

        if (fpu_operands.rs1(31) = fpu_operands.rs2(31)) then -- identical signs

        if (fpu_operands.rs1(31) = fpu_operands.rs2(31)) then -- identical signs

          addsub.res_sign <= fpu_operands.rs1(31);

          addsub.res_sign <= fpu_operands.rs1(31);

        else -- different signs

        else -- different signs

          if (addsub.exp_comp(1) = '1') then -- exp are equal (also check relation of mantissas)

          if (addsub.exp_comp(1) = '1') then -- exp are equal (also check relation of mantissas)

            addsub.res_sign <= fpu_operands.rs1(31) xor (not addsub.man_comp);

            addsub.res_sign <= fpu_operands.rs1(31) xor (not addsub.man_comp);

          else

          else

            addsub.res_sign <= fpu_operands.rs1(31) xor addsub.exp_comp(0);

            addsub.res_sign <= fpu_operands.rs1(31) xor addsub.exp_comp(0);

          end if;

          end if;

        end if;

        end if;

      else -- sub

      else -- sub

        if (fpu_operands.rs1(31) = fpu_operands.rs2(31)) then -- identical signs

        if (fpu_operands.rs1(31) = fpu_operands.rs2(31)) then -- identical signs

          if (addsub.exp_comp(1) = '1') then -- exp are equal (also check relation of mantissas)

          if (addsub.exp_comp(1) = '1') then -- exp are equal (also check relation of mantissas)

            addsub.res_sign <= fpu_operands.rs1(31) xor (not addsub.man_comp);

            addsub.res_sign <= fpu_operands.rs1(31) xor (not addsub.man_comp);

          else

          else

            addsub.res_sign <= fpu_operands.rs1(31) xor addsub.exp_comp(0);

            addsub.res_sign <= fpu_operands.rs1(31) xor addsub.exp_comp(0);

          end if;

          end if;

        else -- different signs

        else -- different signs

          addsub.res_sign <= fpu_operands.rs1(31);

          addsub.res_sign <= fpu_operands.rs1(31);

        end if;

        end if;

      end if;

      end if;

      -- exception flags --

      -- exception flags --

      addsub.flags(fp_exc_nv_c) <= ((fpu_operands.rs1_class(fp_class_pos_inf_c) or fpu_operands.rs1_class(fp_class_neg_inf_c)) and

      addsub.flags(fp_exc_nv_c) <= ((fpu_operands.rs1_class(fp_class_pos_inf_c) or fpu_operands.rs1_class(fp_class_neg_inf_c)) and

                                    (fpu_operands.rs2_class(fp_class_pos_inf_c) or fpu_operands.rs2_class(fp_class_neg_inf_c))); -- +/-inf +/- +/-inf

                                    (fpu_operands.rs2_class(fp_class_pos_inf_c) or fpu_operands.rs2_class(fp_class_neg_inf_c))); -- +/-inf +/- +/-inf

    end if;

    end if;

  end process adder_subtractor_core;

  end process adder_subtractor_core;

  -- exceptions - unused --

  -- exceptions - unused --

  addsub.flags(fp_exc_dz_c) <= '0'; -- division by zero -> not possible

  addsub.flags(fp_exc_dz_c) <= '0'; -- division by zero -> not possible

  addsub.flags(fp_exc_of_c) <= '0'; -- not possible here (but may occur in normalizer)

  addsub.flags(fp_exc_of_c) <= '0'; -- not possible here (but may occur in normalizer)

  addsub.flags(fp_exc_uf_c) <= '0'; -- not possible here (but may occur in normalizer)

  addsub.flags(fp_exc_uf_c) <= '0'; -- not possible here (but may occur in normalizer)

  addsub.flags(fp_exc_nx_c) <= '0'; -- not possible here (but may occur in normalizer)

  addsub.flags(fp_exc_nx_c) <= '0'; -- not possible here (but may occur in normalizer)

  -- exponent check: find smaller number (magnitude-only) --

  -- exponent check: find smaller number (magnitude-only) --

  addsub.small_exp <=        fpu_operands.rs1(30 downto 23)  when (addsub.exp_comp(0) = '1') else        fpu_operands.rs2(30 downto 23);

  addsub.small_exp <=        fpu_operands.rs1(30 downto 23)  when (addsub.exp_comp(0) = '1') else        fpu_operands.rs2(30 downto 23);

  addsub.large_exp <=        fpu_operands.rs2(30 downto 23)  when (addsub.exp_comp(0) = '1') else        fpu_operands.rs1(30 downto 23);

  addsub.large_exp <=        fpu_operands.rs2(30 downto 23)  when (addsub.exp_comp(0) = '1') else        fpu_operands.rs1(30 downto 23);

  addsub.small_man <= ('1' & fpu_operands.rs1(22 downto 00)) when (addsub.exp_comp(0) = '1') else ('1' & fpu_operands.rs2(22 downto 00));

  addsub.small_man <= ('1' & fpu_operands.rs1(22 downto 00)) when (addsub.exp_comp(0) = '1') else ('1' & fpu_operands.rs2(22 downto 00));

  addsub.large_man <= ('1' & fpu_operands.rs2(22 downto 00)) when (addsub.exp_comp(0) = '1') else ('1' & fpu_operands.rs1(22 downto 00));

  addsub.large_man <= ('1' & fpu_operands.rs2(22 downto 00)) when (addsub.exp_comp(0) = '1') else ('1' & fpu_operands.rs1(22 downto 00));

  -- mantissa check: find smaller number (magnitude-only) --

  -- mantissa check: find smaller number (magnitude-only) --

  addsub.man_s <= (addsub.man_sreg & addsub.man_g_ext & addsub.man_r_ext & addsub.man_s_ext) when (addsub.man_comp = '1') else (addsub.large_man & "000");

  addsub.man_s <= (addsub.man_sreg & addsub.man_g_ext & addsub.man_r_ext & addsub.man_s_ext) when (addsub.man_comp = '1') else (addsub.large_man & "000");

  addsub.man_l <= (addsub.large_man & "000") when (addsub.man_comp = '1') else (addsub.man_sreg & addsub.man_g_ext & addsub.man_r_ext & addsub.man_s_ext);

  addsub.man_l <= (addsub.large_man & "000") when (addsub.man_comp = '1') else (addsub.man_sreg & addsub.man_g_ext & addsub.man_r_ext & addsub.man_s_ext);

  -- latency --

  -- latency --

  addsub.start   <= fu_addsub.start;

  addsub.start   <= fu_addsub.start;

  addsub.done    <= addsub.latency(addsub.latency'left);

  addsub.done    <= addsub.latency(addsub.latency'left);

  fu_addsub.done <= addsub.done;

  fu_addsub.done <= addsub.done;

  -- mantissa result --

  -- mantissa result --

  addsub.res_sum <= addsub.add_stage(27 downto 0);

  addsub.res_sum <= addsub.add_stage(27 downto 0);

  -- result class --

  -- result class --

  adder_subtractor_class_core: process(rstn_i, clk_i)

  adder_subtractor_class_core: process(rstn_i, clk_i)

    variable a_pos_norm_v, a_neg_norm_v, b_pos_norm_v, b_neg_norm_v : std_ulogic;

    variable a_pos_norm_v, a_neg_norm_v, b_pos_norm_v, b_neg_norm_v : std_ulogic;

    variable a_pos_subn_v, a_neg_subn_v, b_pos_subn_v, b_neg_subn_v : std_ulogic;

    variable a_pos_subn_v, a_neg_subn_v, b_pos_subn_v, b_neg_subn_v : std_ulogic;

    variable a_pos_zero_v, a_neg_zero_v, b_pos_zero_v, b_neg_zero_v : std_ulogic;

    variable a_pos_zero_v, a_neg_zero_v, b_pos_zero_v, b_neg_zero_v : std_ulogic;

    variable a_pos_inf_v,  a_neg_inf_v,  b_pos_inf_v,  b_neg_inf_v  : std_ulogic;

    variable a_pos_inf_v,  a_neg_inf_v,  b_pos_inf_v,  b_neg_inf_v  : std_ulogic;

    variable a_snan_v,     a_qnan_v,     b_snan_v,     b_qnan_v     : std_ulogic;

    variable a_snan_v,     a_qnan_v,     b_snan_v,     b_qnan_v     : std_ulogic;

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      addsub.res_class(fp_class_pos_inf_c)  <= def_rst_val_c;

      addsub.res_class <= (others => def_rst_val_c);

      addsub.res_class(fp_class_neg_inf_c)  <= def_rst_val_c;

      addsub.res_class(fp_class_pos_zero_c) <= def_rst_val_c;

      addsub.res_class(fp_class_neg_zero_c) <= def_rst_val_c;

      addsub.res_class(fp_class_qnan_c)     <= def_rst_val_c;

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- minions --

      -- minions --

      a_pos_norm_v := fpu_operands.rs1_class(fp_class_pos_norm_c);    b_pos_norm_v := fpu_operands.rs2_class(fp_class_pos_norm_c);

      a_pos_norm_v := fpu_operands.rs1_class(fp_class_pos_norm_c);    b_pos_norm_v := fpu_operands.rs2_class(fp_class_pos_norm_c);

      a_neg_norm_v := fpu_operands.rs1_class(fp_class_neg_norm_c);    b_neg_norm_v := fpu_operands.rs2_class(fp_class_neg_norm_c);

      a_neg_norm_v := fpu_operands.rs1_class(fp_class_neg_norm_c);    b_neg_norm_v := fpu_operands.rs2_class(fp_class_neg_norm_c);

      a_pos_subn_v := fpu_operands.rs1_class(fp_class_pos_denorm_c);  b_pos_subn_v := fpu_operands.rs2_class(fp_class_pos_denorm_c);

      a_pos_subn_v := fpu_operands.rs1_class(fp_class_pos_denorm_c);  b_pos_subn_v := fpu_operands.rs2_class(fp_class_pos_denorm_c);

      a_neg_subn_v := fpu_operands.rs1_class(fp_class_neg_denorm_c);  b_neg_subn_v := fpu_operands.rs2_class(fp_class_neg_denorm_c);

      a_neg_subn_v := fpu_operands.rs1_class(fp_class_neg_denorm_c);  b_neg_subn_v := fpu_operands.rs2_class(fp_class_neg_denorm_c);

      a_pos_zero_v := fpu_operands.rs1_class(fp_class_pos_zero_c);    b_pos_zero_v := fpu_operands.rs2_class(fp_class_pos_zero_c);

      a_pos_zero_v := fpu_operands.rs1_class(fp_class_pos_zero_c);    b_pos_zero_v := fpu_operands.rs2_class(fp_class_pos_zero_c);

      a_neg_zero_v := fpu_operands.rs1_class(fp_class_neg_zero_c);    b_neg_zero_v := fpu_operands.rs2_class(fp_class_neg_zero_c);

      a_neg_zero_v := fpu_operands.rs1_class(fp_class_neg_zero_c);    b_neg_zero_v := fpu_operands.rs2_class(fp_class_neg_zero_c);

      a_pos_inf_v  := fpu_operands.rs1_class(fp_class_pos_inf_c);     b_pos_inf_v  := fpu_operands.rs2_class(fp_class_pos_inf_c);

      a_pos_inf_v  := fpu_operands.rs1_class(fp_class_pos_inf_c);     b_pos_inf_v  := fpu_operands.rs2_class(fp_class_pos_inf_c);

      a_neg_inf_v  := fpu_operands.rs1_class(fp_class_neg_inf_c);     b_neg_inf_v  := fpu_operands.rs2_class(fp_class_neg_inf_c);

      a_neg_inf_v  := fpu_operands.rs1_class(fp_class_neg_inf_c);     b_neg_inf_v  := fpu_operands.rs2_class(fp_class_neg_inf_c);

      a_snan_v     := fpu_operands.rs1_class(fp_class_snan_c);        b_snan_v     := fpu_operands.rs2_class(fp_class_snan_c);

      a_snan_v     := fpu_operands.rs1_class(fp_class_snan_c);        b_snan_v     := fpu_operands.rs2_class(fp_class_snan_c);

      a_qnan_v     := fpu_operands.rs1_class(fp_class_qnan_c);        b_qnan_v     := fpu_operands.rs2_class(fp_class_qnan_c);

      a_qnan_v     := fpu_operands.rs1_class(fp_class_qnan_c);        b_qnan_v     := fpu_operands.rs2_class(fp_class_qnan_c);

      if (ctrl_i(ctrl_ir_funct12_7_c) = '0') then -- addition

      if (ctrl_i(ctrl_ir_funct12_7_c) = '0') then -- addition

        -- +infinity --

        -- +infinity --

        addsub.res_class(fp_class_pos_inf_c) <=

        addsub.res_class(fp_class_pos_inf_c) <=

          (a_pos_inf_v  and b_pos_inf_v)  or -- +inf    + +inf

          (a_pos_inf_v  and b_pos_inf_v)  or -- +inf    + +inf

          (a_pos_inf_v  and b_pos_zero_v) or -- +inf    + +zero

          (a_pos_inf_v  and b_pos_zero_v) or -- +inf    + +zero

          (a_pos_zero_v and b_pos_inf_v)  or -- +zero   + +inf

          (a_pos_zero_v and b_pos_inf_v)  or -- +zero   + +inf

          (a_pos_inf_v  and b_neg_zero_v) or -- +inf    + -zero

          (a_pos_inf_v  and b_neg_zero_v) or -- +inf    + -zero

          (a_neg_zero_v and b_pos_inf_v)  or -- -zero   + +inf

          (a_neg_zero_v and b_pos_inf_v)  or -- -zero   + +inf

--

--

          (a_pos_inf_v  and b_pos_norm_v) or -- +inf    + +norm

          (a_pos_inf_v  and b_pos_norm_v) or -- +inf    + +norm

          (a_pos_norm_v and b_pos_inf_v)  or -- +norm   + +inf

          (a_pos_norm_v and b_pos_inf_v)  or -- +norm   + +inf

          (a_pos_inf_v  and b_pos_subn_v) or -- +inf    + +denorm

          (a_pos_inf_v  and b_pos_subn_v) or -- +inf    + +denorm

          (a_pos_subn_v and b_pos_inf_v)  or -- +denorm + +inf

          (a_pos_subn_v and b_pos_inf_v)  or -- +denorm + +inf

--

--

          (a_pos_inf_v  and b_neg_norm_v) or -- +inf    + -norm

          (a_pos_inf_v  and b_neg_norm_v) or -- +inf    + -norm

          (a_neg_norm_v and b_pos_inf_v)  or -- -norm   + +inf

          (a_neg_norm_v and b_pos_inf_v)  or -- -norm   + +inf

          (a_pos_inf_v  and b_neg_subn_v) or -- +inf    + -denorm

          (a_pos_inf_v  and b_neg_subn_v) or -- +inf    + -denorm

          (a_neg_subn_v and b_pos_inf_v);    -- -denorm + +inf

          (a_neg_subn_v and b_pos_inf_v);    -- -denorm + +inf

        -- -infinity --

        -- -infinity --

        addsub.res_class(fp_class_neg_inf_c) <=

        addsub.res_class(fp_class_neg_inf_c) <=

          (a_neg_inf_v  and b_neg_inf_v)  or -- -inf    + -inf

          (a_neg_inf_v  and b_neg_inf_v)  or -- -inf    + -inf

          (a_neg_inf_v  and b_pos_zero_v) or -- -inf    + +zero

          (a_neg_inf_v  and b_pos_zero_v) or -- -inf    + +zero

          (a_pos_zero_v and b_neg_inf_v)  or -- +zero   + -inf

          (a_pos_zero_v and b_neg_inf_v)  or -- +zero   + -inf

          (a_neg_inf_v  and b_neg_zero_v) or -- -inf    + -zero

          (a_neg_inf_v  and b_neg_zero_v) or -- -inf    + -zero

          (a_neg_zero_v and b_neg_inf_v)  or -- -zero   + -inf

          (a_neg_zero_v and b_neg_inf_v)  or -- -zero   + -inf

--

--

          (a_neg_inf_v  and b_pos_norm_v) or -- -inf    + +norm

          (a_neg_inf_v  and b_pos_norm_v) or -- -inf    + +norm

          (a_pos_norm_v and b_neg_inf_v)  or -- +norm   + -inf

          (a_pos_norm_v and b_neg_inf_v)  or -- +norm   + -inf

          (a_neg_inf_v  and b_neg_norm_v) or -- -inf    + -norm

          (a_neg_inf_v  and b_neg_norm_v) or -- -inf    + -norm

          (a_neg_norm_v and b_neg_inf_v)  or -- -norm   + -inf

          (a_neg_norm_v and b_neg_inf_v)  or -- -norm   + -inf

--

--

          (a_neg_inf_v  and b_pos_subn_v) or -- -inf    + +denorm

          (a_neg_inf_v  and b_pos_subn_v) or -- -inf    + +denorm

          (a_pos_subn_v and b_neg_inf_v)  or -- +denorm + -inf

          (a_pos_subn_v and b_neg_inf_v)  or -- +denorm + -inf

          (a_neg_inf_v  and b_neg_subn_v) or -- -inf    + -denorm

          (a_neg_inf_v  and b_neg_subn_v) or -- -inf    + -denorm

          (a_neg_subn_v and b_neg_inf_v);    -- -denorm + -inf

          (a_neg_subn_v and b_neg_inf_v);    -- -denorm + -inf

        -- +zero --

        -- +zero --

        addsub.res_class(fp_class_pos_zero_c) <=

        addsub.res_class(fp_class_pos_zero_c) <=

          (a_pos_zero_v and b_pos_zero_v) or -- +zero + +zero

          (a_pos_zero_v and b_pos_zero_v) or -- +zero + +zero

          (a_pos_zero_v and b_neg_zero_v) or -- +zero + -zero

          (a_pos_zero_v and b_neg_zero_v) or -- +zero + -zero

          (a_neg_zero_v and b_pos_zero_v);   -- -zero + +zero

          (a_neg_zero_v and b_pos_zero_v);   -- -zero + +zero

        -- -zero --

        -- -zero --

        addsub.res_class(fp_class_neg_zero_c) <=

        addsub.res_class(fp_class_neg_zero_c) <=

          (a_neg_zero_v and b_neg_zero_v);   -- -zero + -zero

          (a_neg_zero_v and b_neg_zero_v);   -- -zero + -zero

        -- qNaN --

        -- qNaN --

        addsub.res_class(fp_class_qnan_c) <=

        addsub.res_class(fp_class_qnan_c) <=

          (a_snan_v    or  b_snan_v)    or -- any input is sNaN

          (a_snan_v    or  b_snan_v)    or -- any input is sNaN

          (a_qnan_v    or  b_qnan_v)    or -- any input is qNaN

          (a_qnan_v    or  b_qnan_v)    or -- any input is qNaN

          (a_pos_inf_v and b_neg_inf_v) or -- +inf + -inf

          (a_pos_inf_v and b_neg_inf_v) or -- +inf + -inf

          (a_neg_inf_v and b_pos_inf_v);   -- -inf + +inf

          (a_neg_inf_v and b_pos_inf_v);   -- -inf + +inf

      else -- subtraction

      else -- subtraction

        -- +infinity --

        -- +infinity --

        addsub.res_class(fp_class_pos_inf_c) <=

        addsub.res_class(fp_class_pos_inf_c) <=

          (a_pos_inf_v  and b_neg_inf_v)  or -- +inf    - -inf

          (a_pos_inf_v  and b_neg_inf_v)  or -- +inf    - -inf

          (a_pos_inf_v  and b_pos_zero_v) or -- +inf    - +zero

          (a_pos_inf_v  and b_pos_zero_v) or -- +inf    - +zero

          (a_pos_inf_v  and b_neg_zero_v) or -- +inf    - -zero

          (a_pos_inf_v  and b_neg_zero_v) or -- +inf    - -zero

          (a_pos_inf_v  and b_pos_norm_v) or -- +inf    - +norm

          (a_pos_inf_v  and b_pos_norm_v) or -- +inf    - +norm

          (a_pos_inf_v  and b_pos_subn_v) or -- +inf    - +denorm

          (a_pos_inf_v  and b_pos_subn_v) or -- +inf    - +denorm

          (a_pos_inf_v  and b_neg_norm_v) or -- +inf    - -norm

          (a_pos_inf_v  and b_neg_norm_v) or -- +inf    - -norm

          (a_pos_inf_v  and b_neg_subn_v) or -- +inf    - -denorm

          (a_pos_inf_v  and b_neg_subn_v) or -- +inf    - -denorm

--

--

          (a_pos_zero_v and b_neg_inf_v)  or -- +zero   - -inf

          (a_pos_zero_v and b_neg_inf_v)  or -- +zero   - -inf

          (a_neg_zero_v and b_neg_inf_v)  or -- -zero   - -inf

          (a_neg_zero_v and b_neg_inf_v)  or -- -zero   - -inf

--

--

          (a_pos_norm_v and b_neg_inf_v)  or -- +norm   - -inf

          (a_pos_norm_v and b_neg_inf_v)  or -- +norm   - -inf

          (a_pos_subn_v and b_neg_inf_v)  or -- +denorm - -inf

          (a_pos_subn_v and b_neg_inf_v)  or -- +denorm - -inf

          (a_neg_norm_v and b_neg_inf_v)  or -- -norm   - -inf

          (a_neg_norm_v and b_neg_inf_v)  or -- -norm   - -inf

          (a_neg_subn_v and b_neg_inf_v);    -- -denorm - -inf

          (a_neg_subn_v and b_neg_inf_v);    -- -denorm - -inf

        -- -infinity --

        -- -infinity --

        addsub.res_class(fp_class_neg_inf_c) <=

        addsub.res_class(fp_class_neg_inf_c) <=

          (a_neg_inf_v  and b_pos_inf_v)  or -- -inf    - +inf

          (a_neg_inf_v  and b_pos_inf_v)  or -- -inf    - +inf

          (a_neg_inf_v  and b_pos_zero_v) or -- -inf    - +zero

          (a_neg_inf_v  and b_pos_zero_v) or -- -inf    - +zero

          (a_neg_inf_v  and b_neg_zero_v) or -- -inf    - -zero

          (a_neg_inf_v  and b_neg_zero_v) or -- -inf    - -zero

          (a_neg_inf_v  and b_pos_norm_v) or -- -inf    - +norm

          (a_neg_inf_v  and b_pos_norm_v) or -- -inf    - +norm

          (a_neg_inf_v  and b_pos_subn_v) or -- -inf    - +denorm

          (a_neg_inf_v  and b_pos_subn_v) or -- -inf    - +denorm

          (a_neg_inf_v  and b_neg_norm_v) or -- -inf    - -norm

          (a_neg_inf_v  and b_neg_norm_v) or -- -inf    - -norm

          (a_neg_inf_v  and b_neg_subn_v) or -- -inf    - -denorm

          (a_neg_inf_v  and b_neg_subn_v) or -- -inf    - -denorm

--

--

          (a_pos_zero_v and b_pos_inf_v)  or -- +zero   - +inf

          (a_pos_zero_v and b_pos_inf_v)  or -- +zero   - +inf

          (a_neg_zero_v and b_pos_inf_v)  or -- -zero   - +inf

          (a_neg_zero_v and b_pos_inf_v)  or -- -zero   - +inf

--

--

          (a_pos_norm_v and b_pos_inf_v)  or -- +norm   - +inf

          (a_pos_norm_v and b_pos_inf_v)  or -- +norm   - +inf

          (a_pos_subn_v and b_pos_inf_v)  or -- +denorm - +inf

          (a_pos_subn_v and b_pos_inf_v)  or -- +denorm - +inf

          (a_neg_norm_v and b_pos_inf_v)  or -- -norm   - +inf

          (a_neg_norm_v and b_pos_inf_v)  or -- -norm   - +inf

          (a_neg_subn_v and b_pos_inf_v);    -- -denorm - +inf

          (a_neg_subn_v and b_pos_inf_v);    -- -denorm - +inf

        -- +zero --

        -- +zero --

        addsub.res_class(fp_class_pos_zero_c) <=

        addsub.res_class(fp_class_pos_zero_c) <=

          (a_pos_zero_v and b_pos_zero_v) or -- +zero - +zero

          (a_pos_zero_v and b_pos_zero_v) or -- +zero - +zero

          (a_pos_zero_v and b_neg_zero_v) or -- +zero - -zero

          (a_pos_zero_v and b_neg_zero_v) or -- +zero - -zero

          (a_neg_zero_v and b_neg_zero_v);   -- -zero - -zero

          (a_neg_zero_v and b_neg_zero_v);   -- -zero - -zero

        -- -zero --

        -- -zero --

        addsub.res_class(fp_class_neg_zero_c) <=

        addsub.res_class(fp_class_neg_zero_c) <=

          (a_neg_zero_v and b_pos_zero_v);   -- -zero - +zero

          (a_neg_zero_v and b_pos_zero_v);   -- -zero - +zero

        -- qNaN --

        -- qNaN --

        addsub.res_class(fp_class_qnan_c) <=

        addsub.res_class(fp_class_qnan_c) <=

          (a_snan_v    or  b_snan_v)    or -- any input is sNaN

          (a_snan_v    or  b_snan_v)    or -- any input is sNaN

          (a_qnan_v    or  b_qnan_v)    or -- any input is qNaN

          (a_qnan_v    or  b_qnan_v)    or -- any input is qNaN

          (a_pos_inf_v and b_pos_inf_v) or -- +inf - +inf

          (a_pos_inf_v and b_pos_inf_v) or -- +inf - +inf

          (a_neg_inf_v and b_neg_inf_v);   -- -inf - -inf

          (a_neg_inf_v and b_neg_inf_v);   -- -inf - -inf

      end if;

      end if;

      -- normal --

      -- normal --

      addsub.res_class(fp_class_pos_norm_c) <= (a_pos_norm_v or a_neg_norm_v) and (b_pos_norm_v or b_neg_norm_v); -- +/-norm +/- +-/norm [sign is irrelevant here]

      addsub.res_class(fp_class_pos_norm_c) <= (a_pos_norm_v or a_neg_norm_v) and (b_pos_norm_v or b_neg_norm_v); -- +/-norm +/- +-/norm [sign is irrelevant here]

      addsub.res_class(fp_class_neg_norm_c) <= (a_pos_norm_v or a_neg_norm_v) and (b_pos_norm_v or b_neg_norm_v); -- +/-norm +/- +-/norm [sign is irrelevant here]

      addsub.res_class(fp_class_neg_norm_c) <= (a_pos_norm_v or a_neg_norm_v) and (b_pos_norm_v or b_neg_norm_v); -- +/-norm +/- +-/norm [sign is irrelevant here]

      -- sNaN --

      -- sNaN --

      addsub.res_class(fp_class_snan_c) <= (a_snan_v or b_snan_v); -- any input is sNaN

      addsub.res_class(fp_class_snan_c) <= (a_snan_v or b_snan_v); -- any input is sNaN

    end if;

  end process adder_subtractor_class_core;

  -- subnormal result --

      -- subnormal result --

  addsub.res_class(fp_class_pos_denorm_c) <= '0'; -- is evaluated by the normalizer

      addsub.res_class(fp_class_pos_denorm_c) <= '0'; -- is evaluated by the normalizer

  addsub.res_class(fp_class_neg_denorm_c) <= '0'; -- is evaluated by the normalizer

  addsub.res_class(fp_class_neg_denorm_c) <= '0'; -- is evaluated by the normalizer

    end if;

  end process adder_subtractor_class_core;

  -- unused --

  -- unused --

  fu_addsub.result <= (others => '0');

  fu_addsub.result <= (others => '0');

  fu_addsub.flags  <= (others => '0');

  fu_addsub.flags  <= (others => '0');

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

-- FPU Core - Normalize & Round

-- FPU Core - Normalize & Round

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

  -- Normalizer Input -----------------------------------------------------------------------

  -- Normalizer Input -----------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  normalizer_input_select: process(funct_ff, addsub, multiplier, fu_conv_i2f)

  normalizer_input_select: process(funct_ff, addsub, multiplier, fu_conv_i2f)

  begin

  begin

    case funct_ff is

    case funct_ff is

      when op_addsub_c => -- addition/subtraction

      when op_addsub_c => -- addition/subtraction

        normalizer.mode      <= '0'; -- normalization

        normalizer.mode      <= '0'; -- normalization

        normalizer.sign      <= addsub.res_sign;

        normalizer.sign      <= addsub.res_sign;

        normalizer.xexp      <= addsub.exp_cnt;

        normalizer.xexp      <= addsub.exp_cnt;

        normalizer.xmantissa(47 downto 23) <= addsub.res_sum(27 downto 3);

        normalizer.xmantissa(47 downto 23) <= addsub.res_sum(27 downto 3);

        normalizer.xmantissa(22) <= addsub.res_sum(2);

        normalizer.xmantissa(22) <= addsub.res_sum(2);

        normalizer.xmantissa(21) <= addsub.res_sum(1);

        normalizer.xmantissa(21) <= addsub.res_sum(1);

        normalizer.xmantissa(20 downto 01) <= (others => '0');

        normalizer.xmantissa(20 downto 01) <= (others => '0');

        normalizer.xmantissa(00) <= addsub.res_sum(0);

        normalizer.xmantissa(00) <= addsub.res_sum(0);

        normalizer.class     <= addsub.res_class;

        normalizer.class     <= addsub.res_class;

        normalizer.flags_in  <= addsub.flags;

        normalizer.flags_in  <= addsub.flags;

        normalizer.start     <= addsub.done;

        normalizer.start     <= addsub.done;

      when op_mul_c => -- multiplication

      when op_mul_c => -- multiplication

        normalizer.mode      <= '0'; -- normalization

        normalizer.mode      <= '0'; -- normalization

        normalizer.sign      <= multiplier.sign;

        normalizer.sign      <= multiplier.sign;

        normalizer.xexp      <= '0' & multiplier.exp_res(7 downto 0);

        normalizer.xexp      <= '0' & multiplier.exp_res(7 downto 0);

        normalizer.xmantissa <= multiplier.product;

        normalizer.xmantissa <= multiplier.product;

        normalizer.class     <= multiplier.res_class;

        normalizer.class     <= multiplier.res_class;

        normalizer.flags_in  <= multiplier.flags;

        normalizer.flags_in  <= multiplier.flags;

        normalizer.start     <= multiplier.done;

        normalizer.start     <= multiplier.done;

      when others => -- op_i2f_c

      when others => -- op_i2f_c

        normalizer.mode      <= '1'; -- int_to_float

        normalizer.mode      <= '1'; -- int_to_float

        normalizer.sign      <= fu_conv_i2f.sign;

        normalizer.sign      <= fu_conv_i2f.sign;

        normalizer.xexp      <= "001111111"; -- bias = 127

        normalizer.xexp      <= "001111111"; -- bias = 127

        normalizer.xmantissa <= (others => '0'); -- don't care

        normalizer.xmantissa <= (others => '0'); -- don't care

        normalizer.class     <= (others => '0'); -- don't care

        normalizer.class     <= (others => '0'); -- don't care

        normalizer.flags_in  <= (others => '0'); -- no flags yet

        normalizer.flags_in  <= (others => '0'); -- no flags yet

        normalizer.start     <= fu_conv_i2f.done;

        normalizer.start     <= fu_conv_i2f.done;

    end case;

    end case;

  end process normalizer_input_select;

  end process normalizer_input_select;

  -- Normalizer & Rounding Unit -------------------------------------------------------------

  -- Normalizer & Rounding Unit -------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  neorv32_cpu_cp_fpu_normalizer_inst: neorv32_cpu_cp_fpu_normalizer

  neorv32_cpu_cp_fpu_normalizer_inst: neorv32_cpu_cp_fpu_normalizer

  port map (

  port map (

    -- control --

    -- control --

    clk_i      => clk_i,                -- global clock, rising edge

    clk_i      => clk_i,                -- global clock, rising edge

    rstn_i     => rstn_i,               -- global reset, low-active, async

    rstn_i     => rstn_i,               -- global reset, low-active, async

    start_i    => normalizer.start,     -- trigger operation

    start_i    => normalizer.start,     -- trigger operation

    rmode_i    => fpu_operands.frm,     -- rounding mode

    rmode_i    => fpu_operands.frm,     -- rounding mode

    funct_i    => normalizer.mode,      -- operation mode

    funct_i    => normalizer.mode,      -- operation mode

    -- input --

    -- input --

    sign_i     => normalizer.sign,      -- sign

    sign_i     => normalizer.sign,      -- sign

    exponent_i => normalizer.xexp,      -- extended exponent

    exponent_i => normalizer.xexp,      -- extended exponent

    mantissa_i => normalizer.xmantissa, -- extended mantissa

    mantissa_i => normalizer.xmantissa, -- extended mantissa

    integer_i  => fu_conv_i2f.result,   -- integer input

    integer_i  => fu_conv_i2f.result,   -- integer input

    class_i    => normalizer.class,     -- input number class

    class_i    => normalizer.class,     -- input number class

    flags_i    => normalizer.flags_in,  -- exception flags input

    flags_i    => normalizer.flags_in,  -- exception flags input

    -- output --

    -- output --

    result_o   => normalizer.result,    -- result (float or int)

    result_o   => normalizer.result,    -- result (float or int)

    flags_o    => normalizer.flags_out, -- exception flags

    flags_o    => normalizer.flags_out, -- exception flags

    done_o     => normalizer.done       -- operation done

    done_o     => normalizer.done       -- operation done

);

);

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

-- FPU Core - Result

-- FPU Core - Result

-- ****************************************************************************************************************************

-- ****************************************************************************************************************************

  -- Result Output to CPU Pipeline ----------------------------------------------------------

  -- Result Output to CPU Pipeline ----------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  output_gate: process(rstn_i, clk_i)

  output_gate: process(rstn_i, clk_i)

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      res_o    <= (others => def_rst_val_c);

      res_o    <= (others => def_rst_val_c);

      fflags_o <= (others => def_rst_val_c);

      fflags_o <= (others => def_rst_val_c);

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      if (ctrl_engine.valid = '1') then

      if (ctrl_engine.valid = '1') then

        case funct_ff is

        case funct_ff is

          when op_class_c =>

          when op_class_c =>

            res_o    <= fu_classify.result;

            res_o    <= fu_classify.result;

            fflags_o <= fu_classify.flags;

            fflags_o <= fu_classify.flags;

          when op_comp_c =>

          when op_comp_c =>

            res_o    <= fu_compare.result;

            res_o    <= fu_compare.result;

            fflags_o <= fu_compare.flags;

            fflags_o <= fu_compare.flags;

          when op_f2i_c =>

          when op_f2i_c =>

            res_o    <= fu_conv_f2i.result;

            res_o    <= fu_conv_f2i.result;

            fflags_o <= fu_conv_f2i.flags;

            fflags_o <= fu_conv_f2i.flags;

          when op_sgnj_c =>

          when op_sgnj_c =>

            res_o    <= fu_sign_inject.result;

            res_o    <= fu_sign_inject.result;

            fflags_o <= fu_sign_inject.flags;

            fflags_o <= fu_sign_inject.flags;

          when op_minmax_c =>

          when op_minmax_c =>

            res_o    <= fu_min_max.result;

            res_o    <= fu_min_max.result;

            fflags_o <= fu_min_max.flags;

            fflags_o <= fu_min_max.flags;

          when others => -- op_mul_c, op_addsub_c, op_i2f_c, ...

          when others => -- op_mul_c, op_addsub_c, op_i2f_c, ...

            res_o    <= normalizer.result;

            res_o    <= normalizer.result;

            fflags_o <= normalizer.flags_out;

            fflags_o <= normalizer.flags_out;

        end case;

        end case;

      else

      else

        res_o    <= (others => '0');

        res_o    <= (others => '0');

        fflags_o <= (others => '0');

        fflags_o <= (others => '0');

      end if;

      end if;

    end if;

    end if;

  end process output_gate;

  end process output_gate;

  -- operation done --

  -- operation done --

  fu_core_done <= fu_compare.done or fu_classify.done or fu_sign_inject.done or fu_min_max.done or normalizer.done or fu_conv_f2i.done;

  fu_core_done <= fu_compare.done or fu_classify.done or fu_sign_inject.done or fu_min_max.done or normalizer.done or fu_conv_f2i.done;

end neorv32_cpu_cp_fpu_rtl;

end neorv32_cpu_cp_fpu_rtl;

-- ###########################################################################################################################################

-- ###########################################################################################################################################

-- ###########################################################################################################################################

-- ###########################################################################################################################################

-- #################################################################################################

-- #################################################################################################

-- # << NEORV32 - Single-Precision Floating-Point Unit: Normalizer and Rounding Unit >>            #

-- # << NEORV32 - Single-Precision Floating-Point Unit: Normalizer and Rounding Unit >>            #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # This unit also performs integer-to-float conversions.                                         #

-- # This unit also performs integer-to-float conversions.                                         #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # BSD 3-Clause License                                                                          #

-- # BSD 3-Clause License                                                                          #

-- #                                                                                               #

-- #                                                                                               #

-- # Copyright (c) 2021, Stephan Nolting. All rights reserved.                                     #

-- # Copyright (c) 2021, Stephan Nolting. All rights reserved.                                     #

-- #                                                                                               #

-- #                                                                                               #

-- # Redistribution and use in source and binary forms, with or without modification, are          #

-- # Redistribution and use in source and binary forms, with or without modification, are          #

-- # permitted provided that the following conditions are met:                                     #

-- # permitted provided that the following conditions are met:                                     #

-- #                                                                                               #

-- #                                                                                               #

-- # 1. Redistributions of source code must retain the above copyright notice, this list of        #

-- # 1. Redistributions of source code must retain the above copyright notice, this list of        #

-- #    conditions and the following disclaimer.                                                   #

-- #    conditions and the following disclaimer.                                                   #

-- #                                                                                               #

-- #                                                                                               #

-- # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #

-- # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #

-- #    conditions and the following disclaimer in the documentation and/or other materials        #

-- #    conditions and the following disclaimer in the documentation and/or other materials        #

-- #    provided with the distribution.                                                            #

-- #    provided with the distribution.                                                            #

-- #                                                                                               #

-- #                                                                                               #

-- # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #

-- # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #

-- #    endorse or promote products derived from this software without specific prior written      #

-- #    endorse or promote products derived from this software without specific prior written      #

-- #    permission.                                                                                #

-- #    permission.                                                                                #

-- #                                                                                               #

-- #                                                                                               #

-- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #

-- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #

-- # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #

-- # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #

-- # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #

-- # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #

-- # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #

-- # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #

-- # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #

-- # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #

-- # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #

-- # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #

-- # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #

-- # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #

-- # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #

-- # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #

-- # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #

-- # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #

-- # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #

-- #################################################################################################

-- #################################################################################################

library ieee;

library ieee;

use ieee.std_logic_1164.all;

use ieee.std_logic_1164.all;

use ieee.numeric_std.all;

use ieee.numeric_std.all;

library neorv32;

library neorv32;

use neorv32.neorv32_package.all;

use neorv32.neorv32_package.all;

entity neorv32_cpu_cp_fpu_normalizer is

entity neorv32_cpu_cp_fpu_normalizer is

  port (

  port (

    -- control --

    -- control --

    clk_i      : in  std_ulogic; -- global clock, rising edge

    clk_i      : in  std_ulogic; -- global clock, rising edge

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    start_i    : in  std_ulogic; -- trigger operation

    start_i    : in  std_ulogic; -- trigger operation

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    funct_i    : in  std_ulogic; -- operating mode (0=norm&round, 1=int-to-float)

    funct_i    : in  std_ulogic; -- operating mode (0=norm&round, 1=int-to-float)

    -- input --

    -- input --

    sign_i     : in  std_ulogic; -- sign

    sign_i     : in  std_ulogic; -- sign

    exponent_i : in  std_ulogic_vector(08 downto 0); -- extended exponent

    exponent_i : in  std_ulogic_vector(08 downto 0); -- extended exponent

    mantissa_i : in  std_ulogic_vector(47 downto 0); -- extended mantissa

    mantissa_i : in  std_ulogic_vector(47 downto 0); -- extended mantissa

    integer_i  : in  std_ulogic_vector(31 downto 0); -- integer input

    integer_i  : in  std_ulogic_vector(31 downto 0); -- integer input

    class_i    : in  std_ulogic_vector(09 downto 0); -- input number class

    class_i    : in  std_ulogic_vector(09 downto 0); -- input number class

    flags_i    : in  std_ulogic_vector(04 downto 0); -- exception flags input

    flags_i    : in  std_ulogic_vector(04 downto 0); -- exception flags input

    -- output --

    -- output --

    result_o   : out std_ulogic_vector(31 downto 0); -- float result

    result_o   : out std_ulogic_vector(31 downto 0); -- float result

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags output

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags output

    done_o     : out std_ulogic -- operation done

    done_o     : out std_ulogic -- operation done

);

);

end neorv32_cpu_cp_fpu_normalizer;

end neorv32_cpu_cp_fpu_normalizer;

architecture neorv32_cpu_cp_fpu_normalizer_rtl of neorv32_cpu_cp_fpu_normalizer is

architecture neorv32_cpu_cp_fpu_normalizer_rtl of neorv32_cpu_cp_fpu_normalizer is

  -- controller --

  -- controller --

  type ctrl_engine_state_t is (S_IDLE, S_PREPARE_I2F, S_CHECK_I2F, S_PREPARE_NORM, S_PREPARE_SHIFT, S_NORMALIZE_BUSY, S_ROUND, S_CHECK, S_FINALIZE);

  type ctrl_engine_state_t is (S_IDLE, S_PREPARE_I2F, S_CHECK_I2F, S_PREPARE_NORM, S_PREPARE_SHIFT, S_NORMALIZE_BUSY, S_ROUND, S_CHECK, S_FINALIZE);

  type ctrl_t is record

  type ctrl_t is record

    state   : ctrl_engine_state_t; -- current state

    state   : ctrl_engine_state_t; -- current state

    norm_r  : std_ulogic; -- normalization round 0 or 1

    norm_r  : std_ulogic; -- normalization round 0 or 1

    cnt     : std_ulogic_vector(08 downto 0); -- interation counter/exponent (incl. overflow)

    cnt     : std_ulogic_vector(08 downto 0); -- interation counter/exponent (incl. overflow)

    cnt_pre : std_ulogic_vector(08 downto 0);

    cnt_pre : std_ulogic_vector(08 downto 0);

    cnt_of  : std_ulogic; -- counter overflow

    cnt_of  : std_ulogic; -- counter overflow

    cnt_uf  : std_ulogic; -- counter underflow

    cnt_uf  : std_ulogic; -- counter underflow

    rounded : std_ulogic; -- output is rounded

    rounded : std_ulogic; -- output is rounded

    res_sgn : std_ulogic;

    res_sgn : std_ulogic;

    res_exp : std_ulogic_vector(07 downto 0);

    res_exp : std_ulogic_vector(07 downto 0);

    res_man : std_ulogic_vector(22 downto 0);

    res_man : std_ulogic_vector(22 downto 0);

    class   : std_ulogic_vector(09 downto 0);

    class   : std_ulogic_vector(09 downto 0);

    flags   : std_ulogic_vector(04 downto 0);

    flags   : std_ulogic_vector(04 downto 0);

  end record;

  end record;

  signal ctrl : ctrl_t;

  signal ctrl : ctrl_t;

  -- normalization shift register --

  -- normalization shift register --

  type sreg_t is record

  type sreg_t is record

    done  : std_ulogic;

    done  : std_ulogic;

    dir   : std_ulogic; -- shift direction: 0=right, 1=left

    dir   : std_ulogic; -- shift direction: 0=right, 1=left

    zero  : std_ulogic;

    zero  : std_ulogic;

    upper : std_ulogic_vector(31 downto 0);

    upper : std_ulogic_vector(31 downto 0);

    lower : std_ulogic_vector(22 downto 0);

    lower : std_ulogic_vector(22 downto 0);

    ext_g : std_ulogic; -- guard bit

    ext_g : std_ulogic; -- guard bit

    ext_r : std_ulogic; -- round bit

    ext_r : std_ulogic; -- round bit

    ext_s : std_ulogic; -- sticky bit

    ext_s : std_ulogic; -- sticky bit

  end record;

  end record;

  signal sreg : sreg_t;

  signal sreg : sreg_t;

  -- rounding unit --

  -- rounding unit --

  type round_t is record

  type round_t is record

    en     : std_ulogic; -- enable rounding

    en     : std_ulogic; -- enable rounding

    sub    : std_ulogic; -- 0=decrement, 1=increment

    sub    : std_ulogic; -- 0=decrement, 1=increment

    output : std_ulogic_vector(24 downto 0); -- mantissa size + hidden one + 1

    output : std_ulogic_vector(24 downto 0); -- mantissa size + hidden one + 1

  end record;

  end record;

  signal round : round_t;

  signal round : round_t;

begin

begin

  -- Control Engine -------------------------------------------------------------------------

  -- Control Engine -------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  ctrl_engine: process(rstn_i, clk_i)

  ctrl_engine: process(rstn_i, clk_i)

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      ctrl.state   <= S_IDLE;

      ctrl.state   <= S_IDLE;

      ctrl.norm_r  <= def_rst_val_c;

      ctrl.norm_r  <= def_rst_val_c;

      ctrl.cnt     <= (others => def_rst_val_c);

      ctrl.cnt     <= (others => def_rst_val_c);

      ctrl.cnt_pre <= (others => def_rst_val_c);

      ctrl.cnt_pre <= (others => def_rst_val_c);

      ctrl.cnt_of  <= def_rst_val_c;

      ctrl.cnt_of  <= def_rst_val_c;

      ctrl.cnt_uf  <= def_rst_val_c;

      ctrl.cnt_uf  <= def_rst_val_c;

      ctrl.rounded <= def_rst_val_c;

      ctrl.rounded <= def_rst_val_c;

      ctrl.res_exp <= (others => def_rst_val_c);

      ctrl.res_exp <= (others => def_rst_val_c);

      ctrl.res_man <= (others => def_rst_val_c);

      ctrl.res_man <= (others => def_rst_val_c);

      ctrl.res_sgn <= def_rst_val_c;

      ctrl.res_sgn <= def_rst_val_c;

      ctrl.class   <= (others => def_rst_val_c);

      ctrl.class   <= (others => def_rst_val_c);

      ctrl.flags   <= (others => def_rst_val_c);

      ctrl.flags   <= (others => def_rst_val_c);

--

--

      sreg.upper   <= (others => def_rst_val_c);

      sreg.upper   <= (others => def_rst_val_c);

      sreg.lower   <= (others => def_rst_val_c);

      sreg.lower   <= (others => def_rst_val_c);

      sreg.dir     <= def_rst_val_c;

      sreg.dir     <= def_rst_val_c;

      sreg.ext_g   <= def_rst_val_c;

      sreg.ext_g   <= def_rst_val_c;

      sreg.ext_r   <= def_rst_val_c;

      sreg.ext_r   <= def_rst_val_c;

      sreg.ext_s   <= def_rst_val_c;

      sreg.ext_s   <= def_rst_val_c;

--

--

      done_o       <= '0';

      done_o       <= '0';

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- defaults --

      -- defaults --

      ctrl.cnt_pre <= ctrl.cnt;

      ctrl.cnt_pre <= ctrl.cnt;

      done_o       <= '0';

      done_o       <= '0';

      -- exponent counter underflow/overflow --

      -- exponent counter underflow/overflow --

      if ((ctrl.cnt_pre(8 downto 7) = "01") and (ctrl.cnt(8 downto 7) = "10")) then -- overflow

      if ((ctrl.cnt_pre(8 downto 7) = "01") and (ctrl.cnt(8 downto 7) = "10")) then -- overflow

        ctrl.cnt_of <= '1';

        ctrl.cnt_of <= '1';

      elsif (ctrl.cnt_pre(8 downto 7) = "00") and (ctrl.cnt(8 downto 7) = "11") then -- underflow

      elsif (ctrl.cnt_pre(8 downto 7) = "00") and (ctrl.cnt(8 downto 7) = "11") then -- underflow

        ctrl.cnt_uf <= '1';

        ctrl.cnt_uf <= '1';

      end if;

      end if;

      -- fsm --

      -- fsm --

      case ctrl.state is

      case ctrl.state is

        when S_IDLE => -- wait for operation trigger

        when S_IDLE => -- wait for operation trigger

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl.norm_r  <= '0'; -- start with first normalization

          ctrl.norm_r  <= '0'; -- start with first normalization

          ctrl.rounded <= '0'; -- not rounded yet

          ctrl.rounded <= '0'; -- not rounded yet

          ctrl.cnt_of  <= '0';

          ctrl.cnt_of  <= '0';

          ctrl.cnt_uf  <= '0';

          ctrl.cnt_uf  <= '0';

--

--

          if (start_i = '1') then

          if (start_i = '1') then

            ctrl.cnt     <= exponent_i;

            ctrl.cnt     <= exponent_i;

            ctrl.res_sgn <= sign_i;

            ctrl.res_sgn <= sign_i;

            ctrl.class   <= class_i;

            ctrl.class   <= class_i;

            ctrl.flags   <= flags_i;

            ctrl.flags   <= flags_i;

            if (funct_i = '0') then -- float -> float

            if (funct_i = '0') then -- float -> float

              ctrl.state <= S_PREPARE_NORM;

              ctrl.state <= S_PREPARE_NORM;

            else -- integer -> float

            else -- integer -> float

              ctrl.state <= S_PREPARE_I2F;

              ctrl.state <= S_PREPARE_I2F;

            end if;

            end if;

          end if;

          end if;

        when S_PREPARE_I2F => -- prepare integer-to-float conversion

        when S_PREPARE_I2F => -- prepare integer-to-float conversion

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          sreg.upper <= integer_i;

          sreg.upper <= integer_i;

          sreg.lower <= (others => '0');

          sreg.lower <= (others => '0');

          sreg.ext_g <= '0';

          sreg.ext_g <= '0';

          sreg.ext_r <= '0';

          sreg.ext_r <= '0';

          sreg.ext_s <= '0';

          sreg.ext_s <= '0';

          sreg.dir   <= '0'; -- shift right

          sreg.dir   <= '0'; -- shift right

          ctrl.state <= S_CHECK_I2F;

          ctrl.state <= S_CHECK_I2F;

        when S_CHECK_I2F => -- check if converting zero

        when S_CHECK_I2F => -- check if converting zero

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          if (sreg.zero = '1') then -- all zero

          if (sreg.zero = '1') then -- all zero

            ctrl.class(fp_class_pos_zero_c) <= '1';

            ctrl.class(fp_class_pos_zero_c) <= '1';

            ctrl.state <= S_FINALIZE;

            ctrl.state <= S_FINALIZE;

          else

          else

            ctrl.state <= S_NORMALIZE_BUSY;

            ctrl.state <= S_NORMALIZE_BUSY;

          end if;

          end if;

        when S_PREPARE_NORM => -- prepare "normal" normalization & rounding

        when S_PREPARE_NORM => -- prepare "normal" normalization & rounding

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          sreg.upper(31 downto 02) <= (others => '0');

          sreg.upper(31 downto 02) <= (others => '0');

          sreg.upper(01 downto 00) <= mantissa_i(47 downto 46);

          sreg.upper(01 downto 00) <= mantissa_i(47 downto 46);

          sreg.lower <= mantissa_i(45 downto 23);

          sreg.lower <= mantissa_i(45 downto 23);

          sreg.ext_g <= mantissa_i(22);

          sreg.ext_g <= mantissa_i(22);

          sreg.ext_r <= mantissa_i(21);

          sreg.ext_r <= mantissa_i(21);

          sreg.ext_s <= or_reduce_f(mantissa_i(20 downto 0));

          if (or_reduce_f(mantissa_i(20 downto 0)) = '1') then

            sreg.ext_s <= '1';

          else

            sreg.ext_s <= '0';

          end if;

          -- check for special cases --

          -- check for special cases --

          if ((ctrl.class(fp_class_snan_c)       or ctrl.class(fp_class_qnan_c)       or -- NaN

          if ((ctrl.class(fp_class_snan_c)       or ctrl.class(fp_class_qnan_c)       or -- NaN

               ctrl.class(fp_class_neg_zero_c)   or ctrl.class(fp_class_pos_zero_c)   or -- zero

               ctrl.class(fp_class_neg_zero_c)   or ctrl.class(fp_class_pos_zero_c)   or -- zero

               ctrl.class(fp_class_neg_denorm_c) or ctrl.class(fp_class_pos_denorm_c) or -- subnormal

               ctrl.class(fp_class_neg_denorm_c) or ctrl.class(fp_class_pos_denorm_c) or -- subnormal

               ctrl.class(fp_class_neg_inf_c)    or ctrl.class(fp_class_pos_inf_c)    or -- infinity

               ctrl.class(fp_class_neg_inf_c)    or ctrl.class(fp_class_pos_inf_c)    or -- infinity

               ctrl.flags(fp_exc_uf_c) or -- underflow

               ctrl.flags(fp_exc_uf_c) or -- underflow

               ctrl.flags(fp_exc_of_c) or -- overflow

               ctrl.flags(fp_exc_of_c) or -- overflow

               ctrl.flags(fp_exc_nv_c)) = '1') then -- invalid

               ctrl.flags(fp_exc_nv_c)) = '1') then -- invalid

            ctrl.state <= S_FINALIZE;

            ctrl.state <= S_FINALIZE;

          else

          else

            ctrl.state <= S_PREPARE_SHIFT;

            ctrl.state <= S_PREPARE_SHIFT;

          end if;

          end if;

        when S_PREPARE_SHIFT => -- prepare shift direction (for "normal" normalization only)

        when S_PREPARE_SHIFT => -- prepare shift direction (for "normal" normalization only)

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          if (sreg.zero = '0') then -- number < 1.0

          if (sreg.zero = '0') then -- number < 1.0

            sreg.dir <= '0'; -- shift right

            sreg.dir <= '0'; -- shift right

          else -- number >= 1.0

          else -- number >= 1.0

            sreg.dir <= '1'; -- shift left

            sreg.dir <= '1'; -- shift left

          end if;

          end if;

          ctrl.state <= S_NORMALIZE_BUSY;

          ctrl.state <= S_NORMALIZE_BUSY;

        when S_NORMALIZE_BUSY => -- running normalization cycle

        when S_NORMALIZE_BUSY => -- running normalization cycle

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          -- shift until normalized or exception --

          -- shift until normalized or exception --

          if (sreg.done = '1') or (ctrl.cnt_uf = '1') or (ctrl.cnt_of = '1') then

          if (sreg.done = '1') or (ctrl.cnt_uf = '1') or (ctrl.cnt_of = '1') then

            -- normalization control --

            -- normalization control --

            ctrl.norm_r <= '1';

            ctrl.norm_r <= '1';

            if (ctrl.norm_r = '0') then -- first normalization cycle done

            if (ctrl.norm_r = '0') then -- first normalization cycle done

              ctrl.state <= S_ROUND;

              ctrl.state <= S_ROUND;

            else -- second normalization cycle done

            else -- second normalization cycle done

              ctrl.state <= S_CHECK;

              ctrl.state <= S_CHECK;

            end if;

            end if;

          else

          else

            if (sreg.dir = '0') then -- shift right

            if (sreg.dir = '0') then -- shift right

              ctrl.cnt   <= std_ulogic_vector(unsigned(ctrl.cnt) + 1);

              ctrl.cnt   <= std_ulogic_vector(unsigned(ctrl.cnt) + 1);

              sreg.upper <= '0' & sreg.upper(sreg.upper'left downto 1);

              sreg.upper <= '0' & sreg.upper(sreg.upper'left downto 1);

              sreg.lower <= sreg.upper(0) & sreg.lower(sreg.lower'left downto 1);

              sreg.lower <= sreg.upper(0) & sreg.lower(sreg.lower'left downto 1);

              sreg.ext_g <= sreg.lower(0);

              sreg.ext_g <= sreg.lower(0);

              sreg.ext_r <= sreg.ext_g;

              sreg.ext_r <= sreg.ext_g;

              sreg.ext_s <= sreg.ext_r or sreg.ext_s; -- sticky bit

              sreg.ext_s <= sreg.ext_r or sreg.ext_s; -- sticky bit

            else -- shift left

            else -- shift left

              ctrl.cnt   <= std_ulogic_vector(unsigned(ctrl.cnt) - 1);

              ctrl.cnt   <= std_ulogic_vector(unsigned(ctrl.cnt) - 1);

              sreg.upper <= sreg.upper(sreg.upper'left-1 downto 0) & sreg.lower(sreg.lower'left);

              sreg.upper <= sreg.upper(sreg.upper'left-1 downto 0) & sreg.lower(sreg.lower'left);

              sreg.lower <= sreg.lower(sreg.lower'left-1 downto 0) & sreg.ext_g;

              sreg.lower <= sreg.lower(sreg.lower'left-1 downto 0) & sreg.ext_g;

              sreg.ext_g <= sreg.ext_r;

              sreg.ext_g <= sreg.ext_r;

              sreg.ext_r <= sreg.ext_s;

              sreg.ext_r <= sreg.ext_s;

              sreg.ext_s <= sreg.ext_s; -- sticky bit

              sreg.ext_s <= sreg.ext_s; -- sticky bit

            end if;

            end if;

          end if;

          end if;

        when S_ROUND => -- rounding cycle (after first normalization)

        when S_ROUND => -- rounding cycle (after first normalization)

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl.rounded <= ctrl.rounded or round.en;

          ctrl.rounded <= ctrl.rounded or round.en;

          sreg.upper(31 downto 02) <= (others => '0');

          sreg.upper(31 downto 02) <= (others => '0');

          sreg.upper(01 downto 00) <= round.output(24 downto 23);

          sreg.upper(01 downto 00) <= round.output(24 downto 23);

          sreg.lower <= round.output(22 downto 00);

          sreg.lower <= round.output(22 downto 00);

          sreg.ext_g <= '0';

          sreg.ext_g <= '0';

          sreg.ext_r <= '0';

          sreg.ext_r <= '0';

          sreg.ext_s <= '0';

          sreg.ext_s <= '0';

          ctrl.state <= S_PREPARE_SHIFT;

          ctrl.state <= S_PREPARE_SHIFT;

        when S_CHECK => -- check for overflow/underflow

        when S_CHECK => -- check for overflow/underflow

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          if (ctrl.cnt_uf = '1') then -- underflow

          if (ctrl.cnt_uf = '1') then -- underflow

            ctrl.flags(fp_exc_uf_c) <= '1';

            ctrl.flags(fp_exc_uf_c) <= '1';

          elsif (ctrl.cnt_of = '1') then -- overflow

          elsif (ctrl.cnt_of = '1') then -- overflow

            ctrl.flags(fp_exc_of_c) <= '1';

            ctrl.flags(fp_exc_of_c) <= '1';

          elsif (ctrl.cnt(7 downto 0) = x"00") then -- subnormal

          elsif (ctrl.cnt(7 downto 0) = x"00") then -- subnormal

            ctrl.flags(fp_exc_uf_c) <= '1';

            ctrl.flags(fp_exc_uf_c) <= '1';

          elsif (ctrl.cnt(7 downto 0) = x"FF") then -- infinity

          elsif (ctrl.cnt(7 downto 0) = x"FF") then -- infinity

            ctrl.flags(fp_exc_of_c) <= '1';

            ctrl.flags(fp_exc_of_c) <= '1';

          end if;

          end if;

          ctrl.state  <= S_FINALIZE;

          ctrl.state  <= S_FINALIZE;

        when S_FINALIZE => -- result finalization

        when S_FINALIZE => -- result finalization

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          -- generate result word (the ORDER of checks is imporatant here!) --

          -- generate result word (the ORDER of checks is imporatant here!) --

          if (ctrl.class(fp_class_snan_c) = '1') or (ctrl.class(fp_class_qnan_c) = '1') then -- sNaN / qNaN

          if (ctrl.class(fp_class_snan_c) = '1') or (ctrl.class(fp_class_qnan_c) = '1') then -- sNaN / qNaN

            ctrl.res_sgn <= fp_single_qnan_c(31);

            ctrl.res_sgn <= fp_single_qnan_c(31);

            ctrl.res_exp <= fp_single_qnan_c(30 downto 23);

            ctrl.res_exp <= fp_single_qnan_c(30 downto 23);

            ctrl.res_man <= fp_single_qnan_c(22 downto 00);

            ctrl.res_man <= fp_single_qnan_c(22 downto 00);

          elsif (ctrl.class(fp_class_neg_inf_c) = '1') or (ctrl.class(fp_class_pos_inf_c) = '1') or -- infinity

          elsif (ctrl.class(fp_class_neg_inf_c) = '1') or (ctrl.class(fp_class_pos_inf_c) = '1') or -- infinity

                (ctrl.flags(fp_exc_of_c) = '1') then -- overflow

                (ctrl.flags(fp_exc_of_c) = '1') then -- overflow

            ctrl.res_exp <= fp_single_pos_inf_c(30 downto 23); -- keep original sign

            ctrl.res_exp <= fp_single_pos_inf_c(30 downto 23); -- keep original sign

            ctrl.res_man <= fp_single_pos_inf_c(22 downto 00);

            ctrl.res_man <= fp_single_pos_inf_c(22 downto 00);

          elsif (ctrl.class(fp_class_neg_zero_c) = '1') or (ctrl.class(fp_class_pos_zero_c) = '1') then -- zero

          elsif (ctrl.class(fp_class_neg_zero_c) = '1') or (ctrl.class(fp_class_pos_zero_c) = '1') then -- zero

            ctrl.res_sgn <= ctrl.class(fp_class_neg_zero_c);

            ctrl.res_sgn <= ctrl.class(fp_class_neg_zero_c);

            ctrl.res_exp <= fp_single_pos_zero_c(30 downto 23);

            ctrl.res_exp <= fp_single_pos_zero_c(30 downto 23);

            ctrl.res_man <= fp_single_pos_zero_c(22 downto 00);

            ctrl.res_man <= fp_single_pos_zero_c(22 downto 00);

          elsif (ctrl.flags(fp_exc_uf_c) = '1') or -- underflow

          elsif (ctrl.flags(fp_exc_uf_c) = '1') or -- underflow

                (sreg.zero = '1') or (ctrl.class(fp_class_neg_denorm_c) = '1') or (ctrl.class(fp_class_pos_denorm_c) = '1') then -- denormalized (flush-to-zero)

                (sreg.zero = '1') or (ctrl.class(fp_class_neg_denorm_c) = '1') or (ctrl.class(fp_class_pos_denorm_c) = '1') then -- denormalized (flush-to-zero)

            ctrl.res_exp <= fp_single_pos_zero_c(30 downto 23); -- keep original sign

            ctrl.res_exp <= fp_single_pos_zero_c(30 downto 23); -- keep original sign

            ctrl.res_man <= fp_single_pos_zero_c(22 downto 00);

            ctrl.res_man <= fp_single_pos_zero_c(22 downto 00);

          else -- result is ok

          else -- result is ok

            ctrl.res_exp <= ctrl.cnt(7 downto 0);

            ctrl.res_exp <= ctrl.cnt(7 downto 0);

            ctrl.res_man <= sreg.lower;

            ctrl.res_man <= sreg.lower;

          end if;

          end if;

          -- generate exception flags --

          -- generate exception flags --

          ctrl.flags(fp_exc_nv_c) <= ctrl.flags(fp_exc_nv_c) or ctrl.class(fp_class_snan_c); -- invalid if input is SIGNALING NaN

          ctrl.flags(fp_exc_nv_c) <= ctrl.flags(fp_exc_nv_c) or ctrl.class(fp_class_snan_c); -- invalid if input is SIGNALING NaN

          ctrl.flags(fp_exc_nx_c) <= ctrl.flags(fp_exc_nx_c) or ctrl.rounded; -- inexcat if result is rounded

          ctrl.flags(fp_exc_nx_c) <= ctrl.flags(fp_exc_nx_c) or ctrl.rounded; -- inexcat if result is rounded

--

--

          done_o     <= '1';

          done_o     <= '1';

          ctrl.state <= S_IDLE;

          ctrl.state <= S_IDLE;

        when others => -- undefined

        when others => -- undefined

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl.state <= S_IDLE;

          ctrl.state <= S_IDLE;

      end case;

      end case;

    end if;

    end if;

  end process ctrl_engine;

  end process ctrl_engine;

  -- stop shifting when normalized --

  -- stop shifting when normalized --

  sreg.done <= (not or_reduce_f(sreg.upper(sreg.upper'left downto 1))) and sreg.upper(0); -- input is zero, hidden one is set

  sreg.done <= '1' when (or_reduce_f(sreg.upper(sreg.upper'left downto 1)) = '0') and (sreg.upper(0) = '1') else '0'; -- input is zero, hidden one is set

  -- all-zero including hidden bit --

  -- all-zero including hidden bit --

  sreg.zero <= not or_reduce_f(sreg.upper);

  sreg.zero <= '1' when (or_reduce_f(sreg.upper) = '0') else '0';

  -- result --

  -- result --

  result_o(31)           <= ctrl.res_sgn;

  result_o(31)           <= ctrl.res_sgn;

  result_o(30 downto 23) <= ctrl.res_exp;

  result_o(30 downto 23) <= ctrl.res_exp;

  result_o(22 downto  0) <= ctrl.res_man;

  result_o(22 downto  0) <= ctrl.res_man;

  -- exception flags --

  -- exception flags --

  flags_o(fp_exc_nv_c) <= ctrl.flags(fp_exc_nv_c); -- invalid operation

  flags_o(fp_exc_nv_c) <= ctrl.flags(fp_exc_nv_c); -- invalid operation

  flags_o(fp_exc_dz_c) <= ctrl.flags(fp_exc_dz_c); -- divide by zero

  flags_o(fp_exc_dz_c) <= ctrl.flags(fp_exc_dz_c); -- divide by zero

  flags_o(fp_exc_of_c) <= ctrl.flags(fp_exc_of_c); -- overflow

  flags_o(fp_exc_of_c) <= ctrl.flags(fp_exc_of_c); -- overflow

  flags_o(fp_exc_uf_c) <= ctrl.flags(fp_exc_uf_c); -- underflow

  flags_o(fp_exc_uf_c) <= ctrl.flags(fp_exc_uf_c); -- underflow

  flags_o(fp_exc_nx_c) <= ctrl.flags(fp_exc_nx_c); -- inexact

  flags_o(fp_exc_nx_c) <= ctrl.flags(fp_exc_nx_c); -- inexact

  -- Rounding -------------------------------------------------------------------------------

  -- Rounding -------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  rounding_unit_ctrl: process(rmode_i, sreg)

  rounding_unit_ctrl: process(rmode_i, sreg)

  begin

  begin

    -- defaults --

    -- defaults --

    round.en  <= '0';

    round.en  <= '0';

    round.sub <= '0';

    round.sub <= '0';

    -- rounding mode --

    -- rounding mode --

    case rmode_i(2 downto 0) is

    case rmode_i(2 downto 0) is

      when "000" => -- round to nearest, ties to even

      when "000" => -- round to nearest, ties to even

        if (sreg.ext_g = '0') then

        if (sreg.ext_g = '0') then

          round.en <= '0'; -- round down (do nothing)

          round.en <= '0'; -- round down (do nothing)

        else

        else

          if (sreg.ext_r = '0') and (sreg.ext_s = '0') then -- tie!

          if (sreg.ext_r = '0') and (sreg.ext_s = '0') then -- tie!

            round.en <= sreg.lower(0); -- round up if LSB of mantissa is set

            round.en <= sreg.lower(0); -- round up if LSB of mantissa is set

          else

          else

            round.en <= '1'; -- round up

            round.en <= '1'; -- round up

          end if;

          end if;

        end if;

        end if;

        round.sub <= '0'; -- increment

        round.sub <= '0'; -- increment

      when "001" => -- round towards zero

      when "001" => -- round towards zero

        round.en <= '0'; -- no rounding -> just truncate

        round.en <= '0'; -- no rounding -> just truncate

      when "010" => -- round down (towards -infinity)

      when "010" => -- round down (towards -infinity)

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.sub <= '1'; -- decrement

        round.sub <= '1'; -- decrement

      when "011" => -- round up (towards +infinity)

      when "011" => -- round up (towards +infinity)

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.sub <= '0'; -- increment

        round.sub <= '0'; -- increment

      when "100" => -- round to nearest, ties to max magnitude

      when "100" => -- round to nearest, ties to max magnitude

        round.en <= '0'; -- FIXME / TODO

        round.en <= '0'; -- FIXME / TODO

      when others => -- undefined

      when others => -- undefined

        round.en <= '0';

        round.en <= '0';

    end case;

    end case;

  end process rounding_unit_ctrl;

  end process rounding_unit_ctrl;

  -- incrementer/decrementer --

  -- incrementer/decrementer --

  rounding_unit_add: process(round, sreg)

  rounding_unit_add: process(round, sreg)

    variable tmp_v : std_ulogic_vector(24 downto 0);

    variable tmp_v : std_ulogic_vector(24 downto 0);

  begin

  begin

    tmp_v := '0' & sreg.upper(0) & sreg.lower;

    tmp_v := '0' & sreg.upper(0) & sreg.lower;

    if (round.en = '1') then

    if (round.en = '1') then

      if (round.sub = '0') then -- increment

      if (round.sub = '0') then -- increment

        round.output <= std_ulogic_vector(unsigned(tmp_v) + 1);

        round.output <= std_ulogic_vector(unsigned(tmp_v) + 1);

      else -- decrement

      else -- decrement

        round.output <= std_ulogic_vector(unsigned(tmp_v) - 1);

        round.output <= std_ulogic_vector(unsigned(tmp_v) - 1);

      end if;

      end if;

    else -- do nothing

    else -- do nothing

      round.output <= tmp_v;

      round.output <= tmp_v;

    end if;

    end if;

  end process rounding_unit_add;

  end process rounding_unit_add;

end neorv32_cpu_cp_fpu_normalizer_rtl;

end neorv32_cpu_cp_fpu_normalizer_rtl;

-- ###########################################################################################################################################

-- ###########################################################################################################################################

-- ###########################################################################################################################################

-- ###########################################################################################################################################

-- #################################################################################################

-- #################################################################################################

-- # << NEORV32 - Single-Precision Floating-Point Unit: Float-To-Int Converter >>                  #

-- # << NEORV32 - Single-Precision Floating-Point Unit: Float-To-Int Converter >>                  #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # BSD 3-Clause License                                                                          #

-- # BSD 3-Clause License                                                                          #

-- #                                                                                               #

-- #                                                                                               #

-- # Copyright (c) 2021, Stephan Nolting. All rights reserved.                                     #

-- # Copyright (c) 2021, Stephan Nolting. All rights reserved.                                     #

-- #                                                                                               #

-- #                                                                                               #

-- # Redistribution and use in source and binary forms, with or without modification, are          #

-- # Redistribution and use in source and binary forms, with or without modification, are          #

-- # permitted provided that the following conditions are met:                                     #

-- # permitted provided that the following conditions are met:                                     #

-- #                                                                                               #

-- #                                                                                               #

-- # 1. Redistributions of source code must retain the above copyright notice, this list of        #

-- # 1. Redistributions of source code must retain the above copyright notice, this list of        #

-- #    conditions and the following disclaimer.                                                   #

-- #    conditions and the following disclaimer.                                                   #

-- #                                                                                               #

-- #                                                                                               #

-- # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #

-- # 2. Redistributions in binary form must reproduce the above copyright notice, this list of     #

-- #    conditions and the following disclaimer in the documentation and/or other materials        #

-- #    conditions and the following disclaimer in the documentation and/or other materials        #

-- #    provided with the distribution.                                                            #

-- #    provided with the distribution.                                                            #

-- #                                                                                               #

-- #                                                                                               #

-- # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #

-- # 3. Neither the name of the copyright holder nor the names of its contributors may be used to  #

-- #    endorse or promote products derived from this software without specific prior written      #

-- #    endorse or promote products derived from this software without specific prior written      #

-- #    permission.                                                                                #

-- #    permission.                                                                                #

-- #                                                                                               #

-- #                                                                                               #

-- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #

-- # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS   #

-- # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #

-- # OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF               #

-- # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #

-- # MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE    #

-- # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #

-- # COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,     #

-- # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #

-- # EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE #

-- # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #

-- # GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED    #

-- # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #

-- # AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING     #

-- # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #

-- # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED  #

-- # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #

-- # OF THE POSSIBILITY OF SUCH DAMAGE.                                                            #

-- # ********************************************************************************************* #

-- # ********************************************************************************************* #

-- # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #

-- # The NEORV32 Processor - https://github.com/stnolting/neorv32              (c) Stephan Nolting #

-- #################################################################################################

-- #################################################################################################

library ieee;

library ieee;

use ieee.std_logic_1164.all;

use ieee.std_logic_1164.all;

use ieee.numeric_std.all;

use ieee.numeric_std.all;

library neorv32;

library neorv32;

use neorv32.neorv32_package.all;

use neorv32.neorv32_package.all;

entity neorv32_cpu_cp_fpu_f2i is

entity neorv32_cpu_cp_fpu_f2i is

  port (

  port (

    -- control --

    -- control --

    clk_i      : in  std_ulogic; -- global clock, rising edge

    clk_i      : in  std_ulogic; -- global clock, rising edge

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    rstn_i     : in  std_ulogic; -- global reset, low-active, async

    start_i    : in  std_ulogic; -- trigger operation

    start_i    : in  std_ulogic; -- trigger operation

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    rmode_i    : in  std_ulogic_vector(02 downto 0); -- rounding mode

    funct_i    : in  std_ulogic; -- 0=signed, 1=unsigned

    funct_i    : in  std_ulogic; -- 0=signed, 1=unsigned

    -- input --

    -- input --

    sign_i     : in  std_ulogic; -- sign

    sign_i     : in  std_ulogic; -- sign

    exponent_i : in  std_ulogic_vector(07 downto 0); -- exponent

    exponent_i : in  std_ulogic_vector(07 downto 0); -- exponent

    mantissa_i : in  std_ulogic_vector(22 downto 0); -- mantissa

    mantissa_i : in  std_ulogic_vector(22 downto 0); -- mantissa

    class_i    : in  std_ulogic_vector(09 downto 0); -- operand class

    class_i    : in  std_ulogic_vector(09 downto 0); -- operand class

    -- output --

    -- output --

    result_o   : out std_ulogic_vector(31 downto 0); -- integer result

    result_o   : out std_ulogic_vector(31 downto 0); -- integer result

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags

    flags_o    : out std_ulogic_vector(04 downto 0); -- exception flags

    done_o     : out std_ulogic -- operation done

    done_o     : out std_ulogic -- operation done

);

);

end neorv32_cpu_cp_fpu_f2i;

end neorv32_cpu_cp_fpu_f2i;

architecture neorv32_cpu_cp_fpu_f2i_rtl of neorv32_cpu_cp_fpu_f2i is

architecture neorv32_cpu_cp_fpu_f2i_rtl of neorv32_cpu_cp_fpu_f2i is

  -- controller --

  -- controller --

  type ctrl_engine_state_t is (S_IDLE, S_PREPARE_F2I, S_NORMALIZE_BUSY, S_ROUND, S_FINALIZE);

  type ctrl_engine_state_t is (S_IDLE, S_PREPARE_F2I, S_NORMALIZE_BUSY, S_ROUND, S_FINALIZE);

  type ctrl_t is record

  type ctrl_t is record

    state      : ctrl_engine_state_t; -- current state

    state      : ctrl_engine_state_t; -- current state

    unsign     : std_ulogic;

    unsign     : std_ulogic;

    cnt        : std_ulogic_vector(07 downto 0); -- interation counter/exponent

    cnt        : std_ulogic_vector(07 downto 0); -- interation counter/exponent

    sign       : std_ulogic;

    sign       : std_ulogic;

    class      : std_ulogic_vector(09 downto 0);

    class      : std_ulogic_vector(09 downto 0);

    rounded    : std_ulogic; -- output is rounded

    rounded    : std_ulogic; -- output is rounded

    over       : std_ulogic; -- output is overflowing

    over       : std_ulogic; -- output is overflowing

    under      : std_ulogic; -- output in underflowing

    under      : std_ulogic; -- output in underflowing

    result_tmp : std_ulogic_vector(31 downto 0);

    result_tmp : std_ulogic_vector(31 downto 0);

    result     : std_ulogic_vector(31 downto 0);

    result     : std_ulogic_vector(31 downto 0);

  end record;

  end record;

  signal ctrl : ctrl_t;

  signal ctrl : ctrl_t;

  -- conversion shift register --

  -- conversion shift register --

  type sreg_t is record

  type sreg_t is record

    int   : std_ulogic_vector(31 downto 0); -- including hidden-zero

    int   : std_ulogic_vector(31 downto 0); -- including hidden-zero

    mant  : std_ulogic_vector(22 downto 0);

    mant  : std_ulogic_vector(22 downto 0);

    ext_g : std_ulogic; -- guard bit

    ext_g : std_ulogic; -- guard bit

    ext_r : std_ulogic; -- round bit

    ext_r : std_ulogic; -- round bit

    ext_s : std_ulogic; -- sticky bit

    ext_s : std_ulogic; -- sticky bit

  end record;

  end record;

  signal sreg : sreg_t;

  signal sreg : sreg_t;

  -- rounding unit --

  -- rounding unit --

  type round_t is record

  type round_t is record

    en     : std_ulogic; -- enable rounding

    en     : std_ulogic; -- enable rounding

    sub    : std_ulogic; -- 0=decrement, 1=increment

    sub    : std_ulogic; -- 0=decrement, 1=increment

    output : std_ulogic_vector(32 downto 0); -- result + overflow

    output : std_ulogic_vector(32 downto 0); -- result + overflow

  end record;

  end record;

  signal round : round_t;

  signal round : round_t;

begin

begin

  -- Control Engine -------------------------------------------------------------------------

  -- Control Engine -------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  ctrl_engine: process(rstn_i, clk_i)

  ctrl_engine: process(rstn_i, clk_i)

  begin

  begin

    if (rstn_i = '0') then

    if (rstn_i = '0') then

      ctrl.state      <= S_IDLE;

      ctrl.state      <= S_IDLE;

      ctrl.cnt        <= (others => def_rst_val_c);

      ctrl.cnt        <= (others => def_rst_val_c);

      ctrl.sign       <= def_rst_val_c;

      ctrl.sign       <= def_rst_val_c;

      ctrl.class      <= (others => def_rst_val_c);

      ctrl.class      <= (others => def_rst_val_c);

      ctrl.rounded    <= def_rst_val_c;

      ctrl.rounded    <= def_rst_val_c;

      ctrl.over       <= def_rst_val_c;

      ctrl.over       <= def_rst_val_c;

      ctrl.under      <= def_rst_val_c;

      ctrl.under      <= def_rst_val_c;

      ctrl.unsign     <= def_rst_val_c;

      ctrl.unsign     <= def_rst_val_c;

      ctrl.result     <= (others => def_rst_val_c);

      ctrl.result     <= (others => def_rst_val_c);

      ctrl.result_tmp <= (others => def_rst_val_c);

      ctrl.result_tmp <= (others => def_rst_val_c);

      sreg.int        <= (others => def_rst_val_c);

      sreg.int        <= (others => def_rst_val_c);

      sreg.mant       <= (others => def_rst_val_c);

      sreg.mant       <= (others => def_rst_val_c);

      sreg.ext_s      <= def_rst_val_c;

      sreg.ext_s      <= def_rst_val_c;

      done_o          <= '0';

      done_o          <= '0';

    elsif rising_edge(clk_i) then

    elsif rising_edge(clk_i) then

      -- defaults --

      -- defaults --

      done_o <= '0';

      done_o <= '0';

      -- fsm --

      -- fsm --

      case ctrl.state is

      case ctrl.state is

        when S_IDLE => -- wait for operation trigger

        when S_IDLE => -- wait for operation trigger

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl.rounded <= '0'; -- not rounded yet

          ctrl.rounded <= '0'; -- not rounded yet

          ctrl.over    <= '0'; -- not overflowing yet

          ctrl.over    <= '0'; -- not overflowing yet

          ctrl.under   <= '0'; -- not underflowing yet

          ctrl.under   <= '0'; -- not underflowing yet

          ctrl.unsign  <= funct_i;

          ctrl.unsign  <= funct_i;

          sreg.ext_s   <= '0'; -- init

          sreg.ext_s   <= '0'; -- init

          if (start_i = '1') then

          if (start_i = '1') then

            ctrl.cnt    <= exponent_i;

            ctrl.cnt    <= exponent_i;

            ctrl.sign   <= sign_i;

            ctrl.sign   <= sign_i;

            ctrl.class  <= class_i;

            ctrl.class  <= class_i;

            sreg.mant   <= mantissa_i;

            sreg.mant   <= mantissa_i;

            ctrl.state  <= S_PREPARE_F2I;

            ctrl.state  <= S_PREPARE_F2I;

          end if;

          end if;

        when S_PREPARE_F2I => -- prepare float-to-integer conversion

        when S_PREPARE_F2I => -- prepare float-to-integer conversion

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          if (unsigned(ctrl.cnt) < 126) then -- less than 0.5

          if (unsigned(ctrl.cnt) < 126) then -- less than 0.5

            sreg.int    <= (others => '0');

            sreg.int    <= (others => '0');

            ctrl.under  <= '1'; -- this is an underflow!

            ctrl.under  <= '1'; -- this is an underflow!

            ctrl.cnt    <= (others => '0');

            ctrl.cnt    <= (others => '0');

          elsif (unsigned(ctrl.cnt) = 126) then -- num < 1.0 but num >= 0.5

          elsif (unsigned(ctrl.cnt) = 126) then -- num < 1.0 but num >= 0.5

            sreg.int    <= (others => '0');

            sreg.int    <= (others => '0');

            sreg.mant   <= '1' & sreg.mant(sreg.mant'left downto 1);

            sreg.mant   <= '1' & sreg.mant(sreg.mant'left downto 1);

            ctrl.cnt    <= (others => '0');

            ctrl.cnt    <= (others => '0');

          else

          else

            sreg.int    <= (others => '0');

            sreg.int    <= (others => '0');

            sreg.int(0) <= '1'; -- hidden one

            sreg.int(0) <= '1'; -- hidden one

            ctrl.cnt    <= std_ulogic_vector(unsigned(ctrl.cnt) - 127); -- remove bias to get raw number of left shifts

            ctrl.cnt    <= std_ulogic_vector(unsigned(ctrl.cnt) - 127); -- remove bias to get raw number of left shifts

          end if;

          end if;

          -- check terminal cases --

          -- check terminal cases --

          if ((ctrl.class(fp_class_neg_inf_c)  or ctrl.class(fp_class_pos_inf_c) or

          if ((ctrl.class(fp_class_neg_inf_c)  or ctrl.class(fp_class_pos_inf_c) or

               ctrl.class(fp_class_neg_zero_c) or ctrl.class(fp_class_pos_zero_c) or

               ctrl.class(fp_class_neg_zero_c) or ctrl.class(fp_class_pos_zero_c) or

               ctrl.class(fp_class_snan_c)     or ctrl.class(fp_class_qnan_c)) = '1') then

               ctrl.class(fp_class_snan_c)     or ctrl.class(fp_class_qnan_c)) = '1') then

            ctrl.state <= S_FINALIZE;

            ctrl.state <= S_FINALIZE;

          else

          else

            ctrl.state <= S_NORMALIZE_BUSY;

            ctrl.state <= S_NORMALIZE_BUSY;

          end if;

          end if;

        when S_NORMALIZE_BUSY => -- running normalization cycle

        when S_NORMALIZE_BUSY => -- running normalization cycle

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          sreg.ext_s <= sreg.ext_s or or_reduce_f(sreg.mant(sreg.mant'left-2 downto 0)); -- sticky bit

          if (or_reduce_f(sreg.mant(sreg.mant'left-2 downto 0)) = '1') then

            sreg.ext_s <= '1'; -- sticky bit

          end if;

          if (or_reduce_f(ctrl.cnt(ctrl.cnt'left-1 downto 0)) = '0') then

          if (or_reduce_f(ctrl.cnt(ctrl.cnt'left-1 downto 0)) = '0') then

            if (ctrl.unsign = '0') then -- signed conversion

            if (ctrl.unsign = '0') then -- signed conversion

              ctrl.over <= ctrl.over or sreg.int(sreg.int'left); -- update overrun flag again to check for numerical overflow into sign bit

              ctrl.over <= ctrl.over or sreg.int(sreg.int'left); -- update overrun flag again to check for numerical overflow into sign bit

            end if;

            end if;

            ctrl.state <= S_ROUND;

            ctrl.state <= S_ROUND;

          else -- shift left

          else -- shift left

            ctrl.cnt  <= std_ulogic_vector(unsigned(ctrl.cnt) - 1);

            ctrl.cnt  <= std_ulogic_vector(unsigned(ctrl.cnt) - 1);

            sreg.int  <= sreg.int(sreg.int'left-1 downto 0) & sreg.mant(sreg.mant'left);

            sreg.int  <= sreg.int(sreg.int'left-1 downto 0) & sreg.mant(sreg.mant'left);

            sreg.mant <= sreg.mant(sreg.mant'left-1 downto 0) & '0';

            sreg.mant <= sreg.mant(sreg.mant'left-1 downto 0) & '0';

            ctrl.over <= ctrl.over or sreg.int(sreg.int'left);

            ctrl.over <= ctrl.over or sreg.int(sreg.int'left);

          end if;

          end if;

        when S_ROUND => -- rounding cycle

        when S_ROUND => -- rounding cycle

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl.rounded    <= ctrl.rounded or round.en;

          ctrl.rounded    <= ctrl.rounded or round.en;

          ctrl.over       <= ctrl.over or round.output(round.output'left); -- overflow after rounding

          ctrl.over       <= ctrl.over or round.output(round.output'left); -- overflow after rounding

          ctrl.result_tmp <= round.output(round.output'left-1 downto 0);

          ctrl.result_tmp <= round.output(round.output'left-1 downto 0);

          ctrl.state      <= S_FINALIZE;

          ctrl.state      <= S_FINALIZE;

        when S_FINALIZE => -- check for corner cases and finalize result

        when S_FINALIZE => -- check for corner cases and finalize result

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          if (ctrl.unsign = '1') then -- unsigned conversion

          if (ctrl.unsign = '1') then -- unsigned conversion

            if (ctrl.class(fp_class_snan_c) = '1') or (ctrl.class(fp_class_qnan_c) = '1') or (ctrl.class(fp_class_pos_inf_c) = '1') or -- NaN or +inf

            if (ctrl.class(fp_class_snan_c) = '1') or (ctrl.class(fp_class_qnan_c) = '1') or (ctrl.class(fp_class_pos_inf_c) = '1') or -- NaN or +inf

               ((ctrl.sign = '0') and (ctrl.over = '1')) then -- positive out-of-range

               ((ctrl.sign = '0') and (ctrl.over = '1')) then -- positive out-of-range

              ctrl.result <= x"ffffffff";

              ctrl.result <= x"ffffffff";

            elsif (ctrl.class(fp_class_neg_zero_c) = '1') or (ctrl.class(fp_class_pos_zero_c) = '1') or (ctrl.class(fp_class_neg_inf_c) = '1') or -- subnormal zero or -inf

            elsif (ctrl.class(fp_class_neg_zero_c) = '1') or (ctrl.class(fp_class_pos_zero_c) = '1') or (ctrl.class(fp_class_neg_inf_c) = '1') or -- subnormal zero or -inf

               (ctrl.sign = '1') or (ctrl.under = '1') then -- negative out-of-range or underflow

               (ctrl.sign = '1') or (ctrl.under = '1') then -- negative out-of-range or underflow

              ctrl.result <= x"00000000";

              ctrl.result <= x"00000000";

            else

            else

              ctrl.result <= ctrl.result_tmp;

              ctrl.result <= ctrl.result_tmp;

            end if;

            end if;

          else -- signed conversion

          else -- signed conversion

            if (ctrl.class(fp_class_snan_c) = '1') or (ctrl.class(fp_class_qnan_c) = '1') or (ctrl.class(fp_class_pos_inf_c) = '1') or  -- NaN or +inf

            if (ctrl.class(fp_class_snan_c) = '1') or (ctrl.class(fp_class_qnan_c) = '1') or (ctrl.class(fp_class_pos_inf_c) = '1') or  -- NaN or +inf

                  ((ctrl.sign = '0') and (ctrl.over = '1')) then -- positive out-of-range

                  ((ctrl.sign = '0') and (ctrl.over = '1')) then -- positive out-of-range

              ctrl.result <= x"7fffffff";

              ctrl.result <= x"7fffffff";

            elsif (ctrl.class(fp_class_neg_zero_c) = '1') or (ctrl.class(fp_class_pos_zero_c) = '1') or (ctrl.under = '1') then -- subnormal zero or underflow

            elsif (ctrl.class(fp_class_neg_zero_c) = '1') or (ctrl.class(fp_class_pos_zero_c) = '1') or (ctrl.under = '1') then -- subnormal zero or underflow

              ctrl.result <= x"00000000";

              ctrl.result <= x"00000000";

            elsif (ctrl.class(fp_class_neg_inf_c) = '1') or ((ctrl.sign = '1') and (ctrl.over = '1')) then -- -inf or negative out-of-range

            elsif (ctrl.class(fp_class_neg_inf_c) = '1') or ((ctrl.sign = '1') and (ctrl.over = '1')) then -- -inf or negative out-of-range

              ctrl.result <= x"80000000";

              ctrl.result <= x"80000000";

            else -- result is ok, make sign adaption

            else -- result is ok, make sign adaption

              if (ctrl.sign = '1') then

              if (ctrl.sign = '1') then

                ctrl.result <= std_ulogic_vector(0 - unsigned(ctrl.result_tmp)); -- abs()

                ctrl.result <= std_ulogic_vector(0 - unsigned(ctrl.result_tmp)); -- abs()

              else

              else

                ctrl.result <= ctrl.result_tmp;

                ctrl.result <= ctrl.result_tmp;

              end if;

              end if;

            end if;

            end if;

          end if;

          end if;

          done_o     <= '1';

          done_o     <= '1';

          ctrl.state <= S_IDLE;

          ctrl.state <= S_IDLE;

        when others => -- undefined

        when others => -- undefined

        -- ------------------------------------------------------------

        -- ------------------------------------------------------------

          ctrl.state <= S_IDLE;

          ctrl.state <= S_IDLE;

      end case;

      end case;

    end if;

    end if;

  end process ctrl_engine;

  end process ctrl_engine;

  -- result --

  -- result --

  result_o <= ctrl.result;

  result_o <= ctrl.result;

  -- exception flags --

  -- exception flags --

  flags_o(fp_exc_nv_c) <= ctrl.class(fp_class_snan_c) or ctrl.class(fp_class_qnan_c); -- invalid operation

  flags_o(fp_exc_nv_c) <= ctrl.class(fp_class_snan_c) or ctrl.class(fp_class_qnan_c); -- invalid operation

  flags_o(fp_exc_dz_c) <= '0'; -- divide by zero - not possible here

  flags_o(fp_exc_dz_c) <= '0'; -- divide by zero - not possible here

  flags_o(fp_exc_of_c) <= ctrl.over or ctrl.class(fp_class_pos_inf_c) or ctrl.class(fp_class_neg_inf_c); -- overflow

  flags_o(fp_exc_of_c) <= ctrl.over or ctrl.class(fp_class_pos_inf_c) or ctrl.class(fp_class_neg_inf_c); -- overflow

  flags_o(fp_exc_uf_c) <= ctrl.under; -- underflow

  flags_o(fp_exc_uf_c) <= ctrl.under; -- underflow

  flags_o(fp_exc_nx_c) <= ctrl.rounded; -- inexact if result was rounded

  flags_o(fp_exc_nx_c) <= ctrl.rounded; -- inexact if result was rounded

  -- Rounding -------------------------------------------------------------------------------

  -- Rounding -------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  -- -------------------------------------------------------------------------------------------

  rounding_unit_ctrl: process(rmode_i, sreg)

  rounding_unit_ctrl: process(rmode_i, sreg)

  begin

  begin

    -- defaults --

    -- defaults --

    round.en  <= '0';

    round.en  <= '0';

    round.sub <= '0';

    round.sub <= '0';

    -- rounding mode --

    -- rounding mode --

    case rmode_i(2 downto 0) is

    case rmode_i(2 downto 0) is

      when "000" => -- round to nearest, ties to even

      when "000" => -- round to nearest, ties to even

        if (sreg.ext_g = '0') then

        if (sreg.ext_g = '0') then

          round.en <= '0'; -- round down (do nothing)

          round.en <= '0'; -- round down (do nothing)

        else

        else

          if (sreg.ext_r = '0') and (sreg.ext_s = '0') then -- tie!

          if (sreg.ext_r = '0') and (sreg.ext_s = '0') then -- tie!

            round.en <= sreg.int(0); -- round up if LSB of integer is set

            round.en <= sreg.int(0); -- round up if LSB of integer is set

          else

          else

            round.en <= '1'; -- round up

            round.en <= '1'; -- round up

          end if;

          end if;

        end if;

        end if;

        round.sub <= '0'; -- increment

        round.sub <= '0'; -- increment

      when "001" => -- round towards zero

      when "001" => -- round towards zero

        round.en <= '0'; -- no rounding -> just truncate

        round.en <= '0'; -- no rounding -> just truncate

      when "010" => -- round down (towards -infinity)

      when "010" => -- round down (towards -infinity)

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.sub <= '1'; -- decrement

        round.sub <= '1'; -- decrement

      when "011" => -- round up (towards +infinity)

      when "011" => -- round up (towards +infinity)

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.en  <= sreg.ext_g or sreg.ext_r or sreg.ext_s;

        round.sub <= '0'; -- increment

        round.sub <= '0'; -- increment

      when "100" => -- round to nearest, ties to max magnitude

      when "100" => -- round to nearest, ties to max magnitude

        round.en <= '0'; -- FIXME / TODO

        round.en <= '0'; -- FIXME / TODO

      when others => -- undefined

      when others => -- undefined

        round.en <= '0';

        round.en <= '0';

    end case;

    end case;

  end process rounding_unit_ctrl;

  end process rounding_unit_ctrl;

  -- rounding: guard and round bits --

  -- rounding: guard and round bits --

  sreg.ext_g <= sreg.mant(sreg.mant'left);

  sreg.ext_g <= sreg.mant(sreg.mant'left);

  sreg.ext_r <= sreg.mant(sreg.mant'left-1);

  sreg.ext_r <= sreg.mant(sreg.mant'left-1);

  -- incrementer/decrementer --

  -- incrementer/decrementer --

  rounding_unit_add: process(round, sreg)

  rounding_unit_add: process(round, sreg)

    variable tmp_v : std_ulogic_vector(32 downto 0); -- including overflow

    variable tmp_v : std_ulogic_vector(32 downto 0); -- including overflow

  begin

  begin

    tmp_v := '0' & sreg.int;

    tmp_v := '0' & sreg.int;

    if (round.en = '1') then

    if (round.en = '1') then

      if (round.sub = '0') then -- increment

      if (round.sub = '0') then -- increment

        round.output <= std_ulogic_vector(unsigned(tmp_v) + 1);

        round.output <= std_ulogic_vector(unsigned(tmp_v) + 1);

      else -- decrement

      else -- decrement

        round.output <= std_ulogic_vector(unsigned(tmp_v) - 1);

        round.output <= std_ulogic_vector(unsigned(tmp_v) - 1);

      end if;

      end if;

    else -- do nothing

    else -- do nothing

      round.output <= tmp_v;

      round.output <= tmp_v;

    end if;

    end if;

  end process rounding_unit_add;

  end process rounding_unit_add;

end neorv32_cpu_cp_fpu_f2i_rtl;

end neorv32_cpu_cp_fpu_f2i_rtl;

Browse

Tools

Subversion Repositories neorv32

[/] [neorv32/] [trunk/] [rtl/] [core/] [neorv32_cpu_cp_fpu.vhd] - Diff between revs 73 and 74