OpenCores

Rev 12	Rev 21
`--------------------------------------------------------------------------------`	`--------------------------------------------------------------------------------`
`-- mips_mult.vhdl -- multiplier from Plasma project, slightly modified.`	`-- mips_mult.vhdl -- multiplier from Plasma project, slightly modified.`
`--`	`--`
`-- The original file from Plasma has been adapted to the Ion core. Changes are`	`-- The original file from Plasma has been adapted to the Ion core. Changes are`
`-- tagged with '@ion'. There are a few notes at the end of the file with the`	`-- tagged with '@ion'. There are a few notes at the end of the file with the`
`-- rationale for the changes -- useful only if any trouble shows up later.`	`-- rationale for the changes -- useful only if any trouble shows up later.`
`-- The structure has not changed, only a few implementation details.`	`-- The structure has not changed, only a few implementation details.`
`--------------------------------------------------------------------------------`	`--------------------------------------------------------------------------------`
`---------------------------------------------------------------------`	`---------------------------------------------------------------------`
`-- TITLE: Multiplication and Division Unit`	`-- TITLE: Multiplication and Division Unit`
`-- AUTHORS: Steve Rhoads (rhoadss@yahoo.com)`	`-- AUTHORS: Steve Rhoads (rhoadss@yahoo.com)`
`-- DATE CREATED: 1/31/01`	`-- DATE CREATED: 1/31/01`
`-- FILENAME: mult.vhd`	`-- FILENAME: mult.vhd`
`-- PROJECT: Plasma CPU core`	`-- PROJECT: Plasma CPU core`
`-- COPYRIGHT: Software placed into the public domain by the author.`	`-- COPYRIGHT: Software placed into the public domain by the author.`
`-- Software 'as is' without warranty. Author liable for nothing.`	`-- Software 'as is' without warranty. Author liable for nothing.`
`-- DESCRIPTION:`	`-- DESCRIPTION:`
`-- Implements the multiplication and division unit in 32 clocks.`	`-- Implements the multiplication and division unit in 32 clocks.`
`--`	`--`
`-- To reduce space, compile your code using the flag "-mno-mul" which`	`-- To reduce space, compile your code using the flag "-mno-mul" which`
`-- will use software base routines in math.c if USE_SW_MULT is defined.`	`-- will use software base routines in math.c if USE_SW_MULT is defined.`
`-- Then remove references to the entity mult in mlite_cpu.vhd.`	`-- Then remove references to the entity mult in mlite_cpu.vhd.`
`--`	`--`
`-- MULTIPLICATION`	`-- MULTIPLICATION`
`-- long64 answer = 0`	`-- long64 answer = 0`
`-- for(i = 0; i < 32; ++i)`	`-- for(i = 0; i < 32; ++i)`
`-- {`	`-- {`
`-- answer = (answer >> 1) + (((b&1)?a:0) << 31);`	`-- answer = (answer >> 1) + (((b&1)?a:0) << 31);`
`-- b = b >> 1;`	`-- b = b >> 1;`
`-- }`	`-- }`
`--`	`--`
`-- DIVISION`	`-- DIVISION`
`-- long upper=a, lower=0;`	`-- long upper=a, lower=0;`
`-- a = b << 31;`	`-- a = b << 31;`
`-- for(i = 0; i < 32; ++i)`	`-- for(i = 0; i < 32; ++i)`
`-- {`	`-- {`
`-- lower = lower << 1;`	`-- lower = lower << 1;`
`-- if(upper >= a && a && b < 2)`	`-- if(upper >= a && a && b < 2)`
`-- {`	`-- {`
`-- upper = upper - a;`	`-- upper = upper - a;`
`-- lower \|= 1;`	`-- lower \|= 1;`
`-- }`	`-- }`
`-- a = ((b&2) << 30) \| (a >> 1);`	`-- a = ((b&2) << 30) \| (a >> 1);`
`-- b = b >> 1;`	`-- b = b >> 1;`
`-- }`	`-- }`
`---------------------------------------------------------------------`	`---------------------------------------------------------------------`
`library ieee;`	`library ieee;`
`use ieee.std_logic_1164.all;`	`use ieee.std_logic_1164.all;`
`use ieee.std_logic_unsigned.all;`	`use ieee.std_logic_unsigned.all;`
`use IEEE.std_logic_arith.all;`	`use IEEE.std_logic_arith.all;`
`use work.mips_pkg.all;`	`use work.mips_pkg.all;`

`entity mips_mult is`	`entity mips_mult is`
`generic(mult_type : string := "DEFAULT");`	`generic(mult_type : string := "DEFAULT");`
`port(clk : in std_logic;`	`port(clk : in std_logic;`
`reset_in : in std_logic;`	`reset_in : in std_logic;`
`a, b : in std_logic_vector(31 downto 0);`	`a, b : in std_logic_vector(31 downto 0);`
`mult_func : in t_mult_function;`	`mult_func : in t_mult_function;`
`c_mult : out std_logic_vector(31 downto 0);`	`c_mult : out std_logic_vector(31 downto 0);`
`pause_out : out std_logic);`	`pause_out : out std_logic);`
`end; --entity mult`	`end; --entity mult`

`architecture logic of mips_mult is`	`architecture logic of mips_mult is`

`constant MODE_MULT : std_logic := '1';`	`constant MODE_MULT : std_logic := '1';`
`constant MODE_DIV : std_logic := '0';`	`constant MODE_DIV : std_logic := '0';`

`signal mode_reg : std_logic;`	`signal mode_reg : std_logic;`
`signal negate_reg : std_logic;`	`signal negate_reg : std_logic;`
`signal sign_reg : std_logic;`	`signal sign_reg : std_logic;`
`signal sign2_reg : std_logic;`	`signal sign2_reg : std_logic;`
`signal count_reg : std_logic_vector(5 downto 0);`	`signal count_reg : std_logic_vector(5 downto 0);`
`signal aa_reg : std_logic_vector(31 downto 0);`	`signal aa_reg : std_logic_vector(31 downto 0);`
`signal bb_reg : std_logic_vector(31 downto 0);`	`signal bb_reg : std_logic_vector(31 downto 0);`
`signal upper_reg : std_logic_vector(31 downto 0);`	`signal upper_reg : std_logic_vector(31 downto 0);`
`signal lower_reg : std_logic_vector(31 downto 0);`	`signal lower_reg : std_logic_vector(31 downto 0);`

`signal a_neg : std_logic_vector(31 downto 0);`	`signal a_neg : std_logic_vector(31 downto 0);`
`signal b_neg : std_logic_vector(31 downto 0);`	`signal b_neg : std_logic_vector(31 downto 0);`
`signal sum : std_logic_vector(32 downto 0);`	`signal sum : std_logic_vector(32 downto 0);`
`signal sum_a : std_logic_vector(32 downto 0);`	`signal sum_a : std_logic_vector(32 downto 0);`
`signal sum_b : std_logic_vector(32 downto 0);`	`signal sum_b : std_logic_vector(32 downto 0);`

`begin`	`begin`

`-- @ion Output mux no longer uses function bv_negate. Removing one input that`	`-- @ion Output mux no longer uses function bv_negate. Removing one input that`
`-- is no longer needed, even if constant, may help in some FPGA architectures`	`-- is no longer needed, even if constant, may help in some FPGA architectures`
`-- too.`	`-- too.`
`-- See @note2`	`-- See @note2`
`-- Result`	`-- Result`
`c_mult <= lower_reg when mult_func = MULT_READ_LO and`	`c_mult <= lower_reg when mult_func = MULT_READ_LO and`
`negate_reg = '0' else`	`negate_reg = '0' else`
`not(lower_reg) + 1 when mult_func = MULT_READ_LO and`	`not(lower_reg) + 1 when mult_func = MULT_READ_LO and`
`--bv_negate(lower_reg) when mult_func = MULT_READ_LO and`	`--bv_negate(lower_reg) when mult_func = MULT_READ_LO and`
`negate_reg = '1' else`	`negate_reg = '1' else`
`upper_reg; -- when mult_func = MULT_READ_HI else`	`upper_reg; -- when mult_func = MULT_READ_HI else`
`--ZERO;`	`--ZERO;`

`-- @ion Stall pipeline while operation completes even if output is not needed`	`-- @ion Stall pipeline while operation completes even if output is not needed`
`-- immediately.`	`-- immediately.`
`-- See @note3`	`-- See @note3`
`pause_out <= '1' when (count_reg(5 downto 0) /= "000000") else '0'; --and`	`pause_out <= '1' when (count_reg(5 downto 0) /= "000000") else '0'; --and`
`--(mult_func = MULT_READ_LO or mult_func = MULT_READ_HI) else '0';`	`--(mult_func = MULT_READ_LO or mult_func = MULT_READ_HI) else '0';`

`-- ABS and remainder signals`	`-- ABS and remainder signals`
`a_neg <= not(a) + 1; --bv_negate(a); -- @ion @note2`	`a_neg <= not(a) + 1; --bv_negate(a); -- @ion @note2`
`b_neg <= not(b) + 1; --bv_negate(b); -- @ion @note2`	`b_neg <= not(b) + 1; --bv_negate(b); -- @ion @note2`

`-- @ion Replaced function bv_adder with straight vector code`	`-- @ion Replaced function bv_adder with straight vector code`
`--sum <= bv_adder(upper_reg, aa_reg, mode_reg);`	`--sum <= bv_adder(upper_reg, aa_reg, mode_reg);`
`sum_a <= ('0' & upper_reg); -- No sign extension: MSB of sum is special`	`sum_a <= ('0' & upper_reg); -- No sign extension: MSB of sum is special`
`sum_b <= ('0' & aa_reg);`	`sum_b <= ('0' & aa_reg);`
`with mode_reg select sum <=`	`with mode_reg select sum <=`
`sum_a + sum_b when '1',`	`sum_a + sum_b when '1',`
`sum_a - sum_b when others;`	`sum_a - sum_b when others;`

`--multiplication/division unit`	`--multiplication/division unit`
`mult_proc: process(clk, reset_in, a, b, mult_func,`	`mult_proc: process(clk, reset_in, a, b, mult_func,`
`a_neg, b_neg, sum, sign_reg, mode_reg, negate_reg,`	`a_neg, b_neg, sum, sign_reg, mode_reg, negate_reg,`
`count_reg, aa_reg, bb_reg, upper_reg, lower_reg)`	`count_reg, aa_reg, bb_reg, upper_reg, lower_reg)`
`variable count : std_logic_vector(2 downto 0);`	`variable count : std_logic_vector(2 downto 0);`
`begin`	`begin`
`count := "001";`	`count := "001";`
	`-- @ion Old asynchronous reset converted to synchronous, for consistency`
	`-- (Code indenting mangled by the new 'if' level)`
	`--if reset_in = '1' then`
	`if rising_edge(clk) then`
`if reset_in = '1' then`	`if reset_in = '1' then`
`mode_reg <= '0';`	`mode_reg <= '0';`
`negate_reg <= '0';`	`negate_reg <= '0';`
`sign_reg <= '0';`	`sign_reg <= '0';`
`sign2_reg <= '0';`	`sign2_reg <= '0';`
`count_reg <= "000000";`	`count_reg <= "000000";`
`aa_reg <= ZERO;`	`aa_reg <= ZERO;`
`bb_reg <= ZERO;`	`bb_reg <= ZERO;`
`upper_reg <= ZERO;`	`upper_reg <= ZERO;`
`lower_reg <= ZERO;`	`lower_reg <= ZERO;`
`elsif rising_edge(clk) then`	`--elsif rising_edge(clk) then`
	`else`
`case mult_func is`	`case mult_func is`
`when MULT_WRITE_LO =>`	`when MULT_WRITE_LO =>`
`lower_reg <= a;`	`lower_reg <= a;`
`negate_reg <= '0';`	`negate_reg <= '0';`
`when MULT_WRITE_HI =>`	`when MULT_WRITE_HI =>`
`upper_reg <= a;`	`upper_reg <= a;`
`negate_reg <= '0';`	`negate_reg <= '0';`
`when MULT_MULT =>`	`when MULT_MULT =>`
`mode_reg <= MODE_MULT;`	`mode_reg <= MODE_MULT;`
`aa_reg <= a;`	`aa_reg <= a;`
`bb_reg <= b;`	`bb_reg <= b;`
`upper_reg <= ZERO;`	`upper_reg <= ZERO;`
`count_reg <= "100000";`	`count_reg <= "100000";`
`negate_reg <= '0';`	`negate_reg <= '0';`
`sign_reg <= '0';`	`sign_reg <= '0';`
`sign2_reg <= '0';`	`sign2_reg <= '0';`
`when MULT_SIGNED_MULT =>`	`when MULT_SIGNED_MULT =>`
`mode_reg <= MODE_MULT;`	`mode_reg <= MODE_MULT;`
`if b(31) = '0' then`	`if b(31) = '0' then`
`aa_reg <= a;`	`aa_reg <= a;`
`bb_reg <= b;`	`bb_reg <= b;`
`sign_reg <= a(31);`	`sign_reg <= a(31);`
`else`	`else`
`aa_reg <= a_neg;`	`aa_reg <= a_neg;`
`bb_reg <= b_neg;`	`bb_reg <= b_neg;`
`sign_reg <= a_neg(31);`	`sign_reg <= a_neg(31);`
`end if;`	`end if;`
`sign2_reg <= '0';`	`sign2_reg <= '0';`
`upper_reg <= ZERO;`	`upper_reg <= ZERO;`
`count_reg <= "100000";`	`count_reg <= "100000";`
`negate_reg <= '0';`	`negate_reg <= '0';`
`when MULT_DIVIDE =>`	`when MULT_DIVIDE =>`
`mode_reg <= MODE_DIV;`	`mode_reg <= MODE_DIV;`
`aa_reg <= b(0) & ZERO(30 downto 0);`	`aa_reg <= b(0) & ZERO(30 downto 0);`
`bb_reg <= b;`	`bb_reg <= b;`
`upper_reg <= a;`	`upper_reg <= a;`
`count_reg <= "100000";`	`count_reg <= "100000";`
`negate_reg <= '0';`	`negate_reg <= '0';`
`when MULT_SIGNED_DIVIDE =>`	`when MULT_SIGNED_DIVIDE =>`
`mode_reg <= MODE_DIV;`	`mode_reg <= MODE_DIV;`
`if b(31) = '0' then`	`if b(31) = '0' then`
`aa_reg(31) <= b(0);`	`aa_reg(31) <= b(0);`
`bb_reg <= b;`	`bb_reg <= b;`
`else`	`else`
`aa_reg(31) <= b_neg(0);`	`aa_reg(31) <= b_neg(0);`
`bb_reg <= b_neg;`	`bb_reg <= b_neg;`
`end if;`	`end if;`
`if a(31) = '0' then`	`if a(31) = '0' then`
`upper_reg <= a;`	`upper_reg <= a;`
`else`	`else`
`upper_reg <= a_neg;`	`upper_reg <= a_neg;`
`end if;`	`end if;`
`aa_reg(30 downto 0) <= ZERO(30 downto 0);`	`aa_reg(30 downto 0) <= ZERO(30 downto 0);`
`count_reg <= "100000";`	`count_reg <= "100000";`
`negate_reg <= a(31) xor b(31);`	`negate_reg <= a(31) xor b(31);`
`when others =>`	`when others =>`

`if count_reg /= "000000" then`	`if count_reg /= "000000" then`
`if mode_reg = MODE_MULT then`	`if mode_reg = MODE_MULT then`
`-- Multiplication`	`-- Multiplication`
`if bb_reg(0) = '1' then`	`if bb_reg(0) = '1' then`
`upper_reg <= (sign_reg xor sum(32)) & sum(31 downto 1);`	`upper_reg <= (sign_reg xor sum(32)) & sum(31 downto 1);`
`lower_reg <= sum(0) & lower_reg(31 downto 1);`	`lower_reg <= sum(0) & lower_reg(31 downto 1);`
`sign2_reg <= sign2_reg or sign_reg;`	`sign2_reg <= sign2_reg or sign_reg;`
`sign_reg <= '0';`	`sign_reg <= '0';`
`bb_reg <= '0' & bb_reg(31 downto 1);`	`bb_reg <= '0' & bb_reg(31 downto 1);`
`-- The following six lines are optional for speedup`	`-- The following six lines are optional for speedup`
`--elsif bb_reg(3 downto 0) = "0000" and sign2_reg = '0' and`	`--elsif bb_reg(3 downto 0) = "0000" and sign2_reg = '0' and`
`-- count_reg(5 downto 2) /= "0000" then`	`-- count_reg(5 downto 2) /= "0000" then`
`-- upper_reg <= "0000" & upper_reg(31 downto 4);`	`-- upper_reg <= "0000" & upper_reg(31 downto 4);`
`-- lower_reg <= upper_reg(3 downto 0) & lower_reg(31 downto 4);`	`-- lower_reg <= upper_reg(3 downto 0) & lower_reg(31 downto 4);`
`-- count := "100";`	`-- count := "100";`
`-- bb_reg <= "0000" & bb_reg(31 downto 4);`	`-- bb_reg <= "0000" & bb_reg(31 downto 4);`
`else`	`else`
`upper_reg <= sign2_reg & upper_reg(31 downto 1);`	`upper_reg <= sign2_reg & upper_reg(31 downto 1);`
`lower_reg <= upper_reg(0) & lower_reg(31 downto 1);`	`lower_reg <= upper_reg(0) & lower_reg(31 downto 1);`
`bb_reg <= '0' & bb_reg(31 downto 1);`	`bb_reg <= '0' & bb_reg(31 downto 1);`
`end if;`	`end if;`
`else`	`else`
`-- Division`	`-- Division`
`if sum(32) = '0' and aa_reg /= ZERO and`	`if sum(32) = '0' and aa_reg /= ZERO and`
`bb_reg(31 downto 1) = ZERO(31 downto 1) then`	`bb_reg(31 downto 1) = ZERO(31 downto 1) then`
`upper_reg <= sum(31 downto 0);`	`upper_reg <= sum(31 downto 0);`
`lower_reg(0) <= '1';`	`lower_reg(0) <= '1';`
`else`	`else`
`lower_reg(0) <= '0';`	`lower_reg(0) <= '0';`
`end if;`	`end if;`
`aa_reg <= bb_reg(1) & aa_reg(31 downto 1);`	`aa_reg <= bb_reg(1) & aa_reg(31 downto 1);`
`lower_reg(31 downto 1) <= lower_reg(30 downto 0);`	`lower_reg(31 downto 1) <= lower_reg(30 downto 0);`
`bb_reg <= '0' & bb_reg(31 downto 1);`	`bb_reg <= '0' & bb_reg(31 downto 1);`
`end if;`	`end if;`
`count_reg <= count_reg - count;`	`count_reg <= count_reg - count;`
`end if; --count`	`end if; --count`

`end case;`	`end case;`

`end if;`	`end if;`
	`end if;`

`end process;`	`end process;`

`end; --architecture logic`	`end; --architecture logic`

`--------------------------------------------------------------------------------`	`--------------------------------------------------------------------------------`
`-- @note1 : bv_adder function removed`	`-- @note1 : bv_adder function removed`
`-- This function was a slightly modified adder/substractor coded in a bitwise`	`-- This function was a slightly modified adder/substractor coded in a bitwise`
`-- manner that made it hard for synth tools to recognize it as such. At least`	`-- manner that made it hard for synth tools to recognize it as such. At least`
`-- that's what I think. Replacing it with straigth code results in smaller and`	`-- that's what I think. Replacing it with straigth code results in smaller and`
`-- faster logic (about 23% faster).`	`-- faster logic (about 23% faster).`
`--`	`--`
`-- @note2 : bv_negate function removed`	`-- @note2 : bv_negate function removed`
`-- This function computed a 2's complement bitwise. Removed on the same grounds`	`-- This function computed a 2's complement bitwise. Removed on the same grounds`
`-- as @note1 but with no apparent improvement in synthesis results.`	`-- as @note1 but with no apparent improvement in synthesis results.`
`--`	`--`
`-- @note3 : pause_out active until operation complete`	`-- @note3 : pause_out active until operation complete`
`-- The original Plasma module allowed the pipeline and the multiplier to run`	`-- The original Plasma module allowed the pipeline and the multiplier to run`
`-- concurrently until the multiplier result was needed, and only then the`	`-- concurrently until the multiplier result was needed, and only then the`
`-- pipeline was stalled.`	`-- pipeline was stalled if the mul/div operation had not finished yet.`
`-- We want to make sure we can abort a mul/div so for the time being we stall`	`-- We want to make sure we can abort a mul/div so for the time being we stall`
`-- until the operation is complete.`	`-- until the operation is complete.`
`-- note that if we later want to change this, the parent module will need`	`-- I think that's what the libraries and the toolchain assume anyway.`
	`-- Note that if we later want to change this, the parent module will need`
`-- changes too (logic for p1_muldiv_running).`	`-- changes too (logic for p1_muldiv_running).`

--------------------------------------------------------------------------------

--------------------------------------------------------------------------------

-- mips_mult.vhdl -- multiplier from Plasma project, slightly modified.

-- mips_mult.vhdl -- multiplier from Plasma project, slightly modified.

--

--

-- The original file from Plasma has been adapted to the Ion core. Changes are

-- The original file from Plasma has been adapted to the Ion core. Changes are

-- tagged with '@ion'. There are a few notes at the end of the file with the

-- tagged with '@ion'. There are a few notes at the end of the file with the

-- rationale for the changes -- useful only if any trouble shows up later.

-- rationale for the changes -- useful only if any trouble shows up later.

-- The structure has not changed, only a few implementation details.

-- The structure has not changed, only a few implementation details.

--------------------------------------------------------------------------------

--------------------------------------------------------------------------------

---------------------------------------------------------------------

---------------------------------------------------------------------

-- TITLE: Multiplication and Division Unit

-- TITLE: Multiplication and Division Unit

-- AUTHORS: Steve Rhoads (rhoadss@yahoo.com)

-- AUTHORS: Steve Rhoads (rhoadss@yahoo.com)

-- DATE CREATED: 1/31/01

-- DATE CREATED: 1/31/01

-- FILENAME: mult.vhd

-- FILENAME: mult.vhd

-- PROJECT: Plasma CPU core

-- PROJECT: Plasma CPU core

-- COPYRIGHT: Software placed into the public domain by the author.

-- COPYRIGHT: Software placed into the public domain by the author.

--    Software 'as is' without warranty.  Author liable for nothing.

--    Software 'as is' without warranty.  Author liable for nothing.

-- DESCRIPTION:

-- DESCRIPTION:

--    Implements the multiplication and division unit in 32 clocks.

--    Implements the multiplication and division unit in 32 clocks.

--

--

--    To reduce space, compile your code using the flag "-mno-mul" which

--    To reduce space, compile your code using the flag "-mno-mul" which

--    will use software base routines in math.c if USE_SW_MULT is defined.

--    will use software base routines in math.c if USE_SW_MULT is defined.

--    Then remove references to the entity mult in mlite_cpu.vhd.

--    Then remove references to the entity mult in mlite_cpu.vhd.

--

--

-- MULTIPLICATION

-- MULTIPLICATION

-- long64 answer = 0

-- long64 answer = 0

-- for(i = 0; i < 32; ++i)

-- for(i = 0; i < 32; ++i)

-- {

-- {

--    answer = (answer >> 1) + (((b&1)?a:0) << 31);

--    answer = (answer >> 1) + (((b&1)?a:0) << 31);

--    b = b >> 1;

--    b = b >> 1;

-- }

-- }

--

--

-- DIVISION

-- DIVISION

-- long upper=a, lower=0;

-- long upper=a, lower=0;

-- a = b << 31;

-- a = b << 31;

-- for(i = 0; i < 32; ++i)

-- for(i = 0; i < 32; ++i)

-- {

-- {

--    lower = lower << 1;

--    lower = lower << 1;

--    if(upper >= a && a && b < 2)

--    if(upper >= a && a && b < 2)

--    {

--    {

--       upper = upper - a;

--       upper = upper - a;

--       lower |= 1;

--       lower |= 1;

--    }

--    }

--    a = ((b&2) << 30) | (a >> 1);

--    a = ((b&2) << 30) | (a >> 1);

--    b = b >> 1;

--    b = b >> 1;

-- }

-- }

---------------------------------------------------------------------

---------------------------------------------------------------------

library ieee;

library ieee;

use ieee.std_logic_1164.all;

use ieee.std_logic_1164.all;

use ieee.std_logic_unsigned.all;

use ieee.std_logic_unsigned.all;

use IEEE.std_logic_arith.all;

use IEEE.std_logic_arith.all;

use work.mips_pkg.all;

use work.mips_pkg.all;

entity mips_mult is

entity mips_mult is

   generic(mult_type  : string := "DEFAULT");

   generic(mult_type  : string := "DEFAULT");

   port(clk       : in std_logic;

   port(clk       : in std_logic;

        reset_in  : in std_logic;

        reset_in  : in std_logic;

        a, b      : in std_logic_vector(31 downto 0);

        a, b      : in std_logic_vector(31 downto 0);

        mult_func : in t_mult_function;

        mult_func : in t_mult_function;

        c_mult    : out std_logic_vector(31 downto 0);

        c_mult    : out std_logic_vector(31 downto 0);

        pause_out : out std_logic);

        pause_out : out std_logic);

end; --entity mult

end; --entity mult

architecture logic of mips_mult is

architecture logic of mips_mult is

   constant MODE_MULT : std_logic := '1';

   constant MODE_MULT : std_logic := '1';

   constant MODE_DIV  : std_logic := '0';

   constant MODE_DIV  : std_logic := '0';

   signal mode_reg    : std_logic;

   signal mode_reg    : std_logic;

   signal negate_reg  : std_logic;

   signal negate_reg  : std_logic;

   signal sign_reg    : std_logic;

   signal sign_reg    : std_logic;

   signal sign2_reg   : std_logic;

   signal sign2_reg   : std_logic;

   signal count_reg   : std_logic_vector(5 downto 0);

   signal count_reg   : std_logic_vector(5 downto 0);

   signal aa_reg      : std_logic_vector(31 downto 0);

   signal aa_reg      : std_logic_vector(31 downto 0);

   signal bb_reg      : std_logic_vector(31 downto 0);

   signal bb_reg      : std_logic_vector(31 downto 0);

   signal upper_reg   : std_logic_vector(31 downto 0);

   signal upper_reg   : std_logic_vector(31 downto 0);

   signal lower_reg   : std_logic_vector(31 downto 0);

   signal lower_reg   : std_logic_vector(31 downto 0);

   signal a_neg       : std_logic_vector(31 downto 0);

   signal a_neg       : std_logic_vector(31 downto 0);

   signal b_neg       : std_logic_vector(31 downto 0);

   signal b_neg       : std_logic_vector(31 downto 0);

   signal sum         : std_logic_vector(32 downto 0);

   signal sum         : std_logic_vector(32 downto 0);

   signal sum_a       : std_logic_vector(32 downto 0);

   signal sum_a       : std_logic_vector(32 downto 0);

   signal sum_b       : std_logic_vector(32 downto 0);

   signal sum_b       : std_logic_vector(32 downto 0);

begin

begin

   -- @ion Output mux no longer uses function bv_negate. Removing one input that

   -- @ion Output mux no longer uses function bv_negate. Removing one input that

   -- is no longer needed, even if constant, may help in some FPGA architectures

   -- is no longer needed, even if constant, may help in some FPGA architectures

   -- too.

   -- too.

   -- See @note2

   -- See @note2

   -- Result

   -- Result

   c_mult <= lower_reg              when mult_func = MULT_READ_LO and

   c_mult <= lower_reg              when mult_func = MULT_READ_LO and

                                         negate_reg = '0' else

                                         negate_reg = '0' else

             not(lower_reg) + 1     when mult_func = MULT_READ_LO and

             not(lower_reg) + 1     when mult_func = MULT_READ_LO and

             --bv_negate(lower_reg)   when mult_func = MULT_READ_LO and

             --bv_negate(lower_reg)   when mult_func = MULT_READ_LO and

                                         negate_reg = '1' else

                                         negate_reg = '1' else

             upper_reg;             -- when mult_func = MULT_READ_HI else

             upper_reg;             -- when mult_func = MULT_READ_HI else

             --ZERO;

             --ZERO;

   -- @ion Stall pipeline while operation completes even if output is not needed

   -- @ion Stall pipeline while operation completes even if output is not needed

   -- immediately.

   -- immediately.

   -- See @note3

   -- See @note3

   pause_out <= '1' when (count_reg(5 downto 0) /= "000000") else '0'; --and

   pause_out <= '1' when (count_reg(5 downto 0) /= "000000") else '0'; --and

             --(mult_func = MULT_READ_LO or mult_func = MULT_READ_HI) else '0';

             --(mult_func = MULT_READ_LO or mult_func = MULT_READ_HI) else '0';

   -- ABS and remainder signals

   -- ABS and remainder signals

   a_neg <= not(a) + 1; --bv_negate(a); -- @ion @note2

   a_neg <= not(a) + 1; --bv_negate(a); -- @ion @note2

   b_neg <= not(b) + 1; --bv_negate(b); -- @ion @note2

   b_neg <= not(b) + 1; --bv_negate(b); -- @ion @note2

   -- @ion Replaced function bv_adder with straight vector code

   -- @ion Replaced function bv_adder with straight vector code

   --sum <= bv_adder(upper_reg, aa_reg, mode_reg);

   --sum <= bv_adder(upper_reg, aa_reg, mode_reg);

   sum_a <= ('0' & upper_reg); -- No sign extension: MSB of sum is special

   sum_a <= ('0' & upper_reg); -- No sign extension: MSB of sum is special

   sum_b <= ('0' & aa_reg);

   sum_b <= ('0' & aa_reg);

   with mode_reg select sum <=

   with mode_reg select sum <=

        sum_a + sum_b when '1',

        sum_a + sum_b when '1',

        sum_a - sum_b when others;

        sum_a - sum_b when others;

   --multiplication/division unit

   --multiplication/division unit

   mult_proc: process(clk, reset_in, a, b, mult_func,

   mult_proc: process(clk, reset_in, a, b, mult_func,

      a_neg, b_neg, sum, sign_reg, mode_reg, negate_reg,

      a_neg, b_neg, sum, sign_reg, mode_reg, negate_reg,

      count_reg, aa_reg, bb_reg, upper_reg, lower_reg)

      count_reg, aa_reg, bb_reg, upper_reg, lower_reg)

      variable count : std_logic_vector(2 downto 0);

      variable count : std_logic_vector(2 downto 0);

   begin

   begin

      count := "001";

      count := "001";

      -- @ion Old asynchronous reset converted to synchronous, for consistency

      -- (Code indenting mangled by the new 'if' level)

      --if reset_in = '1' then

      if rising_edge(clk) then

      if reset_in = '1' then

      if reset_in = '1' then

         mode_reg <= '0';

         mode_reg <= '0';

         negate_reg <= '0';

         negate_reg <= '0';

         sign_reg <= '0';

         sign_reg <= '0';

         sign2_reg <= '0';

         sign2_reg <= '0';

         count_reg <= "000000";

         count_reg <= "000000";

         aa_reg <= ZERO;

         aa_reg <= ZERO;

         bb_reg <= ZERO;

         bb_reg <= ZERO;

         upper_reg <= ZERO;

         upper_reg <= ZERO;

         lower_reg <= ZERO;

         lower_reg <= ZERO;

      elsif rising_edge(clk) then

      --elsif rising_edge(clk) then

      else

         case mult_func is

         case mult_func is

            when MULT_WRITE_LO =>

            when MULT_WRITE_LO =>

               lower_reg <= a;

               lower_reg <= a;

               negate_reg <= '0';

               negate_reg <= '0';

            when MULT_WRITE_HI =>

            when MULT_WRITE_HI =>

               upper_reg <= a;

               upper_reg <= a;

               negate_reg <= '0';

               negate_reg <= '0';

            when MULT_MULT =>

            when MULT_MULT =>

               mode_reg <= MODE_MULT;

               mode_reg <= MODE_MULT;

               aa_reg <= a;

               aa_reg <= a;

               bb_reg <= b;

               bb_reg <= b;

               upper_reg <= ZERO;

               upper_reg <= ZERO;

               count_reg <= "100000";

               count_reg <= "100000";

               negate_reg <= '0';

               negate_reg <= '0';

               sign_reg <= '0';

               sign_reg <= '0';

               sign2_reg <= '0';

               sign2_reg <= '0';

            when MULT_SIGNED_MULT =>

            when MULT_SIGNED_MULT =>

               mode_reg <= MODE_MULT;

               mode_reg <= MODE_MULT;

               if b(31) = '0' then

               if b(31) = '0' then

                  aa_reg <= a;

                  aa_reg <= a;

                  bb_reg <= b;

                  bb_reg <= b;

                  sign_reg <= a(31);

                  sign_reg <= a(31);

               else

               else

                  aa_reg <= a_neg;

                  aa_reg <= a_neg;

                  bb_reg <= b_neg;

                  bb_reg <= b_neg;

                  sign_reg <= a_neg(31);

                  sign_reg <= a_neg(31);

               end if;

               end if;

               sign2_reg <= '0';

               sign2_reg <= '0';

               upper_reg <= ZERO;

               upper_reg <= ZERO;

               count_reg <= "100000";

               count_reg <= "100000";

               negate_reg <= '0';

               negate_reg <= '0';

            when MULT_DIVIDE =>

            when MULT_DIVIDE =>

               mode_reg <= MODE_DIV;

               mode_reg <= MODE_DIV;

               aa_reg <= b(0) & ZERO(30 downto 0);

               aa_reg <= b(0) & ZERO(30 downto 0);

               bb_reg <= b;

               bb_reg <= b;

               upper_reg <= a;

               upper_reg <= a;

               count_reg <= "100000";

               count_reg <= "100000";

               negate_reg <= '0';

               negate_reg <= '0';

            when MULT_SIGNED_DIVIDE =>

            when MULT_SIGNED_DIVIDE =>

               mode_reg <= MODE_DIV;

               mode_reg <= MODE_DIV;

               if b(31) = '0' then

               if b(31) = '0' then

                  aa_reg(31) <= b(0);

                  aa_reg(31) <= b(0);

                  bb_reg <= b;

                  bb_reg <= b;

               else

               else

                  aa_reg(31) <= b_neg(0);

                  aa_reg(31) <= b_neg(0);

                  bb_reg <= b_neg;

                  bb_reg <= b_neg;

               end if;

               end if;

               if a(31) = '0' then

               if a(31) = '0' then

                  upper_reg <= a;

                  upper_reg <= a;

               else

               else

                  upper_reg <= a_neg;

                  upper_reg <= a_neg;

               end if;

               end if;

               aa_reg(30 downto 0) <= ZERO(30 downto 0);

               aa_reg(30 downto 0) <= ZERO(30 downto 0);

               count_reg <= "100000";

               count_reg <= "100000";

               negate_reg <= a(31) xor b(31);

               negate_reg <= a(31) xor b(31);

            when others =>

            when others =>

               if count_reg /= "000000" then

               if count_reg /= "000000" then

                  if mode_reg = MODE_MULT then

                  if mode_reg = MODE_MULT then

                     -- Multiplication

                     -- Multiplication

                     if bb_reg(0) = '1' then

                     if bb_reg(0) = '1' then

                        upper_reg <= (sign_reg xor sum(32)) & sum(31 downto 1);

                        upper_reg <= (sign_reg xor sum(32)) & sum(31 downto 1);

                        lower_reg <= sum(0) & lower_reg(31 downto 1);

                        lower_reg <= sum(0) & lower_reg(31 downto 1);

                        sign2_reg <= sign2_reg or sign_reg;

                        sign2_reg <= sign2_reg or sign_reg;

                        sign_reg <= '0';

                        sign_reg <= '0';

                        bb_reg <= '0' & bb_reg(31 downto 1);

                        bb_reg <= '0' & bb_reg(31 downto 1);

                     -- The following six lines are optional for speedup

                     -- The following six lines are optional for speedup

                     --elsif bb_reg(3 downto 0) = "0000" and sign2_reg = '0' and

                     --elsif bb_reg(3 downto 0) = "0000" and sign2_reg = '0' and

                     --      count_reg(5 downto 2) /= "0000" then

                     --      count_reg(5 downto 2) /= "0000" then

                     --   upper_reg <= "0000" & upper_reg(31 downto 4);

                     --   upper_reg <= "0000" & upper_reg(31 downto 4);

                     --   lower_reg <=  upper_reg(3 downto 0) & lower_reg(31 downto 4);

                     --   lower_reg <=  upper_reg(3 downto 0) & lower_reg(31 downto 4);

                     --   count := "100";

                     --   count := "100";

                     --   bb_reg <= "0000" & bb_reg(31 downto 4);

                     --   bb_reg <= "0000" & bb_reg(31 downto 4);

                     else

                     else

                        upper_reg <= sign2_reg & upper_reg(31 downto 1);

                        upper_reg <= sign2_reg & upper_reg(31 downto 1);

                        lower_reg <= upper_reg(0) & lower_reg(31 downto 1);

                        lower_reg <= upper_reg(0) & lower_reg(31 downto 1);

                        bb_reg <= '0' & bb_reg(31 downto 1);

                        bb_reg <= '0' & bb_reg(31 downto 1);

                     end if;

                     end if;

                  else

                  else

                     -- Division

                     -- Division

                     if sum(32) = '0' and aa_reg /= ZERO and

                     if sum(32) = '0' and aa_reg /= ZERO and

                           bb_reg(31 downto 1) = ZERO(31 downto 1) then

                           bb_reg(31 downto 1) = ZERO(31 downto 1) then

                        upper_reg <= sum(31 downto 0);

                        upper_reg <= sum(31 downto 0);

                        lower_reg(0) <= '1';

                        lower_reg(0) <= '1';

                     else

                     else

                        lower_reg(0) <= '0';

                        lower_reg(0) <= '0';

                     end if;

                     end if;

                     aa_reg <= bb_reg(1) & aa_reg(31 downto 1);

                     aa_reg <= bb_reg(1) & aa_reg(31 downto 1);

                     lower_reg(31 downto 1) <= lower_reg(30 downto 0);

                     lower_reg(31 downto 1) <= lower_reg(30 downto 0);

                     bb_reg <= '0' & bb_reg(31 downto 1);

                     bb_reg <= '0' & bb_reg(31 downto 1);

                  end if;

                  end if;

                  count_reg <= count_reg - count;

                  count_reg <= count_reg - count;

               end if; --count

               end if; --count

         end case;

         end case;

      end if;

      end if;

      end if;

   end process;

   end process;

end; --architecture logic

end; --architecture logic

--------------------------------------------------------------------------------

--------------------------------------------------------------------------------

-- @note1 : bv_adder function removed

-- @note1 : bv_adder function removed

-- This function was a slightly modified adder/substractor coded in a bitwise

-- This function was a slightly modified adder/substractor coded in a bitwise

-- manner that made it hard for synth tools to recognize it as such. At least

-- manner that made it hard for synth tools to recognize it as such. At least

-- that's what I think. Replacing it with straigth code results in smaller and

-- that's what I think. Replacing it with straigth code results in smaller and

-- faster logic (about 23% faster).

-- faster logic (about 23% faster).

--

--

-- @note2 : bv_negate function removed

-- @note2 : bv_negate function removed

-- This function computed a 2's complement bitwise. Removed on the same grounds

-- This function computed a 2's complement bitwise. Removed on the same grounds

-- as @note1 but with no apparent improvement in synthesis results.

-- as @note1 but with no apparent improvement in synthesis results.

--

--

-- @note3 : pause_out active until operation complete

-- @note3 : pause_out active until operation complete

-- The original Plasma module allowed the pipeline and the multiplier to run

-- The original Plasma module allowed the pipeline and the multiplier to run

-- concurrently until the multiplier result was needed, and only then the

-- concurrently until the multiplier result was needed, and only then the

-- pipeline was stalled.

-- pipeline was stalled if the mul/div operation had not finished yet.

-- We want to make sure we can abort a mul/div so for the time being we stall

-- We want to make sure we can abort a mul/div so for the time being we stall

-- until the operation is complete.

-- until the operation is complete.

-- note that if we later want to change this, the parent module will need

-- I *think* that's what the libraries and the toolchain assume anyway.

-- Note that if we later want to change this, the parent module will need

-- changes too (logic for p1_muldiv_running).

-- changes too (logic for p1_muldiv_running).

Browse

Tools

Subversion Repositories ion

[/] [ion/] [trunk/] [vhdl/] [mips_mult.vhdl] - Diff between revs 12 and 21