1 |
69 |
rhoads |
---------------------------------------------------------------------
|
2 |
|
|
-- TITLE: Pipeline
|
3 |
|
|
-- AUTHOR: Steve Rhoads (rhoadss@yahoo.com)
|
4 |
|
|
-- DATE CREATED: 6/24/02
|
5 |
|
|
-- FILENAME: pipeline.vhd
|
6 |
|
|
-- PROJECT: Plasma CPU core
|
7 |
|
|
-- COPYRIGHT: Software placed into the public domain by the author.
|
8 |
|
|
-- Software 'as is' without warranty. Author liable for nothing.
|
9 |
|
|
-- DESCRIPTION:
|
10 |
|
|
-- Controls the three stage pipeline by delaying the signals:
|
11 |
|
|
-- a_bus, b_bus, alu/shift/mult_func, c_source, and rd_index.
|
12 |
|
|
---------------------------------------------------------------------
|
13 |
|
|
library ieee;
|
14 |
|
|
use ieee.std_logic_1164.all;
|
15 |
|
|
use work.mlite_pack.all;
|
16 |
|
|
|
17 |
|
|
--Note: sigD <= sig after rising_edge(clk)
|
18 |
|
|
-- Pipeline delay stage for the three stage pipeline.
-- Ports named <sig>D carry the version of <sig> that this unit hands to the
-- next stage (see the architecture for which are registered and which are
-- multiplexed).
entity pipeline is
   port(
      -- Clock and asynchronous, active-high reset
      clk            : in  std_logic;
      reset          : in  std_logic;

      -- Operand buses and their delayed counterparts
      a_bus          : in  std_logic_vector(31 downto 0);
      a_busD         : out std_logic_vector(31 downto 0);
      b_bus          : in  std_logic_vector(31 downto 0);
      b_busD         : out std_logic_vector(31 downto 0);

      -- Function selects for the ALU, shifter and multiplier
      alu_func       : in  alu_function_type;
      alu_funcD      : out alu_function_type;
      shift_func     : in  shift_function_type;
      shift_funcD    : out shift_function_type;
      mult_func      : in  mult_function_type;
      mult_funcD     : out mult_function_type;

      -- Register write-back value and destination index
      reg_dest       : in  std_logic_vector(31 downto 0);
      reg_destD      : out std_logic_vector(31 downto 0);
      rd_index       : in  std_logic_vector(5 downto 0);
      rd_indexD      : out std_logic_vector(5 downto 0);

      -- Source register indexes, compared against the delayed rd_index
      rs_index       : in  std_logic_vector(5 downto 0);
      rt_index       : in  std_logic_vector(5 downto 0);

      -- Control selects examined by the pause and bypass logic
      pc_source      : in  pc_source_type;
      mem_source     : in  mem_source_type;
      a_source       : in  a_source_type;
      b_source       : in  b_source_type;
      c_source       : in  c_source_type;
      c_bus          : in  std_logic_vector(31 downto 0);

      -- Pause handshake
      pause_any      : in  std_logic;
      pause_pipeline : out std_logic
   );
end pipeline;
|
47 |
|
|
|
48 |
|
|
architecture logic of pipeline is
   -- Registered copies of the write-back information
   signal rd_index_reg     : std_logic_vector(5 downto 0);
   signal reg_dest_reg     : std_logic_vector(31 downto 0);
   signal c_source_reg     : c_source_type;
   -- Write-back value after selecting between c_bus and reg_dest_reg
   signal reg_dest_delay   : std_logic_vector(31 downto 0);
   -- '1' while pause_pipeline is allowed to be asserted
   signal pause_enable_reg : std_logic;

   -- Returns '1' when the current control selects ask for a pipeline pause:
   -- the PC source is neither FROM_INC4 nor FROM_OPCODE25_0, the memory
   -- source is not MEM_FETCH, or the multiplier LO/HI result is being read.
   function stall_request(pc_sel   : pc_source_type;
                          mem_sel  : mem_source_type;
                          mult_sel : mult_function_type) return std_logic is
   begin
      if (pc_sel /= FROM_INC4 and pc_sel /= FROM_OPCODE25_0) or
         mem_sel /= MEM_FETCH or
         (mult_sel = MULT_READ_LO or mult_sel = MULT_READ_HI) then
         return '1';
      end if;
      return '0';
   end;

begin

   -- When operating in three stage pipeline mode, the following signals
   -- are delayed by one clock cycle: a_bus, b_bus, alu/shift/mult_func,
   -- c_source, and rd_index.

   -- A pause is only reported while pause_enable_reg is set.
   pause_pipeline <= stall_request(pc_source, mem_source, mult_func)
                     and pause_enable_reg;

   rd_indexD <= rd_index_reg;

   -- The value written back into the register bank (reg_dest) is tricky.
   -- When it comes from the ALU via c_bus it is already in stage #3, because
   -- a_busD and b_busD are delayed. When it comes from c_memory, pc_current,
   -- or pc_plus4 it has not yet been delayed into stage #3. Rather than
   -- delaying each of those sources, they are multiplexed into reg_dest,
   -- which is then delayed (reg_dest_reg). The delayed c_source
   -- (c_source_reg) chooses between the already delayed c_bus and
   -- reg_dest_reg.
   reg_dest_delay <= c_bus when c_source_reg = C_FROM_ALU  --delayed via a_busD & b_busD
                     else reg_dest_reg;                    --reg_dest delayed 1 clock cycle
   reg_destD <= reg_dest_delay;

   -- Stage registers with asynchronous reset.
   pipeline3: process(clk, reset)
      variable stall  : std_logic;   -- pause requested by the control selects
      variable freeze : std_logic;   -- hold the stage registers this cycle
   begin
      if reset = '1' then
         rd_index_reg     <= "000000";
         c_source_reg     <= "000";
         reg_dest_reg     <= ZERO;
         pause_enable_reg <= '0';
         a_busD           <= ZERO;
         b_busD           <= ZERO;
         alu_funcD        <= ALU_NOTHING;
         shift_funcD      <= SHIFT_NOTHING;
         mult_funcD       <= MULT_NOTHING;
      elsif rising_edge(clk) then
         stall  := stall_request(pc_source, mem_source, mult_func);
         -- Hold the registers when something else is pausing (pause_any)
         -- and this unit is not itself the one reporting the pause.
         freeze := not (stall and pause_enable_reg) and pause_any;

         if freeze = '0' then
            -- Plain one-cycle delays
            rd_index_reg <= rd_index;
            c_source_reg <= c_source;
            reg_dest_reg <= reg_dest;
            alu_funcD    <= alu_func;
            shift_funcD  <= shift_func;
            mult_funcD   <= mult_func;

            -- Bypass for operand A: use the pending write-back value when rs
            -- is a non-zero index equal to the delayed rd_index, A is taken
            -- from the register source, and pause_enable_reg is not '0'.
            if rs_index /= "000000" and rs_index = rd_index_reg and
               a_source = A_FROM_REG_SOURCE and pause_enable_reg /= '0' then
               a_busD <= reg_dest_delay;   --rs from previous operation (bypass stage)
            else
               a_busD <= a_bus;
            end if;

            -- Same bypass for operand B, keyed on rt_index and b_source.
            if rt_index /= "000000" and rt_index = rd_index_reg and
               b_source = B_FROM_REG_TARGET and pause_enable_reg /= '0' then
               b_busD <= reg_dest_delay;   --rt from previous operation
            else
               b_busD <= b_bus;
            end if;
         end if;

         -- pause_enable_reg is updated even while the stage is frozen.
         if pause_enable_reg = '0' and pause_any = '0' then
            pause_enable_reg <= '1';   --enable pause_pipeline
         elsif stall = '1' then
            pause_enable_reg <= '0';   --disable pause_pipeline
         end if;
      end if;
   end process;   --pipeline3

end logic;
|