URL
https://opencores.org/ocsvn/raytrac/raytrac/trunk
Subversion Repositories raytrac
Compare Revisions
- This comparison shows the changes necessary to convert path
/raytrac/trunk
- from Rev 99 to Rev 100
- ↔ Reverse comparison
Rev 99 → Rev 100
/fpbranch/add/ema2.vhd
1,6 → 1,6
------------------------------------------------ |
--! @file ema2.vhd |
--! @brief RayTrac Exponent Managment Adder |
--! @brief RayTrac Floating Point Adder |
--! @author Julián Andrés Guarín Reyes |
-------------------------------------------------- |
|
40,13 → 40,7
end ema2; |
|
architecture ema2_arch of ema2 is |
component sadd2 |
port ( |
a,b:in std_logic_vector(25 downto 0); |
dpc:in std_logic; |
res:out std_logic_vector(25 downto 0) |
); |
end component; |
|
component lpm_mult |
generic ( |
lpm_hint : string; |
68,11 → 62,11
signal s4slab : std_logic_vector(15 downto 0); |
signal s2slab : std_logic_vector(16 downto 0); |
signal b1s,s4nrmP : std_logic_vector(22 downto 0); -- Inversor de la mantissa |
signal s0a,s0b,s1a,s1b,sssa,sssb,s3a : std_logic_vector(31 downto 0); -- Float 32 bit |
signal s0a,s0b,s1a,s1b, : std_logic_vector(31 downto 0); -- Float 32 bit |
signal s1sma,s2sma,s2smb,s3sma,s3smb,s3ures,s4ures : std_logic_vector(24 downto 0); -- Signed mantissas |
signal s3res : std_logic_vector(25 downto 0); -- Signed mantissa result |
signal s1pS,s1pH,s1pL,s4nrmL,s4nrmH,s4nrmS : std_logic_vector(17 downto 0); -- Shifert Product |
signal s3sgb,s0zeroa,s0zerob,s1z,s4sgr : std_logic; |
signal s0zeroa,s0zerob,s1z,s4sgr : std_logic; |
|
begin |
|
/fpbranch/add/ema3.vhd
32,10 → 32,9
|
entity ema3 is |
port ( |
clk : in std_logic; |
clk,dpc : in std_logic; |
a32,b32,c32 : in std_logic_vector (31 downto 0); |
exp : out std_logic_vector (7 downto 0); |
sma,smb,smc : out std_logic_vector (24 downto 0) |
res32 : out std_logic_vector (31 downto 0) |
|
|
|
59,12 → 58,18
); |
end component; |
|
signal bss,css : std_logic_vector(22 downto 0); |
signal sa,sb,sc,ssa,ssb,ssc,s4a : std_logic_vector(31 downto 0); |
signal s4umb,s4umc : std_logic_vector(23 downto 0); |
signal s4sma,s4smb,s4smc : std_logic_vector(24 downto 0); |
signal sspHb,sspLb,sspHc,sspLc : std_logic_vector(35 downto 0); |
signal s4sgb,s4sgc,zeroa,zerob,zeroc,sszb,sszc : std_logic; |
signal s2slrb,s2slrc : std_logic_vector(1 downto 0); |
signal s3lshift,s4lshift : std_logic_vector(4 downto 0); |
signal s2exp,s3exp,s4exp : std_logic_vector(7 downto 0); |
signal s4slab : std_logic_vector(15 downto 0); |
signal s2slabb,s2slabc : std_logic_vector(16 downto 0); |
signal b1s,c1s,s4nrmP : std_logic_vector(22 downto 0); -- Inversor de la mantissa |
signal s0a,s0b,s0c,s1a,s1b,s1c : std_logic_vector(31 downto 0); -- Float 32 bit |
signal s1sma,s2sma,s2smb,s2smc,s3sma,s3smb,s3smc : std_logic_vector(24 downto 0); -- Signed mantissas |
signal s3res : std_logic_vector(26 downto 0); -- Signed mantissa result |
signal s3ures,s4ures : std_logic_vector(25 downto 0); |
signal s1pSb,s1pHb,s1pLb,s1pSc,s1pHc,s1pLc,s4nrmL,s4nrmH,s4nrmS : std_logic_vector(17 downto 0); -- Shifert Product |
signal s0zeroa,s0zerob,s0zeroc,s1zb,s1zc,s4sgr : std_logic; |
begin |
|
process (clk) |
72,133 → 77,261
if clk'event and clk='1' then |
|
--!Registro de entrada |
sa <= a32; |
sb <= b32; |
sc <= c32; |
s0a <= a32; |
s0b(31) <= dpc xor b32(31); --! Importante: Integrar el signo en el operando B |
s0b(30 downto 0) <= b32(30 downto 0); |
s0c <= c32; |
|
--!Primera etapa a vs. b |
if sa(30 downto 23) >= sb (30 downto 23) and sa(30 downto 23) >=sc(30 downto 23) then |
--!Etapa 0, Escoger el mayor exponente que sera el resultado desnormalizado, calcula cuanto debe ser el corrimiento de la mantissa con menor exponente y reorganiza los operandos, si el mayor es b, intercambia las posición si el mayor es a las posiciones la mantiene. Zero check. |
if s0a(30 downto 23) >= s0b (30 downto 23) and s0a(30 downto 23) >=s0c(30 downto 23) then |
--!signo,exponente,mantissa de b yc |
ssb(31) <= sb(31); |
ssb(30 downto 23) <= sa(30 downto 23) - sb(30 downto 23); |
ssb(22 downto 0) <= sb(22 downto 0); |
sszb <= zerob; |
ssc(31) <= sc(31); |
ssc(30 downto 23) <= sa(30 downto 23) - sc(30 downto 23); |
ssc(22 downto 0) <= sc(22 downto 0); |
sszc <= zeroc; |
s1b(31) <= s0b(31); |
s1b(30 downto 23) <= s0a(30 downto 23) - s0b(30 downto 23); |
s1b(22 downto 0) <= s0b(22 downto 0); |
s1zb <= s0zerob; |
ssc(31) <= s0c(31); |
s1c(30 downto 23) <= s0a(30 downto 23) - s0c(30 downto 23); |
s1c(22 downto 0) <= s0c(22 downto 0); |
s1zc <= s0zeroc; |
--!clasifica a |
ssa <= sa; |
elsif sb(30 downto 23) >= sc (30 downto 23) then |
s1a <= s0a; |
elsif s0b(30 downto 23) >= s0c (30 downto 23) then |
--!signo,exponente,mantissa |
ssb(31) <= sa(31); |
ssb(30 downto 23) <= sb(30 downto 23)-sa(30 downto 23); |
ssb(22 downto 0) <= sa(22 downto 0); |
sszb <= zeroa; |
ssc(31) <= sc(31); |
ssc(30 downto 23) <= sb(30 downto 23) - sc(30 downto 23); |
ssc(22 downto 0) <= sc(22 downto 0); |
sszc <= zeroc; |
s1b(31) <= s0a(31); |
s1b(30 downto 23) <= s0b(30 downto 23)-s0a(30 downto 23); |
s1b(22 downto 0) <= s0a(22 downto 0); |
s1zb <= s0zeroa; |
s1c(31) <= s0c(31); |
s1c(30 downto 23) <= s0b(30 downto 23) - s0c(30 downto 23); |
s1c(22 downto 0) <= s0c(22 downto 0); |
s1zc <= s0zeroc; |
--!clasifica b |
ssa <= sb; |
s1a <= s0b; |
else |
--!signo,exponente,mantissa |
ssb(31) <= sb(31); |
ssb(30 downto 23) <= sc(30 downto 23)-sb(30 downto 23); |
ssb(22 downto 0) <= sb(22 downto 0); |
sszb <= zerob; |
ssc(31) <= sa(31); |
ssc(30 downto 23) <= sc(30 downto 23) - sa(30 downto 23); |
ssc(22 downto 0) <= sa(22 downto 0); |
sszc <= zeroa; |
s1b(31) <= s0b(31); |
s1b(30 downto 23) <= s0c(30 downto 23)-s0b(30 downto 23); |
s1b(22 downto 0) <= s0b(22 downto 0); |
s1zb <= s0zerob; |
s1c(31) <= s0a(31); |
s1c(30 downto 23) <= s0c(30 downto 23) - s0a(30 downto 23); |
s1c(22 downto 0) <= s0a(22 downto 0); |
s1zc <= s0zeroa; |
--!clasifica c |
ssa <= sc; |
s1a <= s0c; |
end if; |
|
|
|
--! Segunda etapa corrimiento y denormalización de mantissas |
s4a <= ssa; |
s4sgb <= ssb(31); |
s4sgc <= ssc(31); |
--! Etapa 1: Denormalización de las mantissas. |
|
--! A |
s2exp <= s1a(30 downto 23); |
s2sma <= s1sma; |
|
for i in 17 downto 0 loop |
s4umb(i) <= sspHb(17-i) or sspLb(23-i); |
s4umc(i) <= sspHc(17-i) or sspLc(23-i); |
|
--! B & C |
for i in 23 downto 15 loop |
s2smb(i) <= s1pLb(23-i) xor s1b(31); |
s2smc(i) <= s1pLc(23-i) xor s1c(31); |
end loop; |
for i in 23 downto 18 loop |
s4umb(i) <= sspLb(23-i); |
s4umc(i) <= sspLc(23-i); |
for i in 14 downto 6 loop |
s2smb(i) <= (s1pHc(14-i) or s1pLb(14-i+9)) xor s1b(31); |
s2smc(i) <= (s1pHc(14-i) or s1pLb(14-i+9)) xor s1c(31); |
end loop; |
for i in 5 downto 0 loop |
s2smb(i) <= (s1pSb(5-i) or s1pHb(5-i+9)) xor s1b(31); |
s2smc(i) <= (s1pSc(5-i) or s1pHc(5-i+9)) xor s1c(31); |
end loop; |
|
if s1b(30 downto 28)>"000" then |
s2slrb <= "11"; |
else |
s2slrb <= s1b(27 downto 26); |
end if; |
if s1c(30 downto 28)>"000" then |
s2slrc <= "11"; |
else |
s2slrc <= s1c(27 downto 26); |
end if; |
|
--! Tercera etapa signar la mantissa y entregar el exponente. |
sma <= s4sma + s4a(31); |
smb <= s4smb + s4sgb; |
smc <= s4smc + s4sgc; |
exp <= s4a(30 downto 23); |
s2smb(24) <= s1b(31); |
s2smc(24) <= s1c(31); |
|
--! Etapa2: Finalizar la denormalización de b y c. |
--! A |
s3sma <= s2sma; |
s3exp <= s2exp; |
|
--! B |
case (s2slrb) is |
when "00" => |
s3smb <= s2smb(24 downto 0)+s2smb(24); |
when "01" => |
s3smb <= ( s2slabb(8 downto 0) & s2smb(23 downto 8) ) + s2smb(24); |
when "10" => |
s3smb <= ( s2slabb(16 downto 0) & s2smb(23 downto 16)) + s2smb(24); |
when others => |
s3smb <= (others => '0'); |
end case; |
|
--! C |
case (s2slrc) is |
when "00" => |
s3smc <= s2smc(24 downto 0)+s2smc(24); |
when "01" => |
s3smc <= ( s2slabc(8 downto 0) & s2smc(23 downto 8) ) + s2smc(24); |
when "10" => |
s3smc <= ( s2slabc(16 downto 0) & s2smc(23 downto 16)) + s2smc(24); |
when others => |
s3smc <= (others => '0'); |
end case; |
|
--! Etapa 3: Etapa 3 Realizar la suma, quitar el signo de la mantissa y codificar el corrimiento hacia la izquierda. |
s4ures <= s3ures+s3res(25); --Resultado no signado |
s4sgr <= s3res(25); --Signo |
s4exp <= s3exp; --Exponente |
s4lshift <= s3lshift; --Corrimiento hacia la izquierda. |
|
--! Etapa 4: Corrimiento y normalización de la mantissa resultado. |
res32(31) <= s4sgr; |
if s4ures(25)='1' then |
res32(22 downto 0) <= s4ures(24 downto 2); |
res32(30 downto 23) <= s4exp+2; |
elsif s4ures(24)='1' then |
res32(22 downto 0) <= s4ures(23 downto 1); |
res32(30 downto 23) <= s4exp+1; |
else |
case s4lshift(4 downto 3) is |
when "00" => |
res32(22 downto 0) <= s4nrmP(22 downto 0); |
res32(30 downto 23) <= s4exp - s4lshift; |
when "01" => |
res32(22 downto 0) <= s4nrmP(14 downto 0) & s4slab(7 downto 0); |
res32(30 downto 23) <= s4exp - s4lshift; |
when "10" => |
res32(22 downto 0) <= s4nrmP(6 downto 0) & s4slab(15 downto 0); |
res32(30 downto 23) <= s4exp - s4lshift; |
when others => |
res32(30 downto 0) <= (others => '0'); |
end case; |
|
end if; |
|
end if; |
end process; |
|
--! Combinatorial Gremlin |
highshiftermultb:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",18,18,36) |
port map (shl(conv_std_logic_vector(1,18),ssb(30 downto 23)),bss(22 downto 5),sspHb); |
lowshiftermultb:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",18,18,36) |
port map (shl(conv_std_logic_vector(1,18),ssb(30 downto 23)),conv_std_logic_vector(0,12)&bss(4 downto 0)&sszb,sspLb); |
highshiftermultc:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",18,18,36) |
port map (shl(conv_std_logic_vector(1,18),ssc(30 downto 23)),css(22 downto 5),sspHc); |
lowshiftermultc:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",18,18,36) |
port map (shl(conv_std_logic_vector(1,18),ssc(30 downto 23)),conv_std_logic_vector(0,12)&css(4 downto 0)&sszc,sspLc); |
|
--!Signar b y c |
signbc: |
for i in 23 downto 0 generate |
s4smb(i) <= s4sgb xor s4umb(i); |
s4smc(i) <= s4sgc xor s4umc(i); |
end generate; |
s4smb(24) <= s4sgb; |
s4smc(24) <= s4sgc; |
|
--!Signar a |
signa: |
for i in 22 downto 0 generate |
s4sma(i) <= s4a(31) xor s4a(i); |
end generate; |
s4sma(23) <= not(s4a(31)); |
s4sma(24) <= s4a(31); |
|
--! zero |
process (sc,sb,sa) |
--! Combinatorial gremlin, Etapa 0, Escoger el mayor exponente que sera el resultado desnormalizado,\n |
--! calcula cuanto debe ser el corrimiento de la mantissa con menor exponente y reorganiza los operandos,\n |
--! si el mayor es b, intercambia las posición si el mayor es a las posiciones la mantiene. Zero check.\n |
process (s0b(30 downto 23),s0a(30 downto 23)) |
begin |
s0zerob <='0'; |
s0zeroa <='0'; |
s0zeroc <='0'; |
|
zeroc <= '0'; |
zerob <= '0'; |
zeroa <= '0'; |
|
for i in 30 downto 23 loop |
if sa(i)='1' then |
zeroa <= '1'; |
if s0a(i)='1' then |
s0zeroa <= '1'; |
end if; |
if sb(i)='1' then |
zerob <='1'; |
if s0b(i)='1' then |
s0zerob <='1'; |
end if; |
if sc(i)='1' then |
zeroc <='1'; |
if s0c(i)='1' then |
s0zeroc <='1'; |
end if; |
|
|
end loop; |
end process; |
--! ssb2bssInversor de posicion |
ssb2bss: |
end process; |
|
--! Combinatorial Gremlin, Etapa 1 Denormalización de las mantissas. |
denormsupershiftermultb:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map ("00"&shl(conv_std_logic_vector(1,7),s1b(25 downto 23)),conv_std_logic_vector(0,3)&b1s(22 downto 17),s1pSb); |
denormhighshiftermultb:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map ("00"&shl(conv_std_logic_vector(1,7),s1b(25 downto 23)),b1s(16 downto 8),s1pHb); |
denormlowshiftermultb:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map ("00"&shl(conv_std_logic_vector(1,7),s1b(25 downto 23)),b1s(7 downto 0)&s1zb,s1pLb); |
denormsupershiftermultc:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map ("00"&shl(conv_std_logic_vector(1,7),s1c(25 downto 23)),conv_std_logic_vector(0,3)&c1s(22 downto 17),s1pSc); |
denormhighshiftermultc:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map ("00"&shl(conv_std_logic_vector(1,7),s1c(25 downto 23)),c1s(16 downto 8),s1pHc); |
denormlowshiftermultc:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map ("00"&shl(conv_std_logic_vector(1,7),s1c(25 downto 23)),c1s(7 downto 0)&s1zc,s1pLc); |
s1b2b1s: |
for i in 22 downto 0 generate |
bss(i) <= ssb(22-i); |
css(i) <= ssc(22-i); |
end generate ssb2bss; |
b1s(i) <= s1b(22-i); |
end generate s1b2b1s; |
s1c2c1s: |
for i in 22 downto 0 generate |
c1s(i) <= s1c(22-i); |
end generate s1c2c1s; |
signa: |
for i in 22 downto 0 generate |
s1sma(i) <= s1a(31) xor s1a(i); |
end generate; |
s1sma(23) <= not(s1a(31)); |
s1sma(24) <= s1a(31); |
|
--! Combinatorial Gremlin, Etapa2: Finalizar la denormalización de b. |
s2signslab: |
for i in 16 downto 0 generate |
s2slabb(i) <= s2smb(24); |
s2slabc(i) <= s2smc(24); |
end generate s2signslab; |
|
--! Combinatorial Gremlin, Etapa 3 Realizar la suma, quitar el signo de la mantissa y codificar el corrimiento hacia la izquierda. |
--adder:sadd2 |
--port map (s3sma(24)&s3sma,s3smb(24)&s3smb,dpc,s3res); |
process (s3sma,s3smb,s3smc) |
begin |
--! Magia: La suma ocurre aqui |
s3res <= (s3sma(24)&s3sma(24)&s3sma)+(s3smb(24)&s3smb(24)&s3smb)+(s3smc(24)&s3smc(24)&s3smc); |
end process; |
|
process(s3res) |
variable lshift : integer range 24 downto 0; |
begin |
lshift:=24; |
|
for i in 0 to 23 loop |
s3ures(i) <= s3res(26) xor s3res(i); |
if (s3res(26) xor s3res(i))='1' then |
lshift:=23-i; |
end if; |
end loop; |
s3ures(24) <= s3res(24) xor s3res(26); |
s3ures(25) <= s3res(25) xor s3res(26); |
s3lshift <= conv_std_logic_vector(lshift,5); |
end process; |
|
--! Combinatorial Gremlin, Etapa 4 corrimientos y normalización de la mantissa resultado. |
normsupershiftermult:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map (shl(conv_std_logic_vector(1,9),s4lshift(2 downto 0)),s4ures(22 downto 14),s4nrmS); |
normhighshiftermult:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map (shl(conv_std_logic_vector(1,9),s4lshift(2 downto 0)),s4ures(13 downto 5),s4nrmH); |
normlowshiftermult:lpm_mult |
generic map ("DEDICATED_MULTIPLIER_CIRCUITRY=YES,MAXIMIZE_SPEED=9","UNSIGNED","LPM_MULT",9,9,18) |
port map (shl(conv_std_logic_vector(1,9),s4lshift(2 downto 0)),s4ures(4 downto 0)&conv_std_logic_vector(0,4),s4nrmL); |
process (s4nrmS,s4nrmH,s4nrmL) |
begin |
s4nrmP(22 downto 14) <= s4nrmS(8 downto 0) or s4nrmH(17 downto 9); |
s4nrmP(13 downto 5) <= s4nrmH(8 downto 0) or s4nrmL(17 downto 9); |
s4nrmP(4 downto 0) <= s4nrmL(8 downto 4); |
end process; |
s4signslab: |
for i in 15 downto 0 generate |
s4slab(i) <= '0'; |
end generate s4signslab; |
end ema3_arch; |
|
|
|
|
|