URL
https://opencores.org/ocsvn/theia_gpu/theia_gpu/trunk
Subversion Repositories theia_gpu
[/] [theia_gpu/] [trunk/] [rtl/] [Module_VectorALU.v] - Rev 186
Go to most recent revision | Compare with Previous | Blame | View Log
`timescale 1ns / 1ps `include "aDefinitions.v" /********************************************************************************** Theia, Ray Cast Programable graphic Processing Unit. Copyright (C) 2010 Diego Valverde (diego.valverde.g@gmail.com) This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. ***********************************************************************************/ //-------------------------------------------------------------- module VectorALU ( input wire Clock, input wire Reset, input wire[`INSTRUCTION_OP_LENGTH-1:0] iOperation, input wire[`WIDTH-1:0] iChannel_Ax, input wire[`WIDTH-1:0] iChannel_Bx, input wire[`WIDTH-1:0] iChannel_Ay, input wire[`WIDTH-1:0] iChannel_By, input wire[`WIDTH-1:0] iChannel_Az, input wire[`WIDTH-1:0] iChannel_Bz, output wire [`WIDTH-1:0] oResultA, output wire [`WIDTH-1:0] oResultB, output wire [`WIDTH-1:0] oResultC, input wire iInputReady, output reg oBranchTaken, output reg oBranchNotTaken, output reg oReturnFromSub, input wire [`ROM_ADDRESS_WIDTH-1:0] iCurrentIP, //Connections to the O Memory output wire [`DATA_ROW_WIDTH-1:0] oOMEMWriteAddress, output wire [`DATA_ROW_WIDTH-1:0] oOMEMWriteData, output wire oOMEM_WriteEnable, //Connections to the R Memory output wire [`DATA_ROW_WIDTH-1:0] oTMEMReadAddress, input wire [`DATA_ROW_WIDTH-1:0] iTMEMReadData, input wire iTMEMDataAvailable, output wire oTMEMDataRequest, output reg OutputReady ); wire wMultiplcationUnscaled; assign wMultiplcationUnscaled = (iOperation == `IMUL) ? 1'b1 : 1'b0; //-------------------------------------------------------------- reg [7:0] InputReadyA,InputReadyB,InputReadyC; //------------------------------------------------------ /* This is the block that takes care of all tha arithmetic comparisons. Supported operations are <,>,<=,>=,==,!= */ //------------------------------------------------------ reg [`WIDTH-1:0] wMultiplicationA_Ax; reg [`WIDTH-1:0] wMultiplicationA_Bx; wire [`LONG_WIDTH-1:0] wMultiplicationA_Result; wire wMultiplicationA_InputReady; wire wMultiplicationA_OutputReady; wire wMultiplicationOutputReady, wMultiplicationOutputReadyA, wMultiplicationOutputReadyB,wMultiplicationOutputReadyC,wMultiplicationOutputReadyD; wire wAddSubAOutputReady,wAddSubBOutputReady,wAddSubCOutputReady; wire [`INSTRUCTION_OP_LENGTH-1:0] wOperation; wire [`WIDTH-1:0] wSwizzleOutputX,wSwizzleOutputY,wSwizzleOutputZ; //-------------------------------------------------------------------- reg [`WIDTH-1:0] ResultA,ResultB,ResultC; //Output Flip Flops, //This flip flop will control the outputs so that the //values of the outputs change ONLY when when there is //a positive edge of OutputReady FFD32_POSEDGE ResultAFFD ( .Clock( OutputReady ), .D( ResultA ), .Q( oResultA ) ); FFD32_POSEDGE ResultBFFD ( .Clock( OutputReady ), .D( ResultB ), .Q( oResultB ) ); FFD32_POSEDGE ResultCFFD ( .Clock( OutputReady ), .D( ResultC ), .Q( oResultC ) ); //-------------------------------------------------------------------- Swizzle3D Swizzle1 ( .Source0_X( iChannel_Bx ), .Source0_Y( iChannel_By ), .Source0_Z( iChannel_Bz ), .iOperation( iChannel_Ax ), .SwizzleX( wSwizzleOutputX ), .SwizzleY( wSwizzleOutputY ), .SwizzleZ( wSwizzleOutputZ ) ); //--------------------------------------------------------------------- wire [`LONG_WIDTH-1:0] wModulus2N_ResultA,wModulus2N_ResultB,wModulus2N_ResultC; //---------------------------------------------------------------------( wire IOW_Operation,wOMEM_We; assign IOW_Operation = (iOperation == `OMWRITE); always @ ( * ) begin if (iOperation == `RET) oReturnFromSub <= OutputReady; else oReturnFromSub <= 1'b0; end FFD_POSEDGE_SYNCRONOUS_RESET # ( 1 ) FFD1_AWE ( .Clock( Clock ), .Reset( Reset), .Enable( 1'b1 ), .D( IOW_Operation ), .Q( wOMEM_We ) ); assign oOMEM_WriteEnable = wOMEM_We & IOW_Operation; FFD_POSEDGE_SYNCRONOUS_RESET # ( `DATA_ROW_WIDTH ) FFD1_A ( .Clock( Clock ), .Reset( Reset), .Enable( iInputReady ), .D( {iChannel_Ax,iChannel_Ay,iChannel_Az} ), .Q( oOMEMWriteAddress) ); FFD_POSEDGE_SYNCRONOUS_RESET # ( `DATA_ROW_WIDTH ) FFD2_B ( .Clock( Clock ), .Reset( Reset), .Enable( iInputReady ), .D( {iChannel_Bx,iChannel_By,iChannel_Bz} ), .Q( oOMEMWriteData ) ); wire wTMReadOutputReady; assign wTMReadOutputReady = iTMEMDataAvailable; /* FFD_POSEDGE_SYNCRONOUS_RESET # ( 1 ) FFD1_ARE ( .Clock( Clock ), .Reset( Reset), .Enable( 1'b1 ), .D( iTMEMDataAvailable ), .Q( wTMReadOutputReady ) ); */ //assign oTMEMReadAddress = {iChannel_Ax,iChannel_Ay,iChannel_Az}; //We wait 1 clock cycle before be send the data read request, because //we need to lathc the values at the output wire wOpTRead; assign wOpTRead = ( iOperation == `TMREAD ) ? 1'b1 : 1'b0; wire wTMEMRequest; FFD_POSEDGE_SYNCRONOUS_RESET # ( 1 ) FFD1_ARE123 ( .Clock( Clock ), .Reset( Reset), .Enable( 1'b1 ), .D( wOpTRead ), .Q( wTMEMRequest ) ); assign oTMEMDataRequest = wTMEMRequest & wOpTRead; FFD_POSEDGE_SYNCRONOUS_RESET # ( `DATA_ROW_WIDTH ) FFD2_B445 ( .Clock( Clock ), .Reset( Reset), .Enable( iInputReady & wOpTRead ), .D( {iChannel_Ax,iChannel_Ay,iChannel_Az} ), .Q( oTMEMReadAddress ) ); /* This MUX will select the apropiated X,Y or Z depending on wheter it is XYZ iOperation. This gets defined by the bits 3 and 4 of iOperation, and only applies for oBranchTaken and Store operations. */ wire wArithmeticComparison_Result; wire ArithmeticComparison_InputReady; wire ArithmeticComparison_OutputReady; reg[`WIDTH-1:0] ArithmeticComparison_A,ArithmeticComparison_B; always @ ( * ) begin case ( {iOperation[4],iOperation[3]} ) 2'b01: ArithmeticComparison_A = iChannel_Ax; 2'b10: ArithmeticComparison_A = iChannel_Ay; 2'b11: ArithmeticComparison_A = iChannel_Az; default: ArithmeticComparison_A = 0; //Should never happen endcase end //--------------------------------------------------------------------- always @ ( * ) begin case ( {iOperation[4],iOperation[3]} ) 2'b01: ArithmeticComparison_B = iChannel_Bx; 2'b10: ArithmeticComparison_B = iChannel_By; 2'b11: ArithmeticComparison_B = iChannel_Bz; default: ArithmeticComparison_B = 0; //Should never happen endcase end //--------------------------------------------------------------------- /* The onbly instance of Aritmetic comparison in the ALU, ArithmeticComparison operations matches the 3 LSB of Global ALU iOperation for oBranchTaken Instruction family */ assign ArithmeticComparison_InputReady = iInputReady; wire wArithmeticComparisonResult; ArithmeticComparison ArithmeticComparison_1 ( .Clock( Clock ), .X( ArithmeticComparison_A ), .Y( ArithmeticComparison_B ), .iOperation( iOperation[2:0] ), .iInputReady( ArithmeticComparison_InputReady ), .OutputReady( ArithmeticComparison_OutputReady ), .Result( wArithmeticComparisonResult ) ); assign wArithmeticComparison_Result = wArithmeticComparisonResult && OutputReady; //-------------------------------------------------------------------- RADIX_R_MUL_32_FULL_PARALLEL MultiplicationChannel_A ( .Clock( Clock ), .Reset( Reset ), .A( wMultiplicationA_Ax ), .B( wMultiplicationA_Bx ), .R( wMultiplicationA_Result ), .iUnscaled( wMultiplcationUnscaled ), .iInputReady( wMultiplicationA_InputReady ), .OutputReady( wMultiplicationA_OutputReady ) ); //-------------------------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationA_Ax = iChannel_Ay; // Ay * Bz `MAG: wMultiplicationA_Ax = iChannel_Ax; `MULP: wMultiplicationA_Ax = iChannel_Ax; //Az = Ax * Ay default: wMultiplicationA_Ax = iChannel_Ax; // Ax * Bx endcase end //-------------------------------------------------------------------- //assign wMultiplicationA_Ax = iChannel_Ax; assign wMultiplicationA_InputReady = (iOperation == `CROSS || iOperation == `DOT || iOperation == `MUL || iOperation == `IMUL || iOperation == `MAG || iOperation == `MULP ) ? iInputReady : 0; //-------------------------------------------------------------------- always @ ( * ) begin case (iOperation) `MUL,`IMUL: wMultiplicationA_Bx = iChannel_Bx; //Ax*Bx `MAG: wMultiplicationA_Bx = iChannel_Ax; //Ax^2 `DOT: wMultiplicationA_Bx = iChannel_Bx; //Ax*Bx `CROSS: wMultiplicationA_Bx = iChannel_Bz; // Ay * Bz `MULP: wMultiplicationA_Bx = iChannel_Ay; //Az = Ax * Ay default: wMultiplicationA_Bx = 32'b0; endcase end //-------------------------------------------------------------------- //------------------------------------------------------ reg [`WIDTH-1:0] wMultiplicationB_Ay; reg [`WIDTH-1:0] wMultiplicationB_By; wire [`LONG_WIDTH-1:0] wMultiplicationB_Result; wire wMultiplicationB_InputReady; wire wMultiplicationB_OutputReady; RADIX_R_MUL_32_FULL_PARALLEL MultiplicationChannel_B ( .Clock( Clock ), .Reset( Reset ), .A( wMultiplicationB_Ay ), .B( wMultiplicationB_By ), .R( wMultiplicationB_Result ), .iUnscaled( wMultiplcationUnscaled ), .iInputReady( wMultiplicationB_InputReady ), .OutputReady( wMultiplicationB_OutputReady ) ); //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationB_Ay = iChannel_Az; // Az * By `MAG: wMultiplicationB_Ay = iChannel_Ay; default: wMultiplicationB_Ay = iChannel_Ay; // Ay * By endcase end //---------------------------------------------------- assign wMultiplicationB_InputReady = (iOperation == `CROSS || iOperation == `DOT || iOperation == `MUL || iOperation == `IMUL || iOperation == `MAG ) ? iInputReady : 0; //---------------------------------------------------- always @ ( * ) begin case (iOperation) `MUL,`IMUL: wMultiplicationB_By = iChannel_By; //Ay*By `MAG: wMultiplicationB_By = iChannel_Ay; //Ay^2 `DOT: wMultiplicationB_By = iChannel_By; //Ay*By `CROSS: wMultiplicationB_By = iChannel_By; // Az * By default: wMultiplicationB_By = 32'b0; endcase end //---------------------------------------------------- //------------------------------------------------------ reg [`WIDTH-1:0] wMultiplicationC_Az; reg [`WIDTH-1:0] wMultiplicationC_Bz; wire [`LONG_WIDTH-1:0] wMultiplicationC_Result; wire wMultiplicationC_InputReady; wire wMultiplicationC_OutputReady; RADIX_R_MUL_32_FULL_PARALLEL MultiplicationChannel_C ( .Clock( Clock ), .Reset( Reset ), .A( wMultiplicationC_Az ), .B( wMultiplicationC_Bz ), .R( wMultiplicationC_Result ), .iUnscaled( wMultiplcationUnscaled ), .iInputReady( wMultiplicationC_InputReady ), .OutputReady( wMultiplicationC_OutputReady ) ); //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationC_Az = iChannel_Az; //Az*Bx `MAG: wMultiplicationC_Az = iChannel_Az; default: wMultiplicationC_Az = iChannel_Az; //Az*Bz endcase end //---------------------------------------------------- assign wMultiplicationC_InputReady = ( iOperation == `CROSS || iOperation == `DOT || iOperation == `MUL || iOperation == `IMUL || iOperation == `MAG ) ? iInputReady : 0; //---------------------------------------------------- always @ ( * ) begin case (iOperation) `MUL,`IMUL: wMultiplicationC_Bz = iChannel_Bz; //Az*Bz `MAG: wMultiplicationC_Bz = iChannel_Az; //Ay^2 `DOT: wMultiplicationC_Bz = iChannel_Bz; //Az*Bz `CROSS: wMultiplicationC_Bz = iChannel_Bx; //Az*Bx default: wMultiplicationC_Bz = 32'b0; endcase end //---------------------------------------------------- reg [`WIDTH-1:0] wMultiplicationD_Aw; reg [`WIDTH-1:0] wMultiplicationD_Bw; wire [`LONG_WIDTH-1:0] wMultiplicationD_Result; wire wMultiplicationD_InputReady; wire wMultiplicationD_OutputReady; RADIX_R_MUL_32_FULL_PARALLEL MultiplicationChannel_D ( .Clock( Clock ), .Reset( Reset ), .A( wMultiplicationD_Aw ), .B( wMultiplicationD_Bw ), .R( wMultiplicationD_Result ), .iUnscaled( wMultiplcationUnscaled ), .iInputReady( wMultiplicationD_InputReady ), .OutputReady( wMultiplicationD_OutputReady ) ); assign wMultiplicationD_InputReady = (iOperation == `CROSS ) ? iInputReady : 0; //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationD_Aw = iChannel_Ax; //Ax*Bz default: wMultiplicationD_Aw = 32'b0; endcase end //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationD_Bw = iChannel_Bz; //Ax*Bz default: wMultiplicationD_Bw = 32'b0; endcase end //---------------------------------------------------- reg [`WIDTH-1:0] wMultiplicationE_Ak; reg [`WIDTH-1:0] wMultiplicationE_Bk; wire [`LONG_WIDTH-1:0] wMultiplicationE_Result; wire wMultiplicationE_InputReady; wire wMultiplicationE_OutputReady; RADIX_R_MUL_32_FULL_PARALLEL MultiplicationChannel_E ( .Clock( Clock ), .Reset( Reset ), .A( wMultiplicationE_Ak ), .B( wMultiplicationE_Bk ), .R( wMultiplicationE_Result ), .iUnscaled( wMultiplcationUnscaled ), .iInputReady( wMultiplicationE_InputReady ), .OutputReady( wMultiplicationE_OutputReady ) ); assign wMultiplicationE_InputReady = (iOperation == `CROSS ) ? iInputReady : 0; //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationE_Ak = iChannel_Ax; //Ax*By default: wMultiplicationE_Ak = 32'b0; endcase end //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationE_Bk = iChannel_By; //Ax*By default: wMultiplicationE_Bk = 32'b0; endcase end //---------------------------------------------------- reg [`WIDTH-1:0] wMultiplicationF_Al; reg [`WIDTH-1:0] wMultiplicationF_Bl; wire [`LONG_WIDTH-1:0] wMultiplicationF_Result; wire wMultiplicationF_InputReady; wire wMultiplicationF_OutputReady; RADIX_R_MUL_32_FULL_PARALLEL MultiplicationChannel_F ( .Clock( Clock ), .Reset( Reset ), .A( wMultiplicationF_Al ), .B( wMultiplicationF_Bl ), .R( wMultiplicationF_Result ), .iUnscaled( wMultiplcationUnscaled ), .iInputReady( wMultiplicationF_InputReady ), .OutputReady( wMultiplicationF_OutputReady ) ); assign wMultiplicationF_InputReady = (iOperation == `CROSS ) ? iInputReady : 0; //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationF_Al = iChannel_Ay; //Ay*Bx default: wMultiplicationF_Al = 32'b0; endcase end //---------------------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wMultiplicationF_Bl = iChannel_Bx; //Ay*Bx default: wMultiplicationF_Bl = 32'b0; endcase end //------------------------------------------------------ wire [`WIDTH-1:0] wDivisionA_Result; wire wDivisionA_OutputReady; wire wDivisionA_InputReady; assign wDivisionA_InputReady = ( iOperation == `DIV) ? iInputReady : 0; SignedIntegerDivision DivisionChannel_A ( .Clock( Clock ), .Reset( Reset ), .iDividend( iChannel_Ax ), .iDivisor( iChannel_Bx ), .xQuotient( wDivisionA_Result ), .iInputReady( wDivisionA_InputReady ), .OutputReady( wDivisionA_OutputReady ) ); //------------------------------------------------------ wire [`WIDTH-1:0] wDivisionB_Result; wire wDivisionB_OutputReady; wire wDivisionB_InputReady; assign wDivisionB_InputReady = ( iOperation == `DIV) ? iInputReady : 0; SignedIntegerDivision DivisionChannel_B ( .Clock( Clock ), .Reset( Reset ), .iDividend( iChannel_Ay ), .iDivisor( iChannel_By ), .xQuotient( wDivisionB_Result ), .iInputReady( wDivisionB_InputReady ), .OutputReady( wDivisionB_OutputReady ) ); //------------------------------------------------------ wire [`WIDTH-1:0] wDivisionC_Result; wire wDivisionC_OutputReady; wire wDivisionC_InputReady; assign wDivisionC_InputReady = ( iOperation == `DIV) ? iInputReady : 0; SignedIntegerDivision DivisionChannel_C ( .Clock( Clock ), .Reset( Reset ), .iDividend( iChannel_Az ), .iDivisor( iChannel_Bz ), .xQuotient( wDivisionC_Result ), .iInputReady( wDivisionC_InputReady ), .OutputReady( wDivisionC_OutputReady ) ); //-------------------------------------------------------------- /* First addtion block instance goes here. Note that all inputs/outputs to the block are wires. It has two MUXES one for each entry. */ reg [`LONG_WIDTH-1:0] wAddSubA_Ax,wAddSubA_Bx; wire [`LONG_WIDTH-1:0] wAddSubA_Result; wire wAddSubA_Operation; //Either addition or substraction reg wAddSubA_InputReady; wire wAddSubA_OutputReady; assign wAddSubA_Operation = ( iOperation == `SUB || iOperation == `CROSS || iOperation == `DEC || iOperation == `MOD ) ? 1 : 0; FixedAddSub AddSubChannel_A ( .Clock( Clock ), .Reset( Reset ), .A( wAddSubA_Ax ), .B( wAddSubA_Bx ), .R( wAddSubA_Result ), .iOperation( wAddSubA_Operation ), .iInputReady( wAddSubA_InputReady ), .OutputReady( wAddSubA_OutputReady ) ); //Diego //---------------------------- //InpuReady Mux A always @ ( * ) begin case (iOperation) `ADD: wAddSubA_InputReady = iInputReady; `SUB: wAddSubA_InputReady = iInputReady; `INC,`INCX,`INCY,`INCZ: wAddSubA_InputReady = iInputReady; `DEC: wAddSubA_InputReady = iInputReady; `MOD: wAddSubA_InputReady = iInputReady; `MAG: wAddSubA_InputReady = wMultiplicationOutputReadyA && wMultiplicationOutputReadyB; //wMultiplicationA_OutputReady //&& wMultiplicationB_OutputReady; `DOT: wAddSubA_InputReady = wMultiplicationOutputReadyA && wMultiplicationOutputReadyB; //wMultiplicationA_OutputReady //&& wMultiplicationB_OutputReady; `CROSS: wAddSubA_InputReady = wMultiplicationOutputReadyA && wMultiplicationOutputReadyB; // wMultiplicationA_OutputReady //&& wMultiplicationB_OutputReady; default: wAddSubA_InputReady = 1'b0; endcase end //---------------------------- //wAddSubA_Bx 2:1 input Mux always @ ( * ) begin case (iOperation) `ADD: wAddSubA_Ax = ( iChannel_Ax[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ax } : { 32'b0, iChannel_Ax }; `SUB: wAddSubA_Ax = ( iChannel_Ax[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ax } : { 32'b0, iChannel_Ax }; `INC,`INCX,`INCY,`INCZ: wAddSubA_Ax = ( iChannel_Ax[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ax } : { 32'b0, iChannel_Ax }; `DEC: wAddSubA_Ax = ( iChannel_Ax[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ax } : { 32'b0, iChannel_Ax }; `MOD: wAddSubA_Ax = ( iChannel_Bx[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Bx } : { 32'b0, iChannel_Bx }; `MAG: wAddSubA_Ax = wMultiplicationA_Result; `DOT: wAddSubA_Ax = wMultiplicationA_Result; `CROSS: wAddSubA_Ax = wMultiplicationA_Result; default: wAddSubA_Ax = 64'b0; endcase end //---------------------------- //wAddSubA_Bx 2:1 input Mux always @ ( * ) begin case (iOperation) `ADD: wAddSubA_Bx = ( iChannel_Bx[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Bx } : { 32'b0, iChannel_Bx }; `SUB: wAddSubA_Bx = ( iChannel_Bx[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Bx } : { 32'b0, iChannel_Bx }; `INC,`INCX: wAddSubA_Bx = (`LONG_WIDTH'd1 << `SCALE); `INCY,`INCZ: wAddSubA_Bx = `LONG_WIDTH'd0; `DEC: wAddSubA_Bx = (`LONG_WIDTH'd1 << `SCALE); `MOD: wAddSubA_Bx = (`LONG_WIDTH'd1 << `SCALE); `MAG: wAddSubA_Bx = wMultiplicationB_Result; `DOT: wAddSubA_Bx = wMultiplicationB_Result; `CROSS: wAddSubA_Bx = wMultiplicationB_Result; default: wAddSubA_Bx = 64'b0; endcase end //-------------------------------------------------------------- /* Second addtion block instance goes here. Note that all inputs/outputs to the block are wires. It has two MUXES one for each entry. */ wire [`LONG_WIDTH-1:0] wAddSubB_Result; wire wAddSubB_Operation; //Either addition or substraction reg wAddSubB_InputReady; wire wAddSubB_OutputReady; reg [`LONG_WIDTH-1:0] wAddSubB_Ay,wAddSubB_By; assign wAddSubB_Operation = ( iOperation == `SUB || iOperation == `CROSS || iOperation == `DEC || iOperation == `MOD ) ? 1 : 0; FixedAddSub AddSubChannel_B ( .Clock( Clock ), .Reset( Reset ), .A( wAddSubB_Ay ), .B( wAddSubB_By ), .R( wAddSubB_Result ), .iOperation( wAddSubB_Operation ), .iInputReady( wAddSubB_InputReady ), .OutputReady( wAddSubB_OutputReady ) ); //---------------------------- wire wMultiplicationOutputReadyC_Dealy1; FFD_POSEDGE_ASYNC_RESET # (1) FFwMultiplicationOutputReadyC_Dealy1 ( .Clock( Clock ), .Clear( Reset ), .D( wMultiplicationOutputReadyC ), .Q( wMultiplicationOutputReadyC_Dealy1 ) ); //InpuReady Mux B always @ ( * ) begin case (iOperation) `ADD: wAddSubB_InputReady = iInputReady; `SUB: wAddSubB_InputReady = iInputReady; `INC,`INCX,`INCY,`INCZ: wAddSubB_InputReady = iInputReady; `DEC: wAddSubB_InputReady = iInputReady; `MOD: wAddSubB_InputReady = iInputReady; `MAG: wAddSubB_InputReady = wAddSubAOutputReady && wMultiplicationOutputReadyC_Dealy1; //&& wMultiplicationC_OutputReady; `DOT: wAddSubB_InputReady = wAddSubAOutputReady && wMultiplicationOutputReadyC_Dealy1; //&& wMultiplicationC_OutputReady; `CROSS: wAddSubB_InputReady = wMultiplicationOutputReadyC && wMultiplicationOutputReadyD; // wMultiplicationC_OutputReady //&& wMultiplicationD_OutputReady; default: wAddSubB_InputReady = 1'b0; endcase end //---------------------------- // wAddSubB_Ay 2:1 input Mux // If the iOperation is ADD or SUB, it will simply take the inputs from // ALU Channels. If it is a VECTOR_MAGNITUDE, it take the input from the // previus ADDER_A, same for dot product. always @ ( * ) begin case (iOperation) `ADD: wAddSubB_Ay = (iChannel_Ay[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ay} : {32'b0,iChannel_Ay}; //Ay `SUB: wAddSubB_Ay = (iChannel_Ay[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ay} : {32'b0,iChannel_Ay}; //Ay `INC,`INCX,`INCY,`INCZ: wAddSubB_Ay = (iChannel_Ay[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ay} : {32'b0,iChannel_Ay}; //Ay `DEC: wAddSubB_Ay = (iChannel_Ay[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_Ay} : {32'b0,iChannel_Ay}; //Ay `MOD: wAddSubB_Ay = (iChannel_By[31] == 1'b1) ? {32'hFFFFFFFF, iChannel_By} : {32'b0,iChannel_By}; //Ay `MAG: wAddSubB_Ay = wAddSubA_Result; //A^2+B^2 `DOT: wAddSubB_Ay = wAddSubA_Result; //Ax*Bx + Ay*By `CROSS: wAddSubB_Ay = wMultiplicationC_Result; default: wAddSubB_Ay = 64'b0; endcase end //---------------------------- //wAddSubB_By 2:1 input Mux always @ ( * ) begin case (iOperation) `ADD: wAddSubB_By = (iChannel_By[31] == 1'b1) ? {32'hFFFFFFFF,iChannel_By } : {32'b0,iChannel_By}; //By `SUB: wAddSubB_By = (iChannel_By[31] == 1'b1) ? {32'hFFFFFFFF,iChannel_By } : {32'b0,iChannel_By}; //{32'b0,iChannel_By}; //By `INC,`INCY: wAddSubB_By = (`LONG_WIDTH'd1 << `SCALE); `INCX,`INCZ: wAddSubB_By = `LONG_WIDTH'd0; `DEC: wAddSubB_By = (`LONG_WIDTH'd1 << `SCALE); `MOD: wAddSubB_By = (`LONG_WIDTH'd1 << `SCALE); `MAG: wAddSubB_By = wMultiplicationC_Result; //C^2 `DOT: wAddSubB_By = wMultiplicationC_Result; //Az * Bz `CROSS: wAddSubB_By = wMultiplicationD_Result; default: wAddSubB_By = 32'b0; endcase end //-------------------------------------------------------------- wire [`LONG_WIDTH-1:0] wAddSubC_Result; reg [`LONG_WIDTH-1:0] wAddSubC_Az,wAddSubC_Bz; wire wAddSubC_Operation; //Either addition or substraction reg wAddSubC_InputReady; wire wAddSubC_OutputReady; reg [`LONG_WIDTH-1:0] AddSubC_Az,AddSubB_Bz; //----------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wAddSubC_Az = wMultiplicationE_Result; `MOD: wAddSubC_Az = (iChannel_Bz[31] == 1'b1) ? {32'hFFFFFFFF,iChannel_Bz} : {32'b0,iChannel_Bz}; default: wAddSubC_Az = (iChannel_Az[31] == 1'b1) ? {32'hFFFFFFFF,iChannel_Az} : {32'b0,iChannel_Az}; endcase end //----------------------------------------- always @ ( * ) begin case (iOperation) `CROSS: wAddSubC_Bz = wMultiplicationF_Result; `INC,`INCZ: wAddSubC_Bz = (`LONG_WIDTH'd1 << `SCALE); `INCX,`INCY: wAddSubC_Bz = `LONG_WIDTH'd0; `DEC: wAddSubC_Bz = (`LONG_WIDTH'd1 << `SCALE); `MOD: wAddSubC_Bz = (`LONG_WIDTH'd1 << `SCALE); default: wAddSubC_Bz = (iChannel_Bz[31] == 1'b1) ? {32'hFFFFFFFF,iChannel_Bz} : {32'b0,iChannel_Bz}; endcase end //----------------------------------------- assign wAddSubC_Operation = ( iOperation == `SUB || iOperation == `CROSS || iOperation == `DEC || iOperation == `MOD ) ? 1 : 0; FixedAddSub AddSubChannel_C ( .Clock( Clock ), .Reset( Reset ), .A( wAddSubC_Az ), .B( wAddSubC_Bz ), .R( wAddSubC_Result ), .iOperation( wAddSubC_Operation ), .iInputReady( wAddSubC_InputReady ), .OutputReady( wAddSubC_OutputReady ) ); always @ ( * ) begin case (iOperation) `CROSS: wAddSubC_InputReady = wMultiplicationE_OutputReady && wMultiplicationF_OutputReady; default: wAddSubC_InputReady = iInputReady; endcase end //------------------------------------------------------ wire [`WIDTH-1:0] wSquareRoot_Result; wire wSquareRoot_OutputReady; FixedPointSquareRoot SQROOT1 ( .Clock( Clock ), .Reset( Reset ), .Operand( wAddSubB_Result ), .iInputReady( wAddSubBOutputReady && iOperation == `MAG), .OutputReady( wSquareRoot_OutputReady ), .Result( wSquareRoot_Result ) ); //------------------------------------------------------ assign wModulus2N_ResultA = (iChannel_Ax & wAddSubA_Result ); assign wModulus2N_ResultB = (iChannel_Ay & wAddSubB_Result ); assign wModulus2N_ResultC = (iChannel_Az & wAddSubC_Result ); //&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&&// //****Mux for ResultA*** // Notice that the Dot Product or the Magnitud Result will // output in ResultA. always @ ( * ) begin case ( iOperation ) `RETURN: ResultA = iChannel_Ax; `ADD: ResultA = (wAddSubA_Result[63] == 1'b1) ? { 1'b1,wAddSubA_Result[30:0]} : {1'b0,wAddSubA_Result[30:0]};// & 32'h7FFFFFFF; `SUB: ResultA = (wAddSubA_Result[63] == 1'b1) ? { 1'b1,wAddSubA_Result[30:0]} : {1'b0,wAddSubA_Result[30:0]};//wAddSubA_Result[31:0]; `CROSS: ResultA = (wAddSubA_Result[63] == 1'b1) ? { 1'b1,wAddSubA_Result[30:0]} : {1'b0,wAddSubA_Result[30:0]};//wAddSubA_Result[31:0]; `DIV: ResultA = wDivisionA_Result; `MUL: ResultA = wMultiplicationA_Result[31:0]; `IMUL: ResultA = wMultiplicationA_Result[31:0]; `DOT: ResultA = (wAddSubB_Result[63] == 1'b1) ? { 1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]};//wAddSubB_Result[31:0]; `MAG: ResultA = wSquareRoot_Result; `ZERO: ResultA = 32'b0; `COPY: ResultA = iChannel_Ax; `TMREAD: ResultA = iTMEMReadData[95:64]; `LEA: ResultA = {16'b0,iCurrentIP}; `SWIZZLE3D: ResultA = wSwizzleOutputX; //Set Operations `UNSCALE: ResultA = iChannel_Ax >> `SCALE; `SETX,`RET: ResultA = iChannel_Ax; `SETY: ResultA = iChannel_Bx; `SETZ: ResultA = iChannel_Bx; `INC,`INCX,`INCY,`INCZ: ResultA = (wAddSubA_Result[63] == 1'b1) ? { 1'b1,wAddSubA_Result[30:0]} : {1'b0,wAddSubA_Result[30:0]}; `DEC: ResultA = (wAddSubA_Result[63] == 1'b1) ? { 1'b1,wAddSubA_Result[30:0]} : {1'b0,wAddSubA_Result[30:0]}; `MOD: ResultA = wModulus2N_ResultA; `FRAC: ResultA = iChannel_Ax & (`WIDTH'hFFFFFFFF >> (`WIDTH - `SCALE)); `MULP: ResultA = iChannel_Ax; `NEG: ResultA = ~iChannel_Ax + 1'b1; `XCHANGEX: ResultA = iChannel_Bx; default: begin `ifdef DEBUG // $display("%dns ALU: Error Unknown Operation: %d",$time,iOperation); // $stop(); `endif ResultA = 32'b0; end endcase end //------------------------------------------------------ //****Mux for RB*** always @ ( * ) begin case ( iOperation ) `RETURN: ResultB = iChannel_Ax; `ADD: ResultB = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]}; // & 32'h7FFFFFFF; `SUB: ResultB = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]}; //wAddSubB_Result[31:0]; `CROSS: ResultB = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]};//wAddSubB_Result[31:0]; `DIV: ResultB = wDivisionB_Result; `MUL: ResultB = wMultiplicationB_Result[31:0]; `IMUL: ResultB = wMultiplicationB_Result[31:0]; `DOT: ResultB = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]};//wAddSubB_Result[31:0]; `MAG: ResultB = wSquareRoot_Result; `ZERO: ResultB = 32'b0; `COPY: ResultB = iChannel_Ay; `TMREAD: ResultB = iTMEMReadData[63:32]; `LEA: ResultB = {16'b0,iCurrentIP}; //Set Operations `UNSCALE: ResultB = iChannel_Ay >> `SCALE; `SETX,`RET: ResultB = iChannel_By; // {Source1[95:64],Source0[63:32],Source0[31:0]}; `SETY: ResultB = iChannel_Ax; // {Source0[95:64],Source1[95:64],Source0[31:0]}; `SETZ: ResultB = iChannel_By; // {Source0[95:64],Source0[63:32],Source1[95:64]}; `SWIZZLE3D: ResultB = wSwizzleOutputY; `INC,`INCX,`INCY,`INCZ: ResultB = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]}; // & 32'h7FFFFFFF; `DEC: ResultB = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]}; // & 32'h7FFFFFFF; `MOD: ResultB = wModulus2N_ResultB; `FRAC: ResultB = iChannel_Ay & (`WIDTH'hFFFFFFFF >> (`WIDTH - `SCALE)); `MULP: ResultB = iChannel_Ay; `NEG: ResultB = ~iChannel_Ay + 1'b1; `XCHANGEX: ResultB = iChannel_Ay; default: begin `ifdef DEBUG //$display("%dns ALU: Error Unknown Operation: %d",$time,iOperation); //$stop(); `endif ResultB = 32'b0; end endcase end //------------------------------------------------------ //****Mux for RC*** always @ ( * ) begin case ( iOperation ) `RETURN: ResultC = iChannel_Ax; `ADD: ResultC = (wAddSubC_Result[63] == 1'b1) ? {1'b1,wAddSubC_Result[30:0]} : {1'b0,wAddSubC_Result[30:0]}; //wAddSubC_Result[31:0];// & 32'h7FFFFFFF; `SUB: ResultC = (wAddSubC_Result[63] == 1'b1) ? {1'b1,wAddSubC_Result[30:0]} : {1'b0,wAddSubC_Result[30:0]}; //wAddSubC_Result[31:0]; `CROSS: ResultC = (wAddSubC_Result[63] == 1'b1) ? {1'b1,wAddSubC_Result[30:0]} : {1'b0,wAddSubC_Result[30:0]};//wAddSubC_Result[31:0]; `DIV: ResultC = wDivisionC_Result; `MUL: ResultC = wMultiplicationC_Result[31:0]; `IMUL: ResultC = wMultiplicationC_Result[31:0]; `DOT: ResultC = (wAddSubB_Result[63] == 1'b1) ? {1'b1,wAddSubB_Result[30:0]} : {1'b0,wAddSubB_Result[30:0]};//wAddSubB_Result[31:0]; `MAG: ResultC = wSquareRoot_Result; `ZERO: ResultC = 32'b0; `COPY: ResultC = iChannel_Az; `TMREAD: ResultC = iTMEMReadData[31:0]; `LEA: ResultC = {16'b0,iCurrentIP}; `SWIZZLE3D: ResultC = wSwizzleOutputZ; //Set Operations `UNSCALE: ResultC = iChannel_Az >> `SCALE; `SETX,`RET: ResultC = iChannel_Bz; // {Source1[95:64],Source0[63:32],Source0[31:0]}; `SETY: ResultC = iChannel_Bz; // {Source0[95:64],Source1[95:64],Source0[31:0]}; `SETZ: ResultC = iChannel_Ax; // {Source0[95:64],Source0[63:32],Source1[95:64]}; `INC,`INCX,`INCY,`INCZ: ResultC = (wAddSubC_Result[63] == 1'b1) ? {1'b1,wAddSubC_Result[30:0]} : {1'b0,wAddSubC_Result[30:0]}; //wAddSubC_Result[31:0];// & 32'h7FFFFFFF; `DEC: ResultC = (wAddSubC_Result[63] == 1'b1) ? {1'b1,wAddSubC_Result[30:0]} : {1'b0,wAddSubC_Result[30:0]}; //wAddSubC_Result[31:0];// & 32'h7FFFFFFF; `MOD: ResultC = wModulus2N_ResultC; `FRAC: ResultC = iChannel_Az & (`WIDTH'hFFFFFFFF >> (`WIDTH - `SCALE)); `MULP: ResultC = wMultiplicationA_Result[31:0]; `NEG: ResultC = ~iChannel_Az + 1'b1; `XCHANGEX: ResultC = iChannel_Az; default: begin `ifdef DEBUG //$display("%dns ALU: Error Unknown Operation: %d",$time,iOperation); //$stop(); `endif ResultC = 32'b0; end endcase end //------------------------------------------------------------------------ always @ ( * ) begin case (iOperation) `JMP,`CALL,`RET: oBranchTaken = OutputReady; `JGX: oBranchTaken = wArithmeticComparison_Result; `JGY: oBranchTaken = wArithmeticComparison_Result; `JGZ: oBranchTaken = wArithmeticComparison_Result; `JLX: oBranchTaken = wArithmeticComparison_Result; `JLY: oBranchTaken = wArithmeticComparison_Result; `JLZ: oBranchTaken = wArithmeticComparison_Result; `JEQX: oBranchTaken = wArithmeticComparison_Result; `JEQY: oBranchTaken = wArithmeticComparison_Result; `JEQZ: oBranchTaken = wArithmeticComparison_Result; `JNEX: oBranchTaken = wArithmeticComparison_Result; `JNEY: oBranchTaken = wArithmeticComparison_Result; `JNEZ: oBranchTaken = wArithmeticComparison_Result; `JGEX: oBranchTaken = wArithmeticComparison_Result; `JGEY: oBranchTaken = wArithmeticComparison_Result; `JGEZ: oBranchTaken = wArithmeticComparison_Result; `JLEX: oBranchTaken = wArithmeticComparison_Result; `JLEY: oBranchTaken = wArithmeticComparison_Result; `JLEZ: oBranchTaken = wArithmeticComparison_Result; default: oBranchTaken = 0; endcase end always @ ( * ) begin case (iOperation) `JMP,`CALL,`RET,`JGX,`JGY,`JGZ,`JLX,`JLY,`JLZ,`JEQX,`JEQY,`JEQZ, `JNEX,`JNEY,`JNEZ,`JGEX,`JGEY,`JGEZ: oBranchNotTaken = !oBranchTaken && OutputReady; `JLEX: oBranchNotTaken = !oBranchTaken && OutputReady; `JLEY: oBranchNotTaken = !oBranchTaken && OutputReady; `JLEZ: oBranchNotTaken = !oBranchTaken && OutputReady; default: oBranchNotTaken = 0; endcase end //------------------------------------------------------------------------ //Output ready logic Stuff for Division... //Some FFT will hopefully do the trick wire wDivisionOutputReadyA,wDivisionOutputReadyB,wDivisionOutputReadyC; wire wDivisionOutputReady; assign wAddSubAOutputReady = wAddSubA_OutputReady; assign wAddSubBOutputReady = wAddSubB_OutputReady; assign wAddSubCOutputReady = wAddSubC_OutputReady; FFT1 FFT_DivisionA ( .D(1'b1), .Clock( wDivisionA_OutputReady ), .Reset( iInputReady ), .Q( wDivisionOutputReadyA ) ); FFT1 FFT_DivisionB ( .D(1'b1), .Clock( wDivisionB_OutputReady ), .Reset( iInputReady ), .Q( wDivisionOutputReadyB ) ); FFT1 FFT_DivisionC ( .D(1'b1), .Clock( wDivisionC_OutputReady ), .Reset( iInputReady ), .Q( wDivisionOutputReadyC ) ); assign wDivisionOutputReady = ( wDivisionOutputReadyA && wDivisionOutputReadyB && wDivisionOutputReadyC ); assign wMultiplicationOutputReadyA = wMultiplicationA_OutputReady; assign wMultiplicationOutputReadyB = wMultiplicationB_OutputReady; assign wMultiplicationOutputReadyC = wMultiplicationC_OutputReady; assign wMultiplicationOutputReadyD = wMultiplicationD_OutputReady; assign wMultiplicationOutputReady = ( wMultiplicationOutputReadyA && wMultiplicationOutputReadyB && wMultiplicationOutputReadyC ); wire wSquareRootOutputReady; FFT1 FFT_Sqrt ( .D(1'b1), .Clock( wSquareRoot_OutputReady ), .Reset( iInputReady ), .Q( wSquareRootOutputReady ) ); //------------------------------------------------------------------------ wire wOutputDelay1Cycle,wOutputDelay2Cycle,wOutputDelay3Cycle; FFD_POSEDGE_ASYNC_RESET # (1) FFOutputReadyDelay2 ( .Clock( Clock ), .Clear( Reset ), .D( iInputReady ), .Q( wOutputDelay1Cycle ) ); FFD_POSEDGE_ASYNC_RESET # (1) FFOutputReadyDelay22 ( .Clock( Clock ), .Clear( Reset ), .D( wOutputDelay1Cycle ), .Q( wOutputDelay2Cycle ) ); FFD_POSEDGE_ASYNC_RESET # (1) FFOutputReadyDelay222 ( .Clock( Clock && wOperation == `OMWRITE), .Clear( Reset ), .D( wOutputDelay2Cycle ), .Q( wOutputDelay3Cycle ) ); FFD_POSEDGE_SYNCRONOUS_RESET # ( `INSTRUCTION_OP_LENGTH ) SourceZ2 ( .Clock( Clock ), .Reset( Reset ), .Enable( iInputReady ), .D( iOperation ), .Q(wOperation) ); //Mux for output ready signal always @ ( * ) begin case ( wOperation ) `UNSCALE: OutputReady = wOutputDelay1Cycle; `RETURN: OutputReady = wOutputDelay1Cycle; `NOP: OutputReady = wOutputDelay1Cycle; `FRAC: OutputReady = wOutputDelay1Cycle; `NEG: OutputReady = wOutputDelay1Cycle; `OMWRITE: OutputReady = wOutputDelay3Cycle; `TMREAD: OutputReady = wTMReadOutputReady; //One cycle after TMEM data availale asserted `ifdef DEBUG //Debug Print behaves as a NOP in terms of ALU... `DEBUG_PRINT: OutputReady = wOutputDelay1Cycle; `endif `ADD,`INC,`INCX,`INCY,`INCZ: OutputReady = wAddSubAOutputReady && wAddSubBOutputReady && wAddSubCOutputReady; `SUB,`DEC: OutputReady = wAddSubAOutputReady && wAddSubBOutputReady && wAddSubCOutputReady; `DIV: OutputReady = wDivisionOutputReady; `MUL,`IMUL: OutputReady = wMultiplicationOutputReady; `MULP: OutputReady = wMultiplicationOutputReadyA; `DOT: OutputReady = wAddSubBOutputReady; `CROSS: OutputReady = wAddSubAOutputReady && wAddSubBOutputReady && wAddSubCOutputReady; `MAG: OutputReady = wSquareRootOutputReady; `ZERO: OutputReady = wOutputDelay1Cycle; `COPY: OutputReady = wOutputDelay1Cycle; `SWIZZLE3D: OutputReady = wOutputDelay1Cycle; `SETX,`SETY,`SETZ,`JMP,`LEA,`CALL,`RET: OutputReady = wOutputDelay1Cycle; `JGX,`JGY,`JGZ: OutputReady = ArithmeticComparison_OutputReady; `JLX,`JLY,`JLZ: OutputReady = ArithmeticComparison_OutputReady; `JEQX,`JEQY,`JEQZ: OutputReady = ArithmeticComparison_OutputReady; `JNEX,`JNEY,`JNEZ: OutputReady = ArithmeticComparison_OutputReady; `JGEX,`JGEY,`JGEZ: OutputReady = ArithmeticComparison_OutputReady; `JLEX,`JLEY,`JLEZ: OutputReady = ArithmeticComparison_OutputReady; `MOD: OutputReady = wAddSubAOutputReady && //TODO: wait 1 more cycle wAddSubBOutputReady && wAddSubCOutputReady; `XCHANGEX: OutputReady = wOutputDelay1Cycle; default: begin OutputReady = 32'b0; //`ifdef DEBUG //$display("*** ALU ERROR: iOperation = %d ***",iOperation); //`endif end endcase end endmodule //------------------------------------------------------------------------
Go to most recent revision | Compare with Previous | Blame | View Log