OpenCores
URL https://opencores.org/ocsvn/thor/thor/trunk

Subversion Repositories thor

[/] [thor/] [trunk/] [FT64/] [rtl/] [seq/] [FT64seq.v] - Rev 54

Go to most recent revision | Compare with Previous | Blame | View Log

// ============================================================================
//        __
//   \\__/ o\    (C) 2017-2018  Robert Finch, Waterloo
//    \  __ /    All rights reserved.
//     \/_//     robfinch<remove>@finitron.ca
//       ||
//
// FT64seq.v
// - FT64 processing core - sequential version
//
// This source file is free software: you can redistribute it and/or modify 
// it under the terms of the GNU Lesser General Public License as published 
// by the Free Software Foundation, either version 3 of the License, or     
// (at your option) any later version.                                      
//                                                                          
// This source file is distributed in the hope that it will be useful,      
// but WITHOUT ANY WARRANTY; without even the implied warranty of           
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the            
// GNU General Public License for more details.                             
//                                                                          
// You should have received a copy of the GNU General Public License        
// along with this program.  If not, see <http://www.gnu.org/licenses/>.    
//
// ============================================================================
//
// Comment out the following line to exclude AMO operations from the core.
`define EXT_A	1'b1
// Comment out the following line to exclude multiply/divide operations from the core.
`define EXT_M	1'b1
 
`define BRK		6'h00
`define R2		6'h02
`define R1			6'h01
`define ABS				5'h04
`define NOT             5'h05
`define SUB			6'h05
`define Scc		    6'h06
`define Sccu	    6'h07
`define SHIFTW		6'h0F
`define SHIFTB		6'h1F
`define LEAX		6'h18
`define SYNC		6'h22
`define SHIFTC		6'h2F
`define SEI			6'h30
`define WAIT		6'h31
`define RTI			6'h32
`define RTE			6'h32
`define DIVMODU		6'h3C
`define DIVMODSU	6'h3D
`define DIVMOD		6'h3E
`define SHIFTH		6'h3F
`define BccR	6'h03
`define ADD		6'h04
`define CMP		6'h06
`define CMPU	6'h07
`define AND		6'h08
`define OR		6'h09
`define XOR		6'h0A
`define REX		6'h0D
`define CSR		6'h0E
`define LH		6'h10
`define LHU		6'h11
`define LW		6'h12
`define LB		6'h13
`define SH		6'h14
`define SB		6'h15
`define SW		6'h16
`define SWC		6'h17
`define JAL		6'h18
`define CALL	6'h19
`define QOPI	6'h1A
`define QOR			3'd0
`define QADD		3'd1
`define QAND		3'd2
`define QXOR		3'd3
`define SccI	6'h1B
`define NOP		6'h1C
`define LWR		6'h1D
`define LC		6'h20
`define LCU		6'h21
`define BITFLD	6'h22
`define LBU		6'h23
`define SC		6'h24
`define BBc0	6'h26
`define BBc1	6'h27
`define JMP		6'h28
`define LINK	6'h2A
`define MODUI	6'h2C
`define MODSUI	6'h2D
`define MODI	6'h2E
`define AMO		6'h2F
`define AMOSWAP		6'h00
`define AMOADD		6'h04
`define AMOAND		6'h08
`define AMOOR		6'h09
`define AMOXOR		6'h0A
`define AMOSHL		6'h0C
`define AMOSHR		6'h0D
`define AMOASR		6'h0E
`define AMOROL		6'h0F
`define AMOMIN		6'h1C
`define AMOMAX		6'h1D
`define AMOMINU		6'h1E
`define AMOMAXU		6'h1F
`define AMOSWAPI	6'h20
`define AMOADDI		6'h24
`define AMOANDI		6'h28
`define AMOORI		6'h29
`define AMOXORI		6'h2A
`define AMOSHLI		6'h2C
`define AMOSHRI		6'h2D
`define AMOASRI		6'h2E
`define AMOROLI		6'h2F
`define AMOMINI		6'h3C
`define AMOMAXI		6'h3D
`define AMOMINUI	6'h3E
`define AMOMAXUI	6'h3F
`define Bcc0	6'h30
`define Bcc1	6'h31
`define BEQ0	6'h32
`define BEQ1	6'h33
`define MULU	6'h38
`define MULSU	6'h39
`define MUL		6'h3A
`define DIVUI	6'h3C
`define DIVSUI	6'h3D
`define DIVI	6'h3E
 
`define SHL		4'h0
`define SHR		4'h1
`define ASL		4'h2
`define ASR		4'h3
`define ROL		4'h4
`define ROR		4'h5
`define SHLI	4'h8
`define SHRI	4'h9
`define ASLI	4'hA
`define ASRI	4'hB
`define ROLI	4'hC
`define RORI	4'hD
 
`define BEQ		4'h0
`define BNE		4'h1
`define BLT		4'h2
`define BGE		4'h3
`define BLTU	4'h4
`define BGEU	4'h5
`define FBEQ	4'h8
`define FBNE	4'h9
`define FBLT	4'hA
`define FBGE	4'hB
 
`define HARTID	11'h001
`define TICK	11'h002
`define CAUSE	11'h006
`define SCRATCH	11'h009
`define SEMA	11'h00C
`define TVEC	11'b000_0011_0???
`define TIME	11'h7E0
`define INSTRET	11'h7E1
 
module FT64seq(hartid_i, sig_i, rst_i, clk_i, tm_clk_i, irq_i, cause_i,
	cyc_o, stb_o, ack_i, sel_o, we_o, adr_o, dat_i, dat_o, sr_o, cr_o, rb_i,
	state);
input [63:0] hartid_i;
input [63:0] sig_i;
input rst_i;
input clk_i;
input tm_clk_i;				// 100 MHz
input [2:0] irq_i;
input [8:0] cause_i;
output reg cyc_o;
output reg stb_o;
input ack_i;
output reg [15:0] sel_o;
output reg we_o;
output reg [31:0] adr_o;
input [127:0] dat_i;
output reg [127:0] dat_o;
output reg sr_o;
output reg cr_o;
input rb_i;
output reg [7:0] state;
 
// Wall clock timing parameter. Number of tm_clk_i cycles for 1s interval
parameter WCTIME1S = 32'd100000000;
 
parameter RST_ADDR = 32'hFFFC0100;
parameter RESET = 8'd0;
parameter IFETCH = 8'd1;
parameter IFETCH_ACK = 8'd2;
parameter IFETCH_NACK = 8'd3;
parameter REGFETCH = 8'd4;
parameter DECODE = 8'd5;
parameter EXECUTE = 8'd6;
parameter MEMORY = 8'd7;
parameter MEMORY_NACK = 8'd8;
parameter MULDIV2 = 8'd9;
parameter AMOOP = 8'd10;
parameter AMOMEM = 8'd11;
parameter word = 2'd3;
parameter half = 2'd2;
parameter char = 2'd1;
parameter byt_ = 2'd0;
 
integer n, m;
reg [63:0] sema;
reg [43:0] brkstack [0:4];
reg [31:0] tvec [0:7];
reg [2:0] ol;
reg [2:0] im;
reg [7:0] pl;
reg [31:0] pc,opc;
reg [31:0] ir;
wire [5:0] opcode = ir[5:0];
wire [5:0] funct = ir[31:26];
wire [4:0] func5 = ir[25:21];
wire [3:0] func4 = ir[25:22];
reg [1:0] opsize;
reg [31:0] ibuf_adr [0:7];
reg [31:0] ibuf [0:7];
reg [2:0] ibuf_cnt;
reg rfwr;
reg [4:0] Ra, Rb, Rc, Rt;
reg [63:0] regfile [0:31];
wire [63:0] rfoa = regfile[Ra];
wire [63:0] rfob = regfile[Rb];
wire [63:0] rfoc = regfile[Rc];
reg [63:0] a,b,c,res,amores;
reg [31:0] rasstack [0:511];
reg [8:0] rassp;
reg [4:0] regLR = 5'd29;
 
// CSR's
reg [8:0] cause;
reg [63:0] scratch;
reg [63:0] tick;
reg [63:0] wctime, times;
reg [63:0] instret;
 
wire [127:0] produ;// = a * b;
wire [127:0] prods;// = $signed(a) * $signed(b);
wire [127:0] prodsu;// = $signed(a) * b;
wire [2:0] npl = ir[23:16] | a;
wire [63:0] sum = a + b;
wire [63:0] dif = a - b;
wire [31:0] eandx = a + (b << ir[22:21]);
wire [63:0] am8 = a - 32'd8;	// for link
wire [31:0] xIncea = ir[25] ? a + {{59{ir[25]}},ir[25:21]} : a;	// for POP / PUSH
 
reg [63:0] opimp;
reg [63:0] fnimp;
 
function [23:0] regname;
input [4:0] regno;
case(regno)
5'd0:	regname = "r0";
5'd1:	regname = "r1";
5'd2:	regname = "r2";
5'd3:	regname = "r3";
5'd4:	regname = "r4";
5'd5:	regname = "r5";
5'd6:	regname = "r6";
5'd7:	regname = "r7";
5'd8:	regname = "r8";
5'd9:	regname = "r9";
5'd10:	regname = "r10";
5'd11:	regname = "r11";
5'd12:	regname = "r12";
5'd13:	regname = "r13";
5'd14:	regname = "r14";
5'd15:	regname = "r15";
5'd16:	regname = "r16";
5'd17:	regname = "r17";
5'd18:	regname = "r18";
5'd19:	regname = "r19";
5'd20:	regname = "r20";
5'd21:	regname = "r21";
5'd22:	regname = "r22";
5'd23:	regname = "r23";
5'd24:	regname = "r24";
5'd25:	regname = "r25";
5'd26:	regname = "r26";
5'd27:	regname = "r27";
5'd28:	regname = "r28";
5'd29:	regname = "lr";
5'd30:	regname = "bp";
5'd31:	regname = "sp";
endcase
endfunction
 
always @*
begin
m <= 4'hF;
for (n = 0; n < 8; n = n + 1)
	if (pc==ibuf_adr[n])
		m <= n;
end
 
reg [127:0] din;	// input data latch
reg [3:0] dshift;
wire [7:0] byte_in = din >> {dshift[3:0],3'b0};
wire [15:0] char_in = din >> {dshift[3:1],4'h0};
wire [31:0] half_in = din >> {dshift[3:2],5'h0};
wire [63:0] word_in = din >> {dshift[3],6'h0};
 
wire [127:0] shlo = {64'd0,a} << b[5:0];
wire [127:0] shro = {a,64'd0} >> b[5:0];
wire [31:0]  asro32 = a[31] ? ~(32'hFFFFFFFFFFFFFFFF >> b[5:0]) | shro[95:64] : shro[95:64];
 
wire [63:0] bfo;
wire [63:0] shiftwo;
wire [31:0] shiftho;
 
FT64_shift uws1
(
	.instr(ir),
	.a(a),
	.b(b),
	.res(shiftwo),
	.ov()
);
 
FT64_shifth uhws1
(
	.instr(ir),
	.a(a[31:0]),
	.b(b[31:0]),
	.res(shiftho),
	.ov()
);
 
FT64_bitfield ubf1
(
	.inst(ir),
	.a(a),
	.b(b),
	.o(bfo),
	.masko()
);
 
reg div_ld, mul_ld;
reg [4:0] mul_cnt;
wire div_done;
wire [63:0] div_qo, div_ro;
wire div_sgn = opcode==`DIVI || opcode==`MODI || (opcode==`R2 && (funct==`DIVMOD));
wire div_sgnus = opcode==`DIVSUI || opcode==`MODSUI || (opcode==`R2 && (funct==`DIVMODSU));
 
`ifdef EXT_M
FT64_divider udiv1
(
	.rst(rst_i),
	.clk(clk_i),
	.ld(div_ld),
	.abort(),
	.sgn(div_sgn),
	.sgnus(div_sgnus),
	.a(a),
	.b(b),
	.qo(div_qo),
	.ro(div_ro),
	.dvByZr(),
	.done(div_done),
	.idle()
);
 
FT64_mul umul1
(
	.CLK(clk_i),
	.A(a),
	.B(b),
	.P(prods)
);
 
FT64_mulu umul2
(
	.CLK(clk_i),
	.A(a),
	.B(b),
	.P(produ)
);
 
FT64_mulsu umul3
(
	.CLK(clk_i),
	.A(a),
	.B(b),
	.P(prodsu)
);
`endif
 
wire takb;
 
FT64_EvalBranch ube1
(
	.instr(ir),
	.a(a),
	.b(b),
	.takb(takb)
);
 
always @(posedge clk_i)
if (rst_i)
	mul_cnt <= 5'd19;
else begin
	if (mul_ld)
		mul_cnt <= 5'd1;
	else if (mul_cnt < 5'd19)
		mul_cnt <= mul_cnt + 5'd1;
end
wire mul_done = mul_cnt==5'd19;
 
always @(posedge clk_i)
	if (ack_i)
		din <= dat_i;
always @(posedge clk_i)
	if (ack_i)
		dshift <= adr_o[3:0];
 
reg rbl;
always @(posedge clk_i)
	if (ack_i)
		rbl <= rb_i;
 
always @(posedge clk_i)
	if (rst_i)
		tick <= 63'd0;
	else
		tick <= tick + 64'd1;
 
always @(posedge clk_i)
if (rst_i)
	state <= RESET;
else begin
 
// Cause these signals to pulse for just one clock cycle. They are set
// active below.
div_ld <= `FALSE;
mul_ld <= `FALSE;
rfwr <= `FALSE;
 
case(state)
 
// RESET:
// Reset only the signals critical to the proper operation of the core.
// This includes setting the PC address and deactivating the bus
// controls.
RESET:
	begin
	im <= 3'd7;
	ol <= 3'd0;
	pl <= 8'h00;
	pc <= RST_ADDR;
	cyc_o <= `LOW;
	stb_o <= `LOW;
	we_o <= `LOW;
	sel_o <= 16'h0000;
	adr_o <= 32'hFFFFFFFF;
	instret <= 64'd0;
	opimp <= 64'h000F_F1FF_3FFF_67DD;
`ifdef EXT_A
	opimp[47] <= 1'b1;
`endif
`ifdef EXT_M
	opimp[63:55] <= 8'h77;
`endif
	fnimp <= 64'h8005_701F_A1FF_87F4;
`ifdef EXT_M
	fnimp[63:55] <= 8'h77;
`endif
	goto(IFETCH);
	end
 
// IFETCH:
// Fetch instructions from memory located by the program counter. A fully
// associative buffer (cache) of the most recently used eight instructions
// is maintained. A memory access won't be required if the instruction can
// be found in the buffer.
// Also update the register file for the previous instruction. Rather than
// have another state in the state machine to perform the register update
// it is done here to improve performance.
IFETCH:
	begin
		opc <= pc;
		instret <= instret + 64'd1;
		if (irq_i > im) begin
			ir <= {13'd0,irq_i,1'b0,cause_i,`BRK};
			goto(DECODE);
		end
		else if (m[3]) begin
			cyc_o <= `HIGH;
			stb_o <= `HIGH;
			sel_o <= 16'hF << {pc[3:2],2'b0};
			adr_o <= pc;
			goto(IFETCH_ACK);
		end
		else begin
			ir <= ibuf[m];
			pc <= pc + 32'd4;
			$display("ir: %h (from ibuf)", ibuf[m]);
			goto(DECODE);
		end
	end
IFETCH_ACK:
	if (ack_i) begin
		cyc_o <= `LOW;
		stb_o <= `LOW;
		sel_o <= 16'h0000;
		//adr_o <= 32'hFFFFFFFF;
		goto(IFETCH_NACK);
	end
IFETCH_NACK:
	if (~ack_i) begin
		ir <= half_in;
		ibuf[ibuf_cnt] <= half_in;
		ibuf_adr[ibuf_cnt] <= pc;
		ibuf_cnt <= ibuf_cnt + 3'd1;
		pc <= pc + 32'd4;
		$display("ir: %h", half_in);
		goto(DECODE);
	end
 
// DECODE:
// Setup for register file access. Ra, Rb, Rc are almost always decoded from
// the same spot in the instruction register to keep the decoding simple and
// access to the register file fast. For the call instruction Ra is forced to
// r31 since it doesn't come from the ir. Rt tends to float around depending on
// the instruction.
// Several instructions which do not have register operands (JMP,NOP,RTI, and
// BRK) are executed directly in the decode stage to improve performance.
DECODE:
	begin
		goto(REGFETCH);
		Ra <= ir[10:6];
		Rb <= ir[15:11];
		Rc <= ir[20:16];
		Rt <= 5'd0;
		opsize <= word;
		if (!opimp[opcode])
			exe_brk(9'd485);	// unimplemented
		case(opcode)
		`BRK:
			exe_brk(ir[14:6]);
		`R2:
			begin
				if (!fnimp[opcode])
					exe_brk(9'd485);	// unimplemented
				Rt <= ir[20:16];
				case(funct)
				`R1:
					case(func5)
					`ABS,`NOT:	Rt <= ir[15:11];
					endcase
				`ADD,`SUB:
				    opsize <= ir[22:21];
				`AND,`OR,`XOR:
					Rt <= ir[25:21];
				`SHIFTB,`SHIFTC,`SHIFTH,`SHIFTW:
					Rt <= ir[25] ? ir[15:11] : ir[20:16];
				// The SYNC instruction is treated as a NOP since this machine
				// is strictly in order.
				`SYNC:	goto(IFETCH);
				`SB,`SC,`SH,`SW,`SWC:	Rt <= 5'd0;
				endcase
			end
		`NOP:	goto(IFETCH);
		`JMP:
			begin
			pc <= {pc[31:28],ir[31:6],2'b00};
			goto(IFETCH);
			end
		`CALL:
			Rt <= regLR;
		`JAL:
			Rt <= ir[15:11];
		`CSR:
			Rt <= ir[15:11];
		`QOPI:
			begin
			Ra <= ir[15:11];
			Rt <= ir[15:11];
			end
		`BITFLD:
			Rt <= ir[15:11];
		`ADD,`CMP,`CMPU,`AND,`OR,`XOR,
`ifdef EXT_M
		`MULU,`MUL,`MULSU,
		`DIVI,`DIVUI,`DIVSUI,`MODI,`MODUI,`MODSUI,
`endif
		`LB,`LBU,`LC,`LCU,`LH,`LHU,`LW,`LWR:
			Rt <= ir[15:11];
		`SB,`SC,`SH,`SW,`SWC:
			Rt <= 5'd0;
`ifdef EXT_A
		`AMO:
			Rt <= ir[31] ? ir[15:11] : ir[20:16];
`endif
		default: ;
		endcase
	end
 
// REGFETCH:
// Set operands from the register file, or the instruction register for
// immediate operands.
REGFETCH:
	begin
		goto(EXECUTE);
		a <= rfoa;
		b <= rfob;
		case(opcode)
		`R2:
			case(funct)
			`SHIFTW,`SHIFTB,`SHIFTC,`SHIFTH:
				if (ir[25]) b <= ir[21:16];
			`AND,`OR,`XOR:
				c <= rfoc;
`ifdef EXT_M				
			`MUL,`MULU,`MULSU:
				mul_ld <= `TRUE;
			`DIVMOD,`DIVMODU,`DIVMODSU:
				div_ld <= `TRUE;
`endif
			`LB,`LBU,`LH,`LHU,`LC,`LCU,`LW,`LWR,
			`SB,`SC,`SH,`SW,`SWC:
				c <= rfoc;
			endcase
		`ADD,`CMP,`CMPU,`AND,`OR,`XOR:
			b <= {{48{ir[31]}},ir[31:16]};
		`SccI:
			b <= {{52{ir[27]}},ir[27:16]};
`ifdef EXT_M
		`MUL,`MULU,`MULSU:
			begin
			b <= {{48{ir[31]}},ir[31:16]};
			mul_ld <= `TRUE;
			end
		`DIVI,`MODI,`DIVUI,`DIVSUI,`MODUI,`MODSUI:
			begin
			b <= {{48{ir[31]}},ir[31:16]};
			div_ld <= `TRUE;
			end
`endif		
		`QOPI:
			begin
				case(ir[10:8])
				3'd0,3'd3:	// OR, XOR
					case(ir[7:6])
					2'd0:	b <= {{48{1'b0}},ir[31:16]};
					2'd1:	b <= {{32{1'b0}},ir[31:16]} << 16;
					2'd2:	b <= {{16{1'b0}},ir[31:16]} << 32;
					2'd3:	b <= {ir[31:16]} << 48;
					endcase
				3'd1:	// ADD
					case(ir[7:6])
					2'd0:	b <= {{48{ir[31]}},ir[31:16]};
					2'd1:	b <= {{32{ir[31]}},ir[31:16]} << 16;
					2'd2:	b <= {{16{ir[31]}},ir[31:16]} << 32;
					2'd3:	b <= {ir[31:16]} << 48;
					endcase
				3'd2:	// AND
					case(ir[7:6])
					2'd0:	b <= {{48{1'b1}},ir[31:16]};
					2'd1:	b <= {{32{1'b1}},ir[31:16],16'hFFFF};
					2'd2:	b <= {{16{1'b1}},ir[31:16],32'hFFFFFFFF};
					2'd3:	b <= {ir[31:16],48'hFFFFFFFFFFFF};
					endcase
				default:	b <= 64'd0;
				endcase
			end
		`Bcc0,`Bcc1,`BccR,`BBc0,`BBc1:
			c <= rfoc;
		`BEQ0,`BEQ1:
			b <= {{55{ir[19]}},ir[19:11]};
		`JAL:
			b <= {{48{ir[31]}},ir[31:16]};
		`LB,`LBU,`LH,`LHU,`LC,`LCU,`LW,`LWR,
		`SB,`SC,`SH,`SW,`SWC:
			begin
			b <= {{48{ir[31]}},ir[31:16]};
			c <= rfob;
			end
`ifdef EXT_A		
		`AMO:
			if (ir[31])
				b <= {{59{ir[20]}},ir[20:16]};
`endif			
		endcase
	end
 
// EXECUTE:
// Execute the instruction. Compute results and begin any memory access.
EXECUTE:
	begin
		goto(IFETCH);
		case(opcode)
		`R2:
			case(funct)
			`RTE:
				begin
					pc <= {brkstack[0][43:14],2'b00};
					pl <= brkstack[0][13:6];
					ol <= brkstack[0][5:3];
					im <= brkstack[0][2:0];
					for (n = 0; n < 4; n = n + 1)
						brkstack[n] <= brkstack[n+1];
					sema[0] <= 1'b0;
					sema[ir[21:16]|a[5:0]] <= 1'b0;
				end
			`R1:
				case(func5)
				`ABS:	begin res <= a[63] ? -a : a; rfwr <= `TRUE; end
				`NOT:   begin res <= a!=0 ? 64'd0 : 64'd1; rfwr <= `TRUE; end
				endcase
			`SEI:	im <= a[2:0] | ir[18:16];
			`SHIFTW:
			    begin
			    rfwr <= `TRUE;
			    res <= shiftwo;
                end
			`SHIFTH:
                begin
                rfwr <= `TRUE;
                case(func4)
                `SHL,`SHLI:    res <= {32'd0,shiftho};
                `SHR,`SHRI:    res <= {32'd0,shiftho};
                `ASL,`ASLI:    res <= {{32{shiftho[31]}},shiftho};
                `ASR,`ASRI:    res <= {{32{shiftho[31]}},shiftho};
                `ROL,`ROLI: begin
                            res[31:0] <= shiftho;
                            res[63:32] <= {32{shiftho[31]}};
                            end
                `ROR,`RORI: begin
                            res[31:0] <= shiftho;
                            res[63:32] <= {32{shiftho[31]}};
                            end
                endcase
                end
            `ADD:	begin
                    rfwr <= `TRUE;
                    case(opsize)
                    word:   res <= sum;
                    half:   res <= {{32{sum[31]}},sum[31:0]};
                    char:   res <= {{48{sum[15]}},sum[15:0]};
                    byt_:   res <= {{56{sum[7]}},sum[7:0]};
                    endcase
                    end
            `SUB:	begin
                    rfwr <= `TRUE;
                    case(opsize)
                    word:   res <= dif;
                    half:   res <= {{32{dif[31]}},dif[31:0]};
                    char:   res <= {{48{dif[15]}},dif[15:0]};
                    byt_:   res <= {{56{dif[7]}},dif[7:0]};
                    endcase
                    end
			`Scc:	begin
					rfwr <= `TRUE;
					case(ir[25:23])
					3'd0:	res <= $signed(a) < $signed(b) ? 64'hFFFFFFFFFFFFFFFF : a==b ? 64'h0 : 64'h1;
					3'd2:	res <= a==b;
					3'd3:	res <= a!=b;
					3'd4:	res <= $signed(a) < $signed(b);
					3'd5:	res <= $signed(a) >= $signed(b);
					3'd6:	res <= $signed(a) <= $signed(b);
					3'd7:	res <= $signed(a) > $signed(b);
					endcase
					end
			`Sccu:	begin
					rfwr <= `TRUE;
					case(ir[25:23])
					3'd0:	res <= a < b ? 64'hFFFFFFFFFFFFFFFF : a==b ? 64'h0 : 64'h1;
					3'd2:	res <= a==b;
					3'd3:	res <= a!=b;
					3'd4:	res <= a < b;
					3'd5:	res <= a >= b;
					3'd6:	res <= a <= b;
					3'd7:	res <= a > b;
					endcase
					end
`ifdef EXT_M					
			`MULU:	if (mul_done) begin
						res <= ir[25:23]==3'd0 ? produ[63:0] : produ[127:64];
						rfwr <= `TRUE;
						goto(IFETCH);
					end
					else
						goto(EXECUTE);
			`MUL:	if (mul_done) begin
						res <= ir[25:23]==3'd0 ? prods[63:0] : prods[127:64];
						rfwr <= `TRUE;
						goto(IFETCH);
					end
					else
						goto(EXECUTE);
			`MULSU:	if (mul_done) begin
						res <= ir[25:23]==3'd0 ? prodsu[63:0] : prodsu[127:64];
						rfwr <= `TRUE;
						goto(IFETCH);
					end
					else
						goto(EXECUTE);
			// For divide stay in the EXECUTE state until the divide is done.
			`DIVMOD,`DIVMODU,`DIVMODSU:
					if (div_done) begin
						res <= ir[25:23]==3'd0 ? div_qo : div_ro;
						rfwr <= `TRUE;
						goto(IFETCH);
					end
					else
						goto(EXECUTE);
`endif				
			`AND:	begin res <= a & b & c; rfwr <= `TRUE; end
			`OR:	begin res <= a | b | c; rfwr <= `TRUE; end
			`XOR:	begin res <= a ^ b ^ c; rfwr <= `TRUE; end
			`LEAX:
				begin
					rfwr <= `TRUE;
					res <= eandx;
				end
			`LB,`LBU:	wb_read(16'h01 << eandx[3:0], eandx);
			`LC,`LCU:	wb_read(16'h03 << {eandx[3:1],1'b0}, eandx);
			`LH,`LHU:	wb_read(16'h0F << {eandx[3:2],2'b0}, eandx);
			`LW:		wb_read(16'hFF << {eandx[3],3'b0}, eandx);
			`LWR: begin wb_read(16'hFF << {eandx[3],3'b0}, eandx); sr_o <= `HIGH; end
			`SB:	wb_write(16'h01 << eandx[3:0],eandx,{8{c[7:0]}});
			`SC:	wb_write(16'h03 << {eandx[3:1],1'b0},eandx,{4{c[15:0]}});
			`SH:	wb_write(16'h0F << {eandx[3:2],2'b0},eandx,{2{c[31:0]}});
			`SW:	wb_write(16'hFF << {eandx[3],3'b0},eandx,c);
			`SWC:
				begin
					cr_o <= `HIGH;
					wb_write(16'hFF << {eandx[3],3'b0},eandx,c);
				end
			endcase
		`ADD:	begin res <= sum; rfwr <= `TRUE; end
		`CMP:	begin res <= $signed(a) < $signed(b) ? 64'hFFFFFFFFFFFFFFFF : a==b ? 64'h0 : 64'h1; rfwr <= `TRUE; end
		`CMPU:	begin res <= a < b ? 64'hFFFFFFFFFFFFFFFF : a==b ? 64'h0 : 64'h1; rfwr <= `TRUE; end
		`SccI:
				begin
				rfwr <= `TRUE;
				case(ir[31:28])
				4'd2:	res <= a==b;
				4'd3:	res <= a!=b;
				4'd4:	res <= $signed(a) < $signed(b);
				4'd5:	res <= $signed(a) >= $signed(b);
				4'd6:	res <= $signed(a) <= $signed(b);
				4'd7:	res <= $signed(a) > $signed(b);
				4'd12:	res <= a < b;
				4'd13:	res <= a >= b;
				4'd14:	res <= a <= b;
				4'd15:	res <= a > b;
				endcase
				end
`ifdef EXT_M				
		`MULU:	if (mul_done) begin res <= produ[63:0]; rfwr <= `TRUE; end else goto(EXECUTE);
		`MUL:	if (mul_done) begin res <= prods[63:0]; rfwr <= `TRUE; end else goto(EXECUTE);
		`MULSU:	if (mul_done) begin res <= prodsu[63:0]; rfwr <= `TRUE; end else goto(EXECUTE);
		// Stay in execute state until divide is done.
		`DIVI,`DIVUI,`DIVSUI:
				if (div_done) begin
					res <= div_qo;
					rfwr <= `TRUE;
				end
				else
					goto(EXECUTE);
		`MODI,`MODUI,`MODSUI:
				if (div_done) begin
					res <= div_ro;
					rfwr <= `TRUE;
				end
				else
					goto(EXECUTE);
`endif					
		`BITFLD:	begin res <= bfo; rfwr <= `TRUE; end
		`AND:	begin res <= a & b; rfwr <= `TRUE; end
		`OR:	begin res <= a | b; rfwr <= `TRUE; end
		`XOR:	begin res <= a ^ b; rfwr <= `TRUE; end
		`QOPI:
		      begin
		      rfwr <= `TRUE;
		      case(ir[10:8])
		      3'd0:   res <= a | b;
		      3'd1:   res <= a + b;
		      3'd2:   res <= a & b;
		      3'd3:   res <= a ^ b;
		      endcase
		      end
		`Bcc0,`Bcc1,`BEQ0,`BEQ1,`BBc0,`BBc1:
			begin
				if (takb)
					pc <= pc + {{21{ir[31]}},ir[31:22],ir[0],2'b00};
				$display("%h: br %h", opc, pc + {{21{ir[31]}},ir[31:22],ir[0],2'b00});
			end
		`BccR:
			begin
				if (takb)
					pc <= c;
				$display("%h: br %h", opc, c);
			end
		`JAL:
			begin
				pc <= {sum[31:2],2'b00};
				rfwr <= `TRUE;
				res <= pc;
			end
		`CALL:
			begin
				pc <= {pc[31:28],ir[31:6],2'b00};
				res <= pc;
				rfwr <= `TRUE;
				$display("%h: jal %h", opc, {pc[31:28],ir[31:6],2'b00});
			end
		`REX:
			begin
				ol <= ir[13:11];
				case(ir[13:11])
				3'd0:		pl <= 8'h00;
				3'd1:		pl <= 8'h01;
				default:	pl <= (npl < 2) ? {5'd0,ir[13:11]} : npl;
				endcase
				if (ir[13:11]!=3'd0)
					pc <= tvec[ir[13:11]];
				im <= ir[26:24];
			end
		`CSR:
			begin
				case(ir[31:30])
				2'd0:	begin read_csr(ir[26:16],res); rfwr <= `TRUE; end
				default:begin
							rfwr <= `TRUE;
							read_csr(ir[26:16],res);
							write_csr(ir[26:16],ir[31:30],a);
						end
				endcase
			end
		`LB,`LBU:	wb_read(16'h01 << sum[3:0],sum);
		`LC,`LCU:	wb_read(16'h03 << {sum[3:1],1'b0},sum);
		`LH,`LHU:	wb_read(16'h0F << {sum[3:2],2'b0},sum);
		`LW:		wb_read(16'hFF << {sum[3],3'b0},sum);
		`LWR: begin wb_read(16'hFF << {sum[3],3'b0},sum); sr_o <= `HIGH; end
		`SB:	wb_write(16'h01 << sum[3:0],sum,{8{c[7:0]}});
		`SC:	wb_write(16'h03 << {sum[3:1],1'b0},sum,{4{c[15:0]}});
		`SH:	wb_write(16'h0F << {sum[3:2],2'b0},sum,{2{c[31:0]}});
		`SW:	wb_write(16'hFF << {sum[3],3'b0},sum,c);
		`SWC:
			begin
				cr_o <= `HIGH;
				wb_write(16'hFF << {sum[3],3'b0},sum,c);
			end
`ifdef EXT_A			
		`AMO:
			case(ir[22:21])
			byt_:	wb_read(16'h01 << sum[3:0],a);
			char:	wb_read(16'h03 << {sum[3:1],1'b0},a);
			half:	wb_read(16'h0F << {sum[3:2],2'b0},a);
			word:	wb_read(16'hFF << {sum[3],3'b0},a);
			endcase
`endif			
		endcase
	end
 
// MEMORY:
// Finish memory cycle started in EXECUTE by waiting for an ack. Latch input
// data. The data is registered here before subsequent use because it's likely
// coming from a large mux. We don't want to cascade the mux and the shift
// operation required to align the data into a single clock cycle.
// If an AMO operation is in progress keep the cycle active.
MEMORY:
	if (ack_i) begin
		goto(MEMORY_NACK);
`ifdef EXT_A
		if (opcode!=`AMO)
`endif
			cyc_o <= `LOW;
		stb_o <= `LOW;
		we_o <= `LOW;
		sel_o <= 16'h0000;
		sr_o <= `LOW;
		cr_o <= `LOW;
	end
 
// Wait for ack to go back low again. Nomrally ack should go low immediately
// when the bus cycle is terminated within the same clock cycle. However some
// bus slaves don't put ack low until the clock edge when seeing the
// terminated bus cycle. We want to ensure that a second bus cycle isn't
// started until ack is low or the ack could be mistakenly accepted.
MEMORY_NACK:
	if (~ack_i) begin
		goto(IFETCH);
		case(opcode)
		`R2:
			case(funct)
    		`LB:	begin res <= {{56{byte_in[7]}},byte_in}; rfwr <= `TRUE; end
            `LBU:   begin res <= {{56{1'b0}},byte_in}; rfwr <= `TRUE; end
            `LC:    begin res <= {{48{char_in[15]}},char_in}; rfwr <= `TRUE; end
            `LCU:   begin res <= {{48{1'b0}},char_in}; rfwr <= `TRUE; end
            `LH:    begin res <= {{32{half_in[31]}},half_in}; rfwr <= `TRUE; end
            `LHU:   begin res <= {{32{1'b0}},half_in}; rfwr <= `TRUE; end
            `LW:    begin res <= word_in; rfwr <= `TRUE; end
			`SWC:	sema[0] <= rbl;
			endcase	
		`LB:	begin res <= {{56{byte_in[7]}},byte_in}; rfwr <= `TRUE; end
		`LBU:	begin res <= {{56{1'b0}},byte_in}; rfwr <= `TRUE; end
		`LC:	begin res <= {{48{char_in[15]}},char_in}; rfwr <= `TRUE; end
		`LCU:	begin res <= {{48{1'b0}},char_in}; rfwr <= `TRUE; end
		`LH:	begin res <= {{32{half_in[31]}},half_in}; rfwr <= `TRUE; end
		`LHU:	begin res <= {{32{1'b0}},half_in}; rfwr <= `TRUE; end
		`LW:	begin res <= word_in; rfwr <= `TRUE; end
		`SWC:	sema[0] <= rbl;
`ifdef EXT_A		
		`AMO:	begin
					goto(AMOOP);
					case(ir[22:21])
					byt_:	begin 
								res <= {{56{byte_in[7]}},byte_in};
								a <= {{56{byte_in[7]}},byte_in};
								rfwr <= `TRUE;
							end
					char:	begin res <= {{48{char_in[15]}},char_in}; a <= {{48{char_in[15]}},char_in}; rfwr <= `TRUE; end
					half:	begin res <= {{32{half_in[31]}},half_in}; a <= {{32{half_in[31]}},half_in}; rfwr <= `TRUE; end
					word:	begin res <= word_in; a <= word_in; rfwr <= `TRUE; end
					endcase
				end
`endif
		endcase
	end
`ifdef EXT_A
AMOOP:
	begin
		goto(AMOMEM);
		case(funct)
		`AMOSWAP,`AMOSWAPI:	amores <= b;
		`AMOADD,`AMOADDI:	amores <= a + b;
		`AMOAND,`AMOANDI:	amores <= a & b;
		`AMOOR,`AMOORI:		amores <= a | b;
		`AMOXOR,`AMOXORI:	amores <= a ^ b;
		`AMOSHL,`AMOSHLI,
		`AMOSHR,`AMOSHRI,
		`AMOASR,`AMOASRI,
		`AMOROL,`AMOROLI:
			case(ir[22:21])
			half:		amores <= shiftho;
			default:	amores <= shiftwo;
			endcase
		`AMOMIN,`AMOMINI:	amores <= $signed(a) < $signed(b) ? a : b;
		`AMOMAX,`AMOMAXI:	amores <= $signed(a) > $signed(b) ? a : b;
		`AMOMINU,`AMOMINUI:	amores <= a < b ? a : b;
		`AMOMAXU,`AMOMAXUI:	amores <= a > b ? a : b;
		default:	;
		endcase
	end
AMOMEM:
	begin
		goto(MEMORY);
		ir[5:0] <= `NOP;	// <- force memory nack back to ifetch
		case(ir[22:21])
		byt_:	wb_write(16'h01 << adr_o[3:0],adr_o,{8{amores[7:0]}});
		char:	wb_write(16'h03 << {adr_o[3:1],1'b0},adr_o,{4{amores[15:0]}});
		half:	wb_write(16'h0F << {adr_o[3:2],2'b0},adr_o,{2{amores[31:0]}});
		word:	wb_write(16'hFF << {adr_o[3],3'b0},adr_o,amores);
		endcase
	end
`endif
endcase
 
// Handle the register file update. The update is caused in a couple of
// different states. There may be two updates for a single instruction.
// Note that r0 is always forced to zero. A write to r0 may be needed
// before it's used anywhere.
if (rfwr) begin
	regfile[Rt] <= |Rt ? res : 64'd0;
	if (|Rt)
		$display("%s=%h",regname(Rt),res);
end
 
$display("Time: %d", $time);
$display("Tick: %d Instret: %d", tick, instret);
 
end
 
always @(posedge tm_clk_i)
if (rst_i)
	wctime <= 64'd1;
else begin
	if (wctime[31:0]==WCTIME1S) begin
		wctime[31:0] <= 32'd1;
		wctime[63:32] <= wctime[63:32] + 32'd1;
	end
	else
		wctime[31:0] <= wctime[31:0] + 32'd1;
end
always @(posedge clk_i)
	times <= wctime;
 
task exe_brk;
input [8:0] caus;
begin
	for (n = 0; n < 4; n = n + 1)
		brkstack[n+1] <= brkstack[n];
	brkstack[0] <= {pc[31:2],pl,ol,im};
	if (ir[15]==1'b0)
		im <= ir[18:16];
	ol <= 3'd0;
	pl <= 8'h00;
	pc <= tvec[0];
	cause <= caus;
	goto(IFETCH);
end
endtask
 
task read_csr;
input [11:0] regno;
output [63:0] val;
begin
	casez(regno)
	`HARTID:	val <= hartid_i;
	`TICK:		val <= tick;
	`CAUSE:		val <= {55'd0,cause};
	`SCRATCH:	val <= scratch;
	`SEMA:		val <= sema;
	`TVEC:		val <= tvec[regno[2:0]];
	`TIME:		val <= times;
	`INSTRET:	val <= instret;
	endcase
end
endtask
 
task write_csr;
input [11:0] regno;
input [1:0] op;
input [63:0] val;
begin
	case(op)
	2'd0:	;	// read only
	2'd1:
		casez(regno)
		`CAUSE:	cause <= val[8:0];
		`SCRATCH:	scratch <= val;
		`SEMA:	sema <= val;
		`TVEC:	tvec[regno[2:0]] <= val;
		endcase
	2'd2:
		casez(regno)
		`SEMA:	sema <= sema | val;
		endcase
	2'd3:
		casez(regno)
		`SEMA:	sema <= sema & ~val;
		endcase
	endcase
end
endtask
 
task wb_read;
input [15:0] sel;
input [31:0] adr;
begin
	cyc_o <= `HIGH;
	stb_o <= `HIGH;
	sel_o <= sel;
	adr_o <= adr;
	$display("%h: l?[u] %h", opc, adr);
	goto(MEMORY);
end
endtask
 
task wb_write;
input [15:0] sel;
input [31:0] adr;
input [63:0] dat;
begin
	cyc_o <= `HIGH;
	stb_o <= `HIGH;
	we_o <= `HIGH;
	sel_o <= sel;
	adr_o <= adr;
	dat_o <= {2{dat}};
	goto(MEMORY);
	$display("%h: s? %h <= %h", opc, adr, dat);
end
endtask
 
task goto;
input [7:0] st;
begin
	state <= st;
end
endtask
 
endmodule
 

Go to most recent revision | Compare with Previous | Blame | View Log

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.