This lesson starts at commit 52ad976f12300a37998296b9861bfa7bccabac4a.

6. Implementing more instructions

After the hopefully fun diversion in the last lesson, we are back to work. There are 40-ish instructions in the RISC-V base instruction set, and we have only implemented two so far. Let's bang out some more instructions!

Let's grab the RV32/64G Instruction Set Listings of the RISC-V docs.

First, let's just add variables for all the bit fields we don't have yet.

src/core/decode_write.vhd CHANGED Viewed

@@ -31,8 +31,14 @@ begin
 		variable funct7: std_logic_vector(6 downto 0);
 		variable rs1, rs2, rd : std_logic_vector(4 downto 0);
 		variable i_imm: std_logic_vector(11 downto 0);
 		variable i_imm_s: std_logic_vector(31 downto 0);
 		variable v_decode_output: decode_output_t;
 	begin
@@ -51,7 +57,14 @@ begin
 			funct7 := decode_input.instr(31 downto 25);
 			rd     := decode_input.instr(11 downto 7);
 			i_imm := decode_input.instr(31 downto 20);
 			i_imm_s := std_logic_vector(resize(signed(i_imm), 32));
 			v_decode_output := DEFAULT_DECODE_OUTPUT;

 		variable funct7: std_logic_vector(6 downto 0);
 		variable rs1, rs2, rd : std_logic_vector(4 downto 0);
+		variable b_imm: std_logic_vector(12 downto 0);
+		variable b_imm_s: std_logic_vector(31 downto 0);
 		variable i_imm: std_logic_vector(11 downto 0);
 		variable i_imm_s: std_logic_vector(31 downto 0);
+		variable j_imm: std_logic_vector(20 downto 0);
+		variable j_imm_s: std_logic_vector(31 downto 0);
+		variable s_imm: std_logic_vector(11 downto 0);
+		variable u_imm: std_logic_vector(31 downto 0);
 		variable v_decode_output: decode_output_t;
 	begin
 			funct7 := decode_input.instr(31 downto 25);
 			rd     := decode_input.instr(11 downto 7);
+			b_imm := decode_input.instr(31) & decode_input.instr(7) & decode_input.instr(30 downto 25) & decode_input.instr(11 downto 8) & "0";
 			i_imm := decode_input.instr(31 downto 20);
+			j_imm := decode_input.instr(31) & decode_input.instr(19 downto 12) & decode_input.instr(20) & decode_input.instr(30 downto 21) & "0";
+			s_imm := decode_input.instr(31 downto 25) & decode_input.instr(11 downto 7);
+			u_imm := decode_input.instr(31 downto 12) & "000000000000";
+			-- sign extension
+			b_imm_s := std_logic_vector(resize(signed(b_imm), 32));
 			i_imm_s := std_logic_vector(resize(signed(i_imm), 32));
 			v_decode_output := DEFAULT_DECODE_OUTPUT;

Now, let's remove the decoding logic we currently have and just start implementing the instructions from the RV32/64G Instruction Set Listings.

src/core/decode_write.vhd CHANGED Viewed

@@ -73,30 +73,7 @@ begin
 				v_decode_output.is_active := '1';
 				v_decode_output.is_invalid := '0';
-				if opcode = "0010011" and funct3 = "000" then
-					-- ADDI rd, rs, imm (I-type): sets rd to the sum of rs1 and the sign-extended immediate
-					v_decode_output.operation := OP_ADD;
-					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
-					v_decode_output.operand2 := i_imm_s;
-					v_decode_output.destination_reg := rd;
-				elsif opcode = "0110011" and funct3 = "000" and funct7 = "0000000" then
-					-- ADD rd, rs1, rs2 (R-type): sets rd to the sum of rs1 and rs2
-					v_decode_output.operation := OP_ADD;
-					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
-					v_decode_output.operand2 := reg(to_integer(unsigned(rs2)));
-					v_decode_output.destination_reg := rd;
-				elsif opcode = "1111111" and funct3 = "000" then
-					-- LED rs1: set the LEDs to the 8 least significant bits of rs1
-					v_decode_output.operation := OP_LED;
-					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
-					v_decode_output.operand2 := (others => '0');
-					v_decode_output.destination_reg := (others => '0');
-				elsif opcode = "1111111" and funct3 = "001" then
-					-- HANG
-					v_decode_output := DEFAULT_DECODE_OUTPUT;
-				else
-					v_decode_output.is_invalid := '1';
-				end if;
 			else
 				decode_output <= DEFAULT_DECODE_OUTPUT;
 			end if;

 				v_decode_output.is_active := '1';
 				v_decode_output.is_invalid := '0';
+				-- TODO: implement instruction decoding
 			else
 				decode_output <= DEFAULT_DECODE_OUTPUT;
 			end if;

So we start with LUI and AUIPC. In Chapter 2 (RV32I Base Integer Instruction Set) of the RISC-V unprivileged architecture document, we find this:

Descriptions and bits for LUI and AUIPC instructions

In chapter 35, we see that the opcode field is 0110111 for LUI and 0010111 for AUIPC.

src/core/decode_write.vhd CHANGED Viewed

@@ -73,7 +73,13 @@ begin
 				v_decode_output.is_active := '1';
 				v_decode_output.is_invalid := '0';
-				-- TODO: implement instruction decoding
 			else
 				decode_output <= DEFAULT_DECODE_OUTPUT;
 			end if;

 				v_decode_output.is_active := '1';
 				v_decode_output.is_invalid := '0';
+				if opcode = "0110111" then
+					-- TODO: LUI
+				elsif opcode = "0010111" then
+					-- TODO: AUIPC
+				else
+					v_decode_output.is_invalid := '1';
+				end if;
 			else
 				decode_output <= DEFAULT_DECODE_OUTPUT;
 			end if;

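So, we start with LUI. We need to place the immediate value (the upper 20 bits of the instruction, with the lower 12 bits set to zero) in the rd register. This is easy enough with the existing infrastructure: we reuse OP_ADD and simply add the immediate to zero.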

src/core/decode_write.vhd CHANGED Viewed

@@ -74,7 +74,11 @@ begin
 				v_decode_output.is_invalid := '0';
 				if opcode = "0110111" then
-					-- TODO: LUI
 				elsif opcode = "0010111" then
 					-- TODO: AUIPC
 				else

 				v_decode_output.is_invalid := '0';
 				if opcode = "0110111" then
+					-- LUI
+					v_decode_output.operation := OP_ADD;
+					v_decode_output.operand1 := (others => '0');
+					v_decode_output.operand2 := u_imm;
+					v_decode_output.destination_reg := rd;
 				elsif opcode = "0010111" then
 					-- TODO: AUIPC
 				else

AUIPC is similar, but it adds the immediate to the address of the instruction. This address is in the pc register in the fetch stage, but not yet available in the decode stage, so we need to pass it along in the output of the fetch stage.

src/core/constants.vhd CHANGED Viewed

@@ -7,7 +7,8 @@ use work.core_types.all;
 package core_constants is
 	constant DEFAULT_FETCH_OUTPUT: fetch_output_t := (
 		is_active => '0',
-		instr => (others => '0')
 	);
 	constant DEFAULT_DECODE_OUTPUT: decode_output_t := (

 package core_constants is
 	constant DEFAULT_FETCH_OUTPUT: fetch_output_t := (
 		is_active => '0',
+		instr => (others => '0'),
+		pc => (others => '0')
 	);
 	constant DEFAULT_DECODE_OUTPUT: decode_output_t := (

src/core/fetch.vhd CHANGED Viewed

@@ -34,6 +34,7 @@ begin
 				output.is_active <= '1';
 				output.instr <= imem(to_integer(pc(5 downto 2)));
 			else
 				output <= DEFAULT_FETCH_OUTPUT;
 			end if;

 				output.is_active <= '1';
 				output.instr <= imem(to_integer(pc(5 downto 2)));
+				output.pc <= std_logic_vector(pc);
 			else
 				output <= DEFAULT_FETCH_OUTPUT;
 			end if;

src/core/types.vhd CHANGED Viewed

@@ -8,6 +8,7 @@ package core_types is
 	type fetch_output_t is record
 		is_active: std_logic;
 		instr: std_logic_vector(31 downto 0);
 	end record fetch_output_t;
 	type decode_output_t is record

 	type fetch_output_t is record
 		is_active: std_logic;
 		instr: std_logic_vector(31 downto 0);
+		pc: std_logic_vector(31 downto 0);
 	end record fetch_output_t;
 	type decode_output_t is record

Now, we can implement AUIPC similar to LUI in the decode stage.

src/core/decode_write.vhd CHANGED Viewed

@@ -80,7 +80,11 @@ begin
 					v_decode_output.operand2 := u_imm;
 					v_decode_output.destination_reg := rd;
 				elsif opcode = "0010111" then
-					-- TODO: AUIPC
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					v_decode_output.operand2 := u_imm;
 					v_decode_output.destination_reg := rd;
 				elsif opcode = "0010111" then
+					-- AUIPC
+					v_decode_output.operation := OP_ADD;
+					v_decode_output.operand1 := decode_input.pc;
+					v_decode_output.operand2 := u_imm;
+					v_decode_output.destination_reg := rd;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

Now, JAL and JALR are control flow instructions, which means we'll have to somehow change the value of the pc register in the fetch stage. This requires changes in at least 3 modules as well as some testing. This is a bit too much work for this lesson; we'll just work on the "low-hanging fruit" now, and will return to the instructions that require more work later.

src/core/decode_write.vhd CHANGED Viewed

@@ -85,6 +85,10 @@ begin
 					v_decode_output.operand1 := decode_input.pc;
 					v_decode_output.operand2 := u_imm;
 					v_decode_output.destination_reg := rd;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					v_decode_output.operand1 := decode_input.pc;
 					v_decode_output.operand2 := u_imm;
 					v_decode_output.destination_reg := rd;
+				elsif opcode = "1101111" then
+					-- TODO: JAL
+				elsif opcode = "1100111" and funct3 = "000" then
+					-- TODO: JALR
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

Now, BEQ, BNE, BLT, BGE, BLTU, and BGEU are control flow instructions as well, so we skip them too.

src/core/decode_write.vhd CHANGED Viewed

@@ -89,6 +89,22 @@ begin
 					-- TODO: JAL
 				elsif opcode = "1100111" and funct3 = "000" then
 					-- TODO: JALR
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					-- TODO: JAL
 				elsif opcode = "1100111" and funct3 = "000" then
 					-- TODO: JALR
+				elsif opcode = "1100011" then
+					if funct3 = "000" then
+						-- TODO: BEQ
+					elsif funct3 = "001" then
+						-- TODO: BNE
+					elsif funct3 = "100" then
+						-- TODO: BLT
+					elsif funct3 = "101" then
+						-- TODO: BGE
+					elsif funct3 = "110" then
+						-- TODO: BLTU
+					elsif funct3 = "111" then
+						-- TODO: BGEU
+					else
+						v_decode_output.is_invalid := '1';
+					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

We'll also skip LB, LH, LW, LBU, LHU, SB, SH, and SW because these are memory operations and we haven't implemented memory yet. So far, this is going excellently.

src/core/decode_write.vhd CHANGED Viewed

@@ -105,6 +105,30 @@ begin
 					else
 						v_decode_output.is_invalid := '1';
 					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					else
 						v_decode_output.is_invalid := '1';
 					end if;
+				elsif opcode = "0000011" then
+					if funct3 = "000" then
+						-- TODO: LB
+					elsif funct3 = "001" then
+						-- TODO: LH
+					elsif funct3 = "010" then
+						-- TODO: LW
+					elsif funct3 = "100" then
+						-- TODO: LBU
+					elsif funct3 = "101" then
+						-- TODO: LHU
+					else
+						v_decode_output.is_invalid := '1';
+					end if;
+				elsif opcode = "0100011" then
+					if funct3 = "000" then
+						-- TODO: SB
+					elsif funct3 = "001" then
+						-- TODO: SH
+					elsif funct3 = "010" then
+						-- TODO: SW
+					else
+						v_decode_output.is_invalid := '1';
+					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

Now, we arrive at a bunch of instructions that have the same opcode (but a different value for the funct3 field): ADDI, SLTI, SLTIU, XORI, ORI, ANDI.

First, we want to recognize these instructions.

src/core/decode_write.vhd CHANGED Viewed

@@ -129,6 +129,22 @@ begin
 					else
 						v_decode_output.is_invalid := '1';
 					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					else
 						v_decode_output.is_invalid := '1';
 					end if;
+				elsif opcode = "0010011" then
+					if funct3 = "000" then
+						-- TODO: ADDI
+					elsif funct3 = "010" then
+						-- TODO: SLTI
+					elsif funct3 = "" then
+						-- TODO: SLTIU
+					elsif funct3 = "" then
+						-- TODO: XORI
+					elsif funct3 = "" then
+						-- TODO: ORI
+					elsif funct3 = "" then
+						-- TODO: ANDI
+					else
+						v_decode_output.is_invalid := '1';
+					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

We have implemented ADDI before, so we can just add that code back.

src/core/decode_write.vhd CHANGED Viewed

@@ -131,7 +131,11 @@ begin
 					end if;
 				elsif opcode = "0010011" then
 					if funct3 = "000" then
-						-- TODO: ADDI
 					elsif funct3 = "010" then
 						-- TODO: SLTI
 					elsif funct3 = "" then

 					end if;
 				elsif opcode = "0010011" then
 					if funct3 = "000" then
+						-- ADDI
+						v_decode_output.operation := OP_ADD;
+						v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
+						v_decode_output.operand2 := i_imm_s;
+						v_decode_output.destination_reg := rd;
 					elsif funct3 = "010" then
 						-- TODO: SLTI
 					elsif funct3 = "" then

The other instructions are very similar, but the exact operation that is executed in the execute stage is slightly different. So we can structure the code a bit differently to take advantage of the similarity.

src/core/decode_write.vhd CHANGED Viewed

@@ -130,12 +130,13 @@ begin
 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0010011" then
 					if funct3 = "000" then
 						-- ADDI
 						v_decode_output.operation := OP_ADD;
-						v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
-						v_decode_output.operand2 := i_imm_s;
-						v_decode_output.destination_reg := rd;
 					elsif funct3 = "010" then
 						-- TODO: SLTI
 					elsif funct3 = "" then

 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0010011" then
+					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
+					v_decode_output.operand2 := i_imm_s;
+					v_decode_output.destination_reg := rd;
 					if funct3 = "000" then
 						-- ADDI
 						v_decode_output.operation := OP_ADD;
 					elsif funct3 = "010" then
 						-- TODO: SLTI
 					elsif funct3 = "" then

Now we add a couple of operations so that we can decode SLTI, SLTIU, XORI, ORI, ANDI.

src/core/decode_write.vhd CHANGED Viewed

@@ -138,15 +138,20 @@ begin
 						-- ADDI
 						v_decode_output.operation := OP_ADD;
 					elsif funct3 = "010" then
-						-- TODO: SLTI
-					elsif funct3 = "" then
-						-- TODO: SLTIU
-					elsif funct3 = "" then
-						-- TODO: XORI
-					elsif funct3 = "" then
-						-- TODO: ORI
-					elsif funct3 = "" then
-						-- TODO: ANDI
 					else
 						v_decode_output.is_invalid := '1';
 					end if;

 						-- ADDI
 						v_decode_output.operation := OP_ADD;
 					elsif funct3 = "010" then
+						-- SLTI
+						v_decode_output.operation := OP_SLT;
+					elsif funct3 = "011" then
+						-- SLTIU
+						v_decode_output.operation := OP_SLTU;
+					elsif funct3 = "100" then
+						-- XORI
+						v_decode_output.operation := OP_XOR;
+					elsif funct3 = "110" then
+						-- ORI
+						v_decode_output.operation := OP_OR;
+					elsif funct3 = "111" then
+						-- ANDI
+						v_decode_output.operation := OP_AND;
 					else
 						v_decode_output.is_invalid := '1';
 					end if;

src/core/types.vhd CHANGED Viewed

@@ -3,7 +3,7 @@ use ieee.std_logic_1164.all;
 package core_types is
-	type operation_t is (OP_ADD, OP_LED);
 	type fetch_output_t is record
 		is_active: std_logic;

 package core_types is
+	type operation_t is (OP_ADD, OP_SLT, OP_SLTU, OP_XOR, OP_OR, OP_AND, OP_LED);
 	type fetch_output_t is record
 		is_active: std_logic;

Now we still have to implement these operations in the execute module.

OP_SLT compares the two operands as signed numbers, and sets the result to 1 when the first operand is less than the second, and to 0 otherwise.

src/core/execute.vhd CHANGED Viewed

@@ -29,6 +29,12 @@ begin
 			if input.is_active = '1' and input.is_invalid = '0' then
 				if input.operation = OP_ADD then
 					v_output.result := std_logic_vector(unsigned(input.operand1) + unsigned(input.operand2));
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

 			if input.is_active = '1' and input.is_invalid = '0' then
 				if input.operation = OP_ADD then
 					v_output.result := std_logic_vector(unsigned(input.operand1) + unsigned(input.operand2));
+				elsif input.operation = OP_SLT then
+					if signed(input.operand1) < signed(input.operand2) then
+						v_output.result := std_logic_vector(to_unsigned(1, 32));
+					else
+						v_output.result := (others => '0');
+					end if;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

OP_SLTU is similar but works on unsigned operands.

src/core/execute.vhd CHANGED Viewed

@@ -35,6 +35,12 @@ begin
 					else
 						v_output.result := (others => '0');
 					end if;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

 					else
 						v_output.result := (others => '0');
 					end if;
+				elsif input.operation = OP_SLTU then
+					if unsigned(input.operand1) < unsigned(input.operand2) then
+						v_output.result := std_logic_vector(to_unsigned(1, 32));
+					else
+						v_output.result := (others => '0');
+					end if;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

OP_XOR, OP_OR, and OP_AND are similar and simple to implement.

src/core/execute.vhd CHANGED Viewed

@@ -41,6 +41,12 @@ begin
 					else
 						v_output.result := (others => '0');
 					end if;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

 					else
 						v_output.result := (others => '0');
 					end if;
+				elsif input.operation = OP_XOR then
+					v_output.result := input.operand1 xor input.operand2;
+				elsif input.operation = OP_OR then
+					v_output.result := input.operand1 or input.operand2;
+				elsif input.operation = OP_AND then
+					v_output.result := input.operand1 and input.operand2;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

Now, SLLI, SRLI, and SRAI are similar to each other but different from the instructions we just implemented, yet for some reason they all share the same opcode. I'll put these three instructions above the ones we just implemented, so that we can use slightly less logic.

src/core/decode_write.vhd CHANGED Viewed

@@ -129,6 +129,16 @@ begin
 					else
 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0010011" then
 					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
 					v_decode_output.operand2 := i_imm_s;

 					else
 						v_decode_output.is_invalid := '1';
 					end if;
+				elsif opcode = "0010011" and funct3 = "001" and funct7 = "0000000" then
+					-- TODO: SLLI
+				elsif opcode = "0010011" and funct3 = "101" then
+					if funct7 = "0000000" then
+						-- TODO: SRLI
+					elsif funct7 = "0100000" then
+						-- TODO: SRAI
+					else
+						v_decode_output.is_invalid := '1';
+					end if;
 				elsif opcode = "0010011" then
 					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
 					v_decode_output.operand2 := i_imm_s;

Again, we add operations to implement the decoding of these instructions.

src/core/decode_write.vhd CHANGED Viewed

@@ -130,12 +130,22 @@ begin
 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0010011" and funct3 = "001" and funct7 = "0000000" then
-					-- TODO: SLLI
 				elsif opcode = "0010011" and funct3 = "101" then
 					if funct7 = "0000000" then
-						-- TODO: SRLI
 					elsif funct7 = "0100000" then
-						-- TODO: SRAI
 					else
 						v_decode_output.is_invalid := '1';
 					end if;

 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0010011" and funct3 = "001" and funct7 = "0000000" then
+					-- SLLI
+					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
+					v_decode_output.operand2 := "000000000000000000000000000" & rs2;
+					v_decode_output.destination_reg := rd;
+					v_decode_output.operation := OP_SLL;
 				elsif opcode = "0010011" and funct3 = "101" then
+					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
+					v_decode_output.operand2 := "000000000000000000000000000" & rs2;
+					v_decode_output.destination_reg := rd;
 					if funct7 = "0000000" then
+						-- SRLI
+						v_decode_output.operation := OP_SRL;
 					elsif funct7 = "0100000" then
+						-- SRAI
+						v_decode_output.operation := OP_SRA;
 					else
 						v_decode_output.is_invalid := '1';
 					end if;

src/core/types.vhd CHANGED Viewed

@@ -3,7 +3,7 @@ use ieee.std_logic_1164.all;
 package core_types is
-	type operation_t is (OP_ADD, OP_SLT, OP_SLTU, OP_XOR, OP_OR, OP_AND, OP_LED);
 	type fetch_output_t is record
 		is_active: std_logic;

 package core_types is
+	type operation_t is (OP_ADD, OP_SLT, OP_SLTU, OP_XOR, OP_OR, OP_AND, OP_SLL, OP_SRL, OP_SRA, OP_LED);
 	type fetch_output_t is record
 		is_active: std_logic;

Then we implement the operations themselves. The shift instructions are a bit weird. The manual mentions

The operand to be shifted is in rs1, and the shift amount is encoded in the lower 5 bits of the I-immediate field.

This means that you can shift by at most 31 bits. Janky as hell in my opinion, but we're just implementing the spec, not making it.

A nice way of implementing shifts by a variable number of bits, say n, is to do the shift as a sequence of shifts by powers of two. If n is 5 bits wide, and the most significant bit of n is set, we shift by 16 bits. If the next bit is set, we shift by 8 bits, etc., etc. At the end, we'll have shifted by n bits.

src/core/execute.vhd CHANGED Viewed

@@ -21,6 +21,8 @@ begin
 	process (clk)
 		variable v_output: execute_output_t;
 	begin
 		if rising_edge(clk) then
 			v_output := DEFAULT_EXECUTE_OUTPUT;
@@ -47,6 +49,61 @@ begin
 					v_output.result := input.operand1 or input.operand2;
 				elsif input.operation = OP_AND then
 					v_output.result := input.operand1 and input.operand2;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

 	process (clk)
 		variable v_output: execute_output_t;
+		variable v_sign: std_logic_vector(31 downto 0);
 	begin
 		if rising_edge(clk) then
 			v_output := DEFAULT_EXECUTE_OUTPUT;
 					v_output.result := input.operand1 or input.operand2;
 				elsif input.operation = OP_AND then
 					v_output.result := input.operand1 and input.operand2;
+				elsif input.operation = OP_SLL then
+					v_output.result := input.operand1;
+					if input.operand2(4) = '1' then
+						v_output.result := v_output.result(15 downto 0) & "0000000000000000";
+					end if;
+					if input.operand2(3) = '1' then
+						v_output.result := v_output.result(23 downto 0) & "00000000";
+					end if;
+					if input.operand2(2) = '1' then
+						v_output.result := v_output.result(27 downto 0) & "0000";
+					end if;
+					if input.operand2(1) = '1' then
+						v_output.result := v_output.result(29 downto 0) & "00";
+					end if;
+					if input.operand2(0) = '1' then
+						v_output.result := v_output.result(30 downto 0) & "0";
+					end if;
+				elsif input.operation = OP_SRL then
+					v_output.result := input.operand1;
+					if input.operand2(4) = '1' then
+						v_output.result := "0000000000000000" & v_output.result(31 downto 16);
+					end if;
+					if input.operand2(3) = '1' then
+						v_output.result := "00000000" & v_output.result(31 downto 8);
+					end if;
+					if input.operand2(2) = '1' then
+						v_output.result := "0000" & v_output.result(31 downto 4);
+					end if;
+					if input.operand2(1) = '1' then
+						v_output.result := "00" & v_output.result(31 downto 2);
+					end if;
+					if input.operand2(0) = '1' then
+						v_output.result := "0" & v_output.result(31 downto 1);
+					end if;
+				elsif input.operation = OP_SRA then
+					v_output.result := input.operand1;
+					v_sign := (others => input.operand1(31));
+					if input.operand2(4) = '1' then
+						v_output.result := v_sign(15 downto 0) & v_output.result(31 downto 16);
+					end if;
+					if input.operand2(3) = '1' then
+						v_output.result := v_sign(7 downto 0) & v_output.result(31 downto 8);
+					end if;
+					if input.operand2(2) = '1' then
+						v_output.result := v_sign(3 downto 0) & v_output.result(31 downto 4);
+					end if;
+					if input.operand2(1) = '1' then
+						v_output.result := v_sign(1 downto 0) & v_output.result(31 downto 2);
+					end if;
+					if input.operand2(0) = '1' then
+						v_output.result := v_sign(0) & v_output.result(31 downto 1);
+					end if;
 				elsif input.operation = OP_LED then
 					led <= input.operand1(7 downto 0);
 				else

This is a big change, but it's (almost) the same verbose code. In fact, we can merge the implementations of the two right shifts (SRL and SRA).

src/core/execute.vhd CHANGED Viewed

@@ -67,27 +67,14 @@ begin
 					if input.operand2(0) = '1' then
 						v_output.result := v_output.result(30 downto 0) & "0";
 					end if;
-				elsif input.operation = OP_SRL then
 					v_output.result := input.operand1;
-					if input.operand2(4) = '1' then
-						v_output.result := "0000000000000000" & v_output.result(31 downto 16);
-					end if;
-					if input.operand2(3) = '1' then
-						v_output.result := "00000000" & v_output.result(31 downto 8);
-					end if;
-					if input.operand2(2) = '1' then
-						v_output.result := "0000" & v_output.result(31 downto 4);
-					end if;
-					if input.operand2(1) = '1' then
-						v_output.result := "00" & v_output.result(31 downto 2);
-					end if;
-					if input.operand2(0) = '1' then
-						v_output.result := "0" & v_output.result(31 downto 1);
 					end if;
-				elsif input.operation = OP_SRA then
-					v_output.result := input.operand1;
-					v_sign := (others => input.operand1(31));
 					if input.operand2(4) = '1' then
 						v_output.result := v_sign(15 downto 0) & v_output.result(31 downto 16);

 					if input.operand2(0) = '1' then
 						v_output.result := v_output.result(30 downto 0) & "0";
 					end if;
+				elsif input.operation = OP_SRL or input.operation = OP_SRA then
 					v_output.result := input.operand1;
+					if input.operation = OP_SRL then
+						v_sign := (others => '0');
+					else
+						v_sign := (others => input.operand1(31));
 					end if;
 					if input.operand2(4) = '1' then
 						v_output.result := v_sign(15 downto 0) & v_output.result(31 downto 16);

Moving on; almost all of the instructions with opcode 0110011 are register-register versions of instructions we already implemented. The SUB instruction is the only exception.

As usual I'll add placeholders first.

src/core/decode_write.vhd CHANGED Viewed

@@ -175,6 +175,30 @@ begin
 					else
 						v_decode_output.is_invalid := '1';
 					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					else
 						v_decode_output.is_invalid := '1';
 					end if;
+				elsif opcode = "0110011" then
+					if funct7 = "0000000" and funct3 = "000" then
+						-- TODO: ADD
+					elsif funct7 = "0100000" and funct3 = "000" then
+						-- TODO: SUB
+					elsif funct7 = "0000000" and funct3 = "001" then
+						-- TODO: SLL
+					elsif funct7 = "0000000" and funct3 = "010" then
+						-- TODO: SLT
+					elsif funct7 = "0000000" and funct3 = "011" then
+						-- TODO: SLTU
+					elsif funct7 = "0000000" and funct3 = "100" then
+						-- TODO: XOR
+					elsif funct7 = "0000000" and funct3 = "101" then
+						-- TODO: SRL
+					elsif funct7 = "0100000" and funct3 = "101" then
+						-- TODO: SRA
+					elsif funct7 = "0000000" and funct3 = "110" then
+						-- TODO: OR
+					elsif funct7 = "0000000" and funct3 = "111" then
+						-- TODO: AND
+					else
+						v_decode_output.is_invalid := '1';
+					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

src/core/types.vhd CHANGED Viewed

@@ -3,7 +3,7 @@ use ieee.std_logic_1164.all;
 package core_types is
-	type operation_t is (OP_ADD, OP_SLT, OP_SLTU, OP_XOR, OP_OR, OP_AND, OP_SLL, OP_SRL, OP_SRA, OP_LED);
 	type fetch_output_t is record
 		is_active: std_logic;

 package core_types is
+	type operation_t is (OP_ADD, OP_SLT, OP_SLTU, OP_XOR, OP_OR, OP_AND, OP_SLL, OP_SRL, OP_SRA, OP_SUB, OP_LED);
 	type fetch_output_t is record
 		is_active: std_logic;

Now we'll add the implementation.

src/core/decode_write.vhd CHANGED Viewed

@@ -176,26 +176,40 @@ begin
 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0110011" then
 					if funct7 = "0000000" and funct3 = "000" then
-						-- TODO: ADD
 					elsif funct7 = "0100000" and funct3 = "000" then
-						-- TODO: SUB
 					elsif funct7 = "0000000" and funct3 = "001" then
-						-- TODO: SLL
 					elsif funct7 = "0000000" and funct3 = "010" then
-						-- TODO: SLT
 					elsif funct7 = "0000000" and funct3 = "011" then
-						-- TODO: SLTU
 					elsif funct7 = "0000000" and funct3 = "100" then
-						-- TODO: XOR
 					elsif funct7 = "0000000" and funct3 = "101" then
-						-- TODO: SRL
 					elsif funct7 = "0100000" and funct3 = "101" then
-						-- TODO: SRA
 					elsif funct7 = "0000000" and funct3 = "110" then
-						-- TODO: OR
 					elsif funct7 = "0000000" and funct3 = "111" then
-						-- TODO: AND
 					else
 						v_decode_output.is_invalid := '1';
 					end if;

 						v_decode_output.is_invalid := '1';
 					end if;
 				elsif opcode = "0110011" then
+					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
+					v_decode_output.operand2 := reg(to_integer(unsigned(rs2)));
+					v_decode_output.destination_reg := rd;
 					if funct7 = "0000000" and funct3 = "000" then
+						-- ADD
+						v_decode_output.operation := OP_ADD;
 					elsif funct7 = "0100000" and funct3 = "000" then
+						-- SUB
+						v_decode_output.operation := OP_SUB;
 					elsif funct7 = "0000000" and funct3 = "001" then
+						-- SLL
+						v_decode_output.operation := OP_SLL;
 					elsif funct7 = "0000000" and funct3 = "010" then
+						-- SLT
+						v_decode_output.operation := OP_SLT;
 					elsif funct7 = "0000000" and funct3 = "011" then
+						-- SLTU
+						v_decode_output.operation := OP_SLTU;
 					elsif funct7 = "0000000" and funct3 = "100" then
+						-- XOR
+						v_decode_output.operation := OP_XOR;
 					elsif funct7 = "0000000" and funct3 = "101" then
+						-- SRL
+						v_decode_output.operation := OP_SRL;
 					elsif funct7 = "0100000" and funct3 = "101" then
+						-- SRA
+						v_decode_output.operation := OP_SRA;
 					elsif funct7 = "0000000" and funct3 = "110" then
+						-- OR
+						v_decode_output.operation := OP_OR;
 					elsif funct7 = "0000000" and funct3 = "111" then
+						-- AND
+						v_decode_output.operation := OP_AND;
 					else
 						v_decode_output.is_invalid := '1';
 					end if;

Now, we just have to implement OP_SUB in the execute module.

src/core/execute.vhd CHANGED Viewed

@@ -31,6 +31,8 @@ begin
 			if input.is_active = '1' and input.is_invalid = '0' then
 				if input.operation = OP_ADD then
 					v_output.result := std_logic_vector(unsigned(input.operand1) + unsigned(input.operand2));
 				elsif input.operation = OP_SLT then
 					if signed(input.operand1) < signed(input.operand2) then
 						v_output.result := std_logic_vector(to_unsigned(1, 32));

 			if input.is_active = '1' and input.is_invalid = '0' then
 				if input.operation = OP_ADD then
 					v_output.result := std_logic_vector(unsigned(input.operand1) + unsigned(input.operand2));
+				elsif input.operation = OP_SUB then
+					v_output.result := std_logic_vector(unsigned(input.operand1) - unsigned(input.operand2));
 				elsif input.operation = OP_SLT then
 					if signed(input.operand1) < signed(input.operand2) then
 						v_output.result := std_logic_vector(to_unsigned(1, 32));

OK, phew. Just a couple of oddball instructions left. FENCE is used for memory ordering. We don't even have memory yet, so for now we'll make this a NOP.

src/core/decode_write.vhd CHANGED Viewed

@@ -213,6 +213,8 @@ begin
 					else
 						v_decode_output.is_invalid := '1';
 					end if;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					else
 						v_decode_output.is_invalid := '1';
 					end if;
+				elsif funct3 = "000" and opcode = "0001111" then
+					-- FENCE (implemented as NOP)
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

Now, FENCE.TSO and PAUSE are special cases of FENCE, which we already handle. So we can skip them; we'll see later whether we can do something better.

ECALL and EBREAK are traps, which we have not implemented yet. So I'll add the logic to be able to easily decode them later, but otherwise ignore them.

src/core/decode_write.vhd CHANGED Viewed

@@ -215,6 +215,10 @@ begin
 					end if;
 				elsif funct3 = "000" and opcode = "0001111" then
 					-- FENCE (implemented as NOP)
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					end if;
 				elsif funct3 = "000" and opcode = "0001111" then
 					-- FENCE (implemented as NOP)
+				elsif i_imm = "000000000000" and rs1 = "00000" and funct3 = "000" and rd = "00000" and opcode = "1110011" then
+					-- ECALL
+				elsif i_imm = "000000000001" and rs1 = "00000" and funct3 = "000" and rd = "00000" and opcode = "1110011" then
+					-- EBREAK
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

Now that we're done, let's add back our custom "LED" and "HANG" instructions.

src/core/decode_write.vhd CHANGED Viewed

@@ -219,6 +219,15 @@ begin
 					-- ECALL
 				elsif i_imm = "000000000001" and rs1 = "00000" and funct3 = "000" and rd = "00000" and opcode = "1110011" then
 					-- EBREAK
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

 					-- ECALL
 				elsif i_imm = "000000000001" and rs1 = "00000" and funct3 = "000" and rd = "00000" and opcode = "1110011" then
 					-- EBREAK
+				elsif opcode = "1111111" and funct3 = "000" then
+					-- LED (custom instruction): set the LEDs to the 8 least significant bits of rs1
+					v_decode_output.operation := OP_LED;
+					v_decode_output.operand1 := reg(to_integer(unsigned(rs1)));
+					v_decode_output.operand2 := (others => '0');
+					v_decode_output.destination_reg := (others => '0');
+				elsif opcode = "1111111" and funct3 = "001" then
+					-- HANG (custom instruction): stops execution of the CPU
+					v_decode_output := DEFAULT_DECODE_OUTPUT;
 				else
 					v_decode_output.is_invalid := '1';
 				end if;

Phew, we added a lot of instructions! We added the decoding for all instructions and actually implemented about half of all the instructions in the basic RV32 ISA. Not bad for a single lesson.

Did we forget anything? Testing, you say?