Skip to content


RPU 1.0
Browse files Browse the repository at this point in the history
Updated ISA support to RV32IMZcsr - Passes riscv-compliance.
Integer divide/rem in 34 cycles.
Integer multiply in 2 cycles (when using xilinx dsp blocks!)
Saved multiple cycles from fetch/memory load stages by short-cutting the start of memory requests.
Compliant misaligned exceptions for jumps, loads and stores. Addresses starting 0xFxxxxxxx are exempt from alignment checks (they are assumed to be MMIO space).
Added CSRs for riscv-compliance requirements.
Source run through a formatter for ease of use.
  • Loading branch information
Domipheus committed Sep 10, 2020
1 parent 47a0058 commit 4b16f9b
Show file tree
Hide file tree
Showing 12 changed files with 2,555 additions and 1,445 deletions.
4 changes: 3 additions & 1 deletion
Original file line number Diff line number Diff line change
@@ -1,7 +1,9 @@
Basic RISC-V CPU implementation in VHDL.

This is a RV32I ISA CPU implementation, based off of my TPU CPU design. It is very simple, is missing several features, but can run rv32i-compiled GCC toolchain binaries at over 200MHz on a Digilent Arty S7-50 board, built with Xilinx Spartan 7 tools. Can also boot Zephyr given correct SoC environment and invalid emulation handling of multiply/divide/mod M-extension instruction via invalid instruction trap.
This is a RV32IMZcsr ISA CPU implementation, based off of my TPU CPU design. It is very simple, but has run rv32i-compiled GCC toolchain binaries at over 200MHz on a Digilent Arty S7-50 board, built with Xilinx Spartan 7 tools.

When used in the ArtyS7-RPU-SoC, it can run the DooM timedemo3 at ~8fps and boot operating systems such as Zephyr RTOS.

Please let me know if you are using any of the RPU design in your own projects! I am contactable on twitter @domipheus.

Expand Down
558 changes: 517 additions & 41 deletions tests/rpu_core_tb.vhd

Large diffs are not rendered by default.

168 changes: 168 additions & 0 deletions tests/tb_alu_int32_div.vhd
Original file line number Diff line number Diff line change
@@ -0,0 +1,168 @@
-- Company:
-- Engineer:
-- Create Date: 12.11.2018 22:51:11
-- Design Name:
-- Module Name: alu_int32_div_tb - Behavioral
-- Project Name:
-- Target Devices:
-- Tool Versions:
-- Description:
-- Dependencies:
-- Revision:
-- Revision 0.01 - File Created
-- Additional Comments:

library IEEE;
use IEEE.STD_LOGIC_1164.ALL;

-- Uncomment the following library declaration if instantiating
-- any Xilinx leaf cells in this code.
--library UNISIM;
--use UNISIM.VComponents.all;

library work;
use work.constants.all;

-- Self-checking testbench for alu_int32_div.
-- Drives a sequence of divide requests into the unit, gives each one a
-- generous 500 clock periods to finish, and asserts on the value left on
-- O_dataResult.
entity alu_int32_div_tb is
-- Port ( );
end alu_int32_div_tb;

architecture Behavioral of alu_int32_div_tb is

  -- Unit under test: the 32-bit integer divide/remainder ALU
  component alu_int32_div is
    Port (
      I_clk        : in  STD_LOGIC;
      I_exec       : in  STD_LOGIC;
      I_dividend   : in  STD_LOGIC_VECTOR (XLEN32M1 downto 0);
      I_divisor    : in  STD_LOGIC_VECTOR (XLEN32M1 downto 0);
      I_op         : in  STD_LOGIC_VECTOR (1 downto 0);
      O_dataResult : out STD_LOGIC_VECTOR (XLEN32M1 downto 0);
      O_done       : out STD_LOGIC;
      O_int        : out std_logic
    );
  end component;

  signal I_clk        : std_logic := '0';
  signal I_exec       : std_logic := '0';
  signal I_dividend   : std_logic_vector(31 downto 0) := (others => '0');
  signal I_divisor    : std_logic_vector(31 downto 0) := (others => '0');
  signal I_op         : std_logic_vector(1 downto 0) := (others => '0');
  signal O_dataResult : std_logic_vector(31 downto 0) := (others => '0');
  signal O_done       : std_logic := '0';
  signal O_int        : std_logic := '0';

  -- Clock period definitions
  constant I_clk_period : time := 10 ns;

begin

  -- Instantiate the Unit Under Test (UUT)
  uut: alu_int32_div PORT MAP (
    I_clk        => I_clk,
    I_exec       => I_exec,
    I_dividend   => I_dividend,
    I_divisor    => I_divisor,
    I_op         => I_op,
    O_dataResult => O_dataResult,
    O_done       => O_done,
    O_int        => O_int
  );

  -- Clock process definitions: free-running clock, 50% duty cycle
  I_clk_process : process
  begin
    I_clk <= '0';
    wait for I_clk_period/2;
    I_clk <= '1';
    wait for I_clk_period/2;
  end process;

  -- Stimulus process
  stim_proc: process

    -- Issues one request to the UUT and checks its result.
    --   dividend, divisor : operands presented on I_dividend / I_divisor
    --   op                : operation select presented on I_op
    --   expected          : value O_dataResult must hold once the op is done
    --   descr             : text appended to the failure report
    -- I_exec is pulsed for exactly one clock period; the result is sampled
    -- 500 periods later, far longer than the unit needs, so the check does
    -- not depend on the exact latency.
    procedure run_case (
      constant dividend : in std_logic_vector(31 downto 0);
      constant divisor  : in std_logic_vector(31 downto 0);
      constant op       : in std_logic_vector(1 downto 0);
      constant expected : in std_logic_vector(31 downto 0);
      constant descr    : in string
    ) is
    begin
      I_dividend <= dividend;
      I_divisor  <= divisor;
      I_op       <= op;
      I_exec     <= '1';
      wait for I_clk_period;
      I_exec     <= '0';

      wait for I_clk_period*500;

      assert O_dataResult = expected
        report "alu_int32_div_tb: unexpected result for " & descr
        severity error;
    end procedure;

  begin
    -- hold reset state for 100 ns.
    wait for 100 ns;

    wait for I_clk_period*10;

    -- Signed divide by zero: the unit returns an all-ones quotient
    run_case(X"ffffffff", X"00000000", ALU_INT32_DIV_OP_DIV, X"ffffffff", "-1 / 0");

    -- 10 / 10 = 1
    run_case(X"0000000a", X"0000000a", ALU_INT32_DIV_OP_DIV, X"00000001", "10 / 10");

    -- 4097 / 273 = 15
    run_case(X"00001001", X"00000111", ALU_INT32_DIV_OP_DIV, X"0000000f", "4097 / 273");

    -- -65535 / 273 = -240 (quotient truncates toward zero)
    run_case(X"ffff0001", X"00000111", ALU_INT32_DIV_OP_DIV, X"ffffff10", "-65535 / 273");

    -- Unsigned variant of the case above; disabled in the original testbench.
    -- run_case(X"ffff0001", X"00000111", ALU_INT32_DIV_OP_DIVU, X"00f00e10", "4294901761 / 273 (unsigned)");

    -- Signed divide by one
    run_case(X"00011101", X"00000001", ALU_INT32_DIV_OP_DIV, X"00011101", "69889 / 1");

    -- 65537 / 273 = 240
    run_case(X"00010001", X"00000111", ALU_INT32_DIV_OP_DIV, X"000000f0", "65537 / 273");

    report "alu_int32_div_tb: stimulus complete" severity note;

    -- Park here. Without this the process restarts and pulses I_exec again
    -- before the unit has had time to finish the previous request.
    wait;
  end process;

end Behavioral;
183 changes: 183 additions & 0 deletions vhdl/alu_int32_div.vhd
Original file line number Diff line number Diff line change
@@ -0,0 +1,183 @@
-- Project Name: RISC-V CPU
-- Description: ALU unit for 32-bit integer division ops
-- Copyright 2020 Colin Riley
-- Licensed under the Apache License, Version 2.0 (the "License");
-- you may not use this file except in compliance with the License.
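-- You may obtain a copy of the License at
--
--     http://www.apache.org/licenses/LICENSE-2.0
--
-- Unless required by applicable law or agreed to in writing, software
-- distributed under the License is distributed on an "AS IS" BASIS,
-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.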
-- See the License for the specific language governing permissions and
-- limitations under the License.

library IEEE;
use IEEE.STD_LOGIC_1164.all;

-- Provides the unsigned/signed types and their arithmetic and comparison
-- operators used by the divider below.
use IEEE.NUMERIC_STD.all;

library work;
use work.constants.all;

-- alu_int32_div: multi-cycle 32-bit integer divide / remainder unit.
--
-- Ports:
--   I_clk        : clock; all state changes on the rising edge.
--   I_exec       : request strobe. Sampled only while the unit is idle; the
--                  operands and I_op are consumed on that same edge.
--   I_dividend   : numerator.
--   I_divisor    : denominator.
--   I_op         : operation select, one of ALU_INT32_DIV_OP_DIV / DIVU /
--                  REM / REMU.
--   O_dataResult : quotient (DIV, DIVU) or remainder (REM, REMU). Updated on
--                  the same edge that raises O_done and held until the next
--                  operation completes.
--   O_done       : high for one clock when O_dataResult has been updated.
--   O_int        : never asserted by this architecture (always '0').
entity alu_int32_div is
  port (
    I_clk        : in  STD_LOGIC;
    I_exec       : in  STD_LOGIC;
    I_dividend   : in  STD_LOGIC_VECTOR (XLEN32M1 downto 0);
    I_divisor    : in  STD_LOGIC_VECTOR (XLEN32M1 downto 0);
    I_op         : in  STD_LOGIC_VECTOR (1 downto 0);
    O_dataResult : out STD_LOGIC_VECTOR (XLEN32M1 downto 0);
    O_done       : out STD_LOGIC;
    O_int        : out std_logic
  );
end alu_int32_div;

architecture Behavioral of alu_int32_div is
  signal s_done    : std_logic := '0';
  signal s_int     : std_logic := '0';
  signal s_op      : std_logic_vector(1 downto 0) := (others => '0');
  signal s_result  : std_logic_vector(XLEN32M1 downto 0) := (others => '0');
  -- '1' when the magnitude held in s_Q / s_R must be negated on output
  signal s_outsign : std_logic := '0';

  -- Long-division working registers. The loop always operates on
  -- magnitudes; the sign is re-applied in STATE_COMPLETE.
  signal s_i : integer range 0 to 31 := 0;                      -- dividend bit being processed
  signal s_N : unsigned(XLEN32M1 downto 0) := (others => '0');  -- numerator magnitude
  signal s_D : unsigned(XLEN32M1 downto 0) := (others => '0');  -- denominator magnitude
  signal s_R : unsigned(XLEN32M1 downto 0) := (others => '0');  -- running remainder
  signal s_Q : unsigned(XLEN32M1 downto 0) := (others => '0');  -- quotient

  constant STATE_IDLE      : integer := 0;
  constant STATE_INFLIGHTU : integer := 1;
  constant STATE_COMPLETE  : integer := 2;

  signal s_state : integer range 0 to 2 := STATE_IDLE;

begin

  process (I_clk)
    -- Running remainder shifted left by one with the next dividend bit
    -- brought in at the bottom.
    variable v_partial : unsigned(XLEN32M1 downto 0);
  begin
    if rising_edge(I_clk) then
      if s_state = STATE_IDLE then
        s_done <= '0';
        if I_exec = '1' then
          s_op   <= I_op;
          s_done <= '0';

          if (I_divisor = X"00000000") then
            -- Division by zero: quotient is all ones, remainder is the
            -- dividend. s_R holds the magnitude and s_outsign negates it
            -- back in STATE_COMPLETE, so the dividend is returned unchanged.
            s_state <= STATE_COMPLETE;
            s_Q     <= X"ffffffff";

            if I_dividend(31) = '1' then
              s_R <= unsigned(-signed(I_dividend));
            else
              s_R <= unsigned(I_dividend);
            end if;

            if (I_op = ALU_INT32_DIV_OP_DIV) or (I_op = ALU_INT32_DIV_OP_DIVU) then
              s_outsign <= '0';
            else
              s_outsign <= I_dividend(31);
            end if;

          elsif (I_divisor = X"00000001") and (I_op = ALU_INT32_DIV_OP_DIV) then
            -- Fast path for signed divide by one: quotient is the dividend,
            -- remainder is zero; skips the 32-step loop.
            s_state <= STATE_COMPLETE;
            s_R     <= X"00000000";
            if I_dividend(31) = '1' then
              s_Q <= unsigned(-signed(I_dividend));
            else
              s_Q <= unsigned(I_dividend);
            end if;
            s_outsign <= I_dividend(31);

          else
            -- General case: run the bit-serial loop on the magnitudes.
            s_state <= STATE_INFLIGHTU;

            if I_op(ALU_INT32_DIV_OP_UNSIGNED_BIT) = '1' then
              -- Unsigned ops use the operands as-is and never negate.
              s_N <= unsigned(I_dividend);
              s_D <= unsigned(I_divisor);
              s_Q <= X"00000000";
              s_R <= X"00000000";

              s_i       <= 31;
              s_outsign <= '0';
            else
              -- Signed ops: the quotient is negative when the operand signs
              -- differ; the remainder takes the sign of the dividend.
              if (I_op = ALU_INT32_DIV_OP_DIV) then
                s_outsign <= I_dividend(31) xor I_divisor(31);
              else
                s_outsign <= I_dividend(31);
              end if;

              if I_dividend(31) = '1' then
                s_N <= unsigned(-signed(I_dividend));
              else
                s_N <= unsigned(I_dividend);
              end if;

              if I_divisor(31) = '1' then
                s_D <= unsigned(-signed(I_divisor));
              else
                s_D <= unsigned(I_divisor);
              end if;

              s_Q <= X"00000000";
              s_R <= X"00000000";

              s_i <= 31;
            end if;
          end if;
        end if;

      elsif s_state = STATE_INFLIGHTU then
        -- binary integer long division loop: one quotient bit per clock,
        -- from bit 31 down to bit 0
        v_partial := s_R(30 downto 0) & s_N(s_i);

        if v_partial >= s_D then
          s_R      <= v_partial - s_D;
          s_Q(s_i) <= '1';
        else
          s_R <= v_partial;
        end if;

        if s_i = 0 then
          s_state <= STATE_COMPLETE;
        else
          s_i <= s_i - 1;
        end if;

      elsif s_state = STATE_COMPLETE then
        -- Pick quotient or remainder and re-apply the sign.
        if (s_op = ALU_INT32_DIV_OP_DIV) or (s_op = ALU_INT32_DIV_OP_DIVU) then
          if (s_outsign = '1') then
            s_result <= std_logic_vector(-signed(std_logic_vector(s_Q)));
          else
            s_result <= std_logic_vector(s_Q);
          end if;
        else
          if (s_outsign = '1') then
            s_result <= std_logic_vector(-signed(std_logic_vector(s_R)));
          else
            s_result <= std_logic_vector(s_R);
          end if;
        end if;

        s_done  <= '1';
        s_state <= STATE_IDLE;
      end if;
    end if;
  end process;

  O_dataResult <= s_result;
  O_done       <= s_done;
  O_int        <= s_int;
end Behavioral;
20 changes: 20 additions & 0 deletions vhdl/constants.vhd
Original file line number Diff line number Diff line change
Expand Up @@ -149,6 +149,24 @@ constant F7_OP_OR: std_logic_vector(6 downto 0) := "0000000";
constant F3_OP_AND: std_logic_vector(2 downto 0) := "111";
constant F7_OP_AND: std_logic_vector(6 downto 0) := "0000000";

-- RV32M Extension
-- NOTE(review): by analogy with the F3_/F7_ constants above, these presumably
-- hold the funct7 / funct3 instruction fields of the multiply/divide ops --
-- confirm against the decoder.
constant F7_OP_M_EXT: std_logic_vector(6 downto 0) := "0000001";
constant F3_OP_M_MUL: std_logic_vector(2 downto 0) := "000";
constant F3_OP_M_MULH: std_logic_vector(2 downto 0) := "001";
constant F3_OP_M_MULHSU: std_logic_vector(2 downto 0) := "010";
constant F3_OP_M_MULHU: std_logic_vector(2 downto 0) := "011";
constant F3_OP_M_DIV: std_logic_vector(2 downto 0) := "100";
constant F3_OP_M_DIVU: std_logic_vector(2 downto 0) := "101";
constant F3_OP_M_REM: std_logic_vector(2 downto 0) := "110";
constant F3_OP_M_REMU: std_logic_vector(2 downto 0) := "111";

-- Operation select codes for the I_op port of alu_int32_div.
-- Bit 0 (ALU_INT32_DIV_OP_UNSIGNED_BIT) set denotes the unsigned variant;
-- bit 1 set selects the remainder instead of the quotient. Each code equals
-- the low two bits of the matching F3_OP_M_DIV/DIVU/REM/REMU value above.
constant ALU_INT32_DIV_OP_UNSIGNED_BIT: integer := 0;
constant ALU_INT32_DIV_OP_DIV: std_logic_vector(1 downto 0) := "00";
constant ALU_INT32_DIV_OP_DIVU: std_logic_vector(1 downto 0) := "01";
constant ALU_INT32_DIV_OP_REM: std_logic_vector(1 downto 0) := "10";
constant ALU_INT32_DIV_OP_REMU: std_logic_vector(1 downto 0) := "11";

constant F3_MISCMEM_FENCE: std_logic_vector(2 downto 0) := "000";
constant F3_MISCMEM_FENCEI: std_logic_vector(2 downto 0) := "001";

Expand Down Expand Up @@ -262,6 +280,8 @@ constant CSR_OP_IMM_CLEAR_WR: std_logic_vector(4 downto 0) := "11100";
constant CSR_OP_IMM_CLEAR_W: std_logic_vector(4 downto 0) := "11101";
constant CSR_OP_IMM_CLEAR_R: std_logic_vector(4 downto 0) := "11110";

end constants;

package body constants is
Expand Down

0 comments on commit 4b16f9b

Please sign in to comment.