forked from libre-chip/cpu
WIP adding fetch::l1_i_cache
This commit is contained in:
parent
c62d33048c
commit
94ae979686
7 changed files with 46935 additions and 4 deletions
|
|
@ -37,6 +37,8 @@ pub struct CpuConfig {
|
|||
pub max_branches_per_fetch: NonZeroUsize,
|
||||
pub max_fetches_in_flight: NonZeroUsize,
|
||||
pub log2_fetch_width_in_bytes: u8,
|
||||
pub log2_cache_line_size_in_bytes: u8,
|
||||
pub log2_l1_i_cache_line_count: u8,
|
||||
/// default value for [`UnitConfig::max_in_flight`]
|
||||
pub default_unit_max_in_flight: NonZeroUsize,
|
||||
pub rob_size: NonZeroUsize,
|
||||
|
|
@ -63,6 +65,8 @@ impl CpuConfig {
|
|||
v
|
||||
};
|
||||
pub const DEFAULT_LOG2_FETCH_WIDTH_IN_BYTES: u8 = 3;
|
||||
pub const DEFAULT_LOG2_CACHE_LINE_SIZE_IN_BYTES: u8 = 6;
|
||||
pub const DEFAULT_LOG2_L1_I_CACHE_LINE_COUNT: u8 = 8;
|
||||
pub const DEFAULT_UNIT_MAX_IN_FLIGHT: NonZeroUsize = {
|
||||
let Some(v) = NonZeroUsize::new(8) else {
|
||||
unreachable!();
|
||||
|
|
@ -77,6 +81,8 @@ impl CpuConfig {
|
|||
max_branches_per_fetch: Self::DEFAULT_MAX_BRANCHES_PER_FETCH,
|
||||
max_fetches_in_flight: Self::DEFAULT_MAX_FETCHES_IN_FLIGHT,
|
||||
log2_fetch_width_in_bytes: Self::DEFAULT_LOG2_FETCH_WIDTH_IN_BYTES,
|
||||
log2_cache_line_size_in_bytes: Self::DEFAULT_LOG2_CACHE_LINE_SIZE_IN_BYTES,
|
||||
log2_l1_i_cache_line_count: Self::DEFAULT_LOG2_L1_I_CACHE_LINE_COUNT,
|
||||
default_unit_max_in_flight: Self::DEFAULT_UNIT_MAX_IN_FLIGHT,
|
||||
rob_size,
|
||||
}
|
||||
|
|
@ -141,6 +147,37 @@ impl CpuConfig {
|
|||
.checked_shl(self.log2_fetch_width_in_bytes.into())
|
||||
.expect("log2_fetch_width_in_bytes is too big")
|
||||
}
|
||||
pub fn cache_line_size_in_bytes(&self) -> usize {
|
||||
1usize
|
||||
.checked_shl(self.log2_cache_line_size_in_bytes.into())
|
||||
.expect("log2_cache_line_size_in_bytes is too big")
|
||||
}
|
||||
pub fn log2_fetches_per_cache_line(&self) -> usize {
|
||||
self.log2_cache_line_size_in_bytes
|
||||
.checked_sub(self.log2_fetch_width_in_bytes)
|
||||
.expect("cache line size in bytes must not be smaller than fetch width in bytes")
|
||||
.into()
|
||||
}
|
||||
pub fn fetches_per_cache_line(&self) -> usize {
|
||||
self.log2_fetches_per_cache_line()
|
||||
.try_into()
|
||||
.ok()
|
||||
.and_then(|v| 1usize.checked_shl(v))
|
||||
.expect("log2_fetches_per_cache_line is too big")
|
||||
}
|
||||
pub fn l1_i_cache_line_count(&self) -> usize {
|
||||
1usize
|
||||
.checked_shl(self.log2_l1_i_cache_line_count.into())
|
||||
.expect("log2_l1_i_cache_line_count is too big")
|
||||
}
|
||||
pub fn log2_l1_i_cache_size_in_bytes(&self) -> usize {
|
||||
self.log2_l1_i_cache_line_count as usize + self.log2_cache_line_size_in_bytes as usize
|
||||
}
|
||||
pub fn l1_i_cache_size_in_bytes(&self) -> usize {
|
||||
1usize
|
||||
.checked_shl(self.log2_l1_i_cache_size_in_bytes() as _)
|
||||
.expect("L1 I-Cache is too big")
|
||||
}
|
||||
}
|
||||
|
||||
#[hdl(get(|c| c.fetch_width.get()))]
|
||||
|
|
@ -161,6 +198,30 @@ pub type CpuConfigLog2FetchWidthInBytes<C: PhantomConstGet<CpuConfig>> = DynSize
|
|||
#[hdl(get(|c| c.fetch_width_in_bytes()))]
|
||||
pub type CpuConfigFetchWidthInBytes<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// The aliases below are all `DynSize`; each `#[hdl(get(...))]` closure names the `CpuConfig`
// accessor or field the size is read from.
// NOTE(review): exact semantics of `#[hdl(get(...))]` are defined by fayalite -- confirm there.

// Size taken from `CpuConfig::log2_fetches_per_cache_line()`.
#[hdl(get(|c| c.log2_fetches_per_cache_line()))]
|
||||
pub type CpuConfigLog2FetchesPerCacheLine<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from `CpuConfig::fetches_per_cache_line()`.
#[hdl(get(|c| c.fetches_per_cache_line()))]
|
||||
pub type CpuConfigFetchesPerCacheLine<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from the `log2_cache_line_size_in_bytes` field.
#[hdl(get(|c| c.log2_cache_line_size_in_bytes.into()))]
|
||||
pub type CpuConfigLog2CacheLineSizeInBytes<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from `CpuConfig::cache_line_size_in_bytes()`.
#[hdl(get(|c| c.cache_line_size_in_bytes()))]
|
||||
pub type CpuConfigCacheLineSizeInBytes<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from the `log2_l1_i_cache_line_count` field.
#[hdl(get(|c| c.log2_l1_i_cache_line_count.into()))]
|
||||
pub type CpuConfigLog2L1ICacheLineCount<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from `CpuConfig::l1_i_cache_line_count()`.
#[hdl(get(|c| c.l1_i_cache_line_count()))]
|
||||
pub type CpuConfigL1ICacheLineCount<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from `CpuConfig::log2_l1_i_cache_size_in_bytes()`.
#[hdl(get(|c| c.log2_l1_i_cache_size_in_bytes()))]
|
||||
pub type CpuConfigLog2L1ICacheSizeInBytes<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
// Size taken from `CpuConfig::l1_i_cache_size_in_bytes()`.
#[hdl(get(|c| c.l1_i_cache_size_in_bytes()))]
|
||||
pub type CpuConfigL1ICacheSizeInBytes<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
#[hdl(get(|c| c.rob_size.get()))]
|
||||
pub type CpuConfigRobSize<C: PhantomConstGet<CpuConfig>> = DynSize;
|
||||
|
||||
|
|
|
|||
1056
crates/cpu/src/fetch.rs
Normal file
1056
crates/cpu/src/fetch.rs
Normal file
File diff suppressed because it is too large
Load diff
|
|
@ -2,6 +2,7 @@
|
|||
// See Notices.txt for copyright information
|
||||
pub mod config;
|
||||
pub mod decoder;
|
||||
pub mod fetch;
|
||||
pub mod instruction;
|
||||
pub mod next_pc;
|
||||
pub mod powerisa_instructions_xml;
|
||||
|
|
|
|||
|
|
@ -2719,13 +2719,13 @@ impl SimValueDefault for BranchPredictionState {
|
|||
|
||||
#[derive(Copy, Clone, Debug)]
|
||||
#[must_use]
|
||||
enum ResetStatus {
|
||||
pub(crate) enum ResetStatus {
|
||||
Done,
|
||||
Working,
|
||||
}
|
||||
|
||||
impl ResetStatus {
|
||||
fn and(self, other: Self) -> Self {
|
||||
pub(crate) fn and(self, other: Self) -> Self {
|
||||
match (self, other) {
|
||||
(ResetStatus::Done, ResetStatus::Done) => ResetStatus::Done,
|
||||
(ResetStatus::Done | ResetStatus::Working, ResetStatus::Working)
|
||||
|
|
@ -2734,7 +2734,7 @@ impl ResetStatus {
|
|||
}
|
||||
}
|
||||
|
||||
trait SimValueDefault: Type {
|
||||
pub(crate) trait SimValueDefault: Type {
|
||||
fn sim_value_default(self) -> SimValue<Self>;
|
||||
}
|
||||
|
||||
|
|
@ -2828,7 +2828,7 @@ impl SimValueDefault for WipDecodedInsn {
|
|||
}
|
||||
}
|
||||
|
||||
trait ResetSteps: Type {
|
||||
pub(crate) trait ResetSteps: Type {
|
||||
fn reset_step(this: &mut SimValue<Self>, step: usize) -> ResetStatus;
|
||||
}
|
||||
|
||||
|
|
|
|||
|
|
@ -2,6 +2,24 @@
|
|||
// See Notices.txt for copyright information
|
||||
|
||||
use fayalite::{expr::ops::ExprIndex, int::UIntInRangeInclusiveType, prelude::*};
|
||||
use std::fmt;
|
||||
|
||||
/// Error produced when more items were supplied than fit.
///
/// * `value` holds whatever the caller had built when it ran out of room.
/// * `rest` yields the items that did not fit: the first overflowing item, followed by
///   the remainder of the source iterator.
#[derive(Clone, Debug)]
pub struct ArrayVecFullError<V, I: Iterator> {
    pub value: V,
    pub rest: std::iter::Chain<std::iter::Once<I::Item>, I>,
}

impl<V, I: Iterator> fmt::Display for ArrayVecFullError<V, I> {
    /// Writes the fixed message `ArrayVec is full`.
    fn fmt(&self, out: &mut fmt::Formatter<'_>) -> fmt::Result {
        out.write_str("ArrayVec is full")
    }
}

// `Error` requires `Debug`; the derived `Debug` impl needs all three bounds below.
impl<V, I> std::error::Error for ArrayVecFullError<V, I>
where
    V: fmt::Debug,
    I: Iterator + fmt::Debug,
    I::Item: fmt::Debug,
{
}
|
||||
|
||||
// Alias for `UIntInRangeInclusiveType<ConstUsize<0>, Max>`.
// NOTE(review): presumably an unsigned integer type ranging over `0..=Max` -- confirm in fayalite.
#[hdl]
|
||||
pub type Length<Max: Size> = UIntInRangeInclusiveType<ConstUsize<0>, Max>;
|
||||
|
|
@ -46,6 +64,29 @@ impl<T: Type, N: Size> ArrayVec<T, N> {
|
|||
len: self.elements.len().to_sim_value_with_type(self.len),
|
||||
}
|
||||
}
|
||||
pub fn from_iter_sim<I: IntoIterator<Item: ToSimValueWithType<T>>>(
|
||||
self,
|
||||
uninit_element: impl ToSimValueWithType<T>,
|
||||
iter: I,
|
||||
) -> Result<SimValue<Self>, ArrayVecFullError<SimValue<Self>, I::IntoIter>> {
|
||||
let mut value = Self::new_sim(self, uninit_element);
|
||||
let element = self.element();
|
||||
let mut iter = iter.into_iter();
|
||||
for i in 0..self.capacity() {
|
||||
let Some(v) = iter.next() else {
|
||||
break;
|
||||
};
|
||||
value.elements[i] = v.into_sim_value_with_type(element);
|
||||
}
|
||||
if let Some(extra) = iter.next() {
|
||||
Err(ArrayVecFullError {
|
||||
value,
|
||||
rest: std::iter::once(extra).chain(iter),
|
||||
})
|
||||
} else {
|
||||
Ok(value)
|
||||
}
|
||||
}
|
||||
pub fn element(self) -> T {
|
||||
self.elements.element()
|
||||
}
|
||||
|
|
|
|||
45574
crates/cpu/tests/expected/fetch.vcd
generated
Normal file
45574
crates/cpu/tests/expected/fetch.vcd
generated
Normal file
File diff suppressed because it is too large
Load diff
198
crates/cpu/tests/fetch.rs
Normal file
198
crates/cpu/tests/fetch.rs
Normal file
|
|
@ -0,0 +1,198 @@
|
|||
// SPDX-License-Identifier: LGPL-3.0-or-later
|
||||
// See Notices.txt for copyright information
|
||||
|
||||
use cpu::{
|
||||
config::{CpuConfig, UnitConfig},
|
||||
fetch::{MemoryInterface, fetch},
|
||||
next_pc::NextPcToFetchInterface,
|
||||
unit::UnitKind,
|
||||
util::array_vec::ArrayVec,
|
||||
};
|
||||
use fayalite::{
|
||||
prelude::*,
|
||||
sim::vcd::VcdWriterDecls,
|
||||
util::{DebugAsDisplay, RcWriter},
|
||||
};
|
||||
use std::{cell::Cell, collections::VecDeque, num::NonZeroUsize};
|
||||
|
||||
const MEMORY_QUEUE_SIZE: usize = 32;
|
||||
|
||||
// One entry of the mock memory's request queue, exposed through `queue_debug`.
#[hdl]
|
||||
struct MemoryQueueEntry {
|
||||
// 64-bit address of the queued request.
addr: UInt<64>,
|
||||
// NOTE(review): presumably the number of cycles until the request completes -- nothing in
// the visible code reads or updates this yet.
cycles_left: UInt<8>,
|
||||
}
|
||||
|
||||
impl MemoryQueueEntry {
|
||||
// Returns a simulation value with every field zeroed; used as the filler element when
// building `ArrayVec` simulation values via `new_sim`.
#[hdl]
|
||||
fn default_sim(self) -> SimValue<Self> {
|
||||
#[hdl(sim)]
|
||||
Self {
|
||||
addr: 0u64,
|
||||
cycles_left: 0u8,
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Extern (simulation-only) module standing in for the memory behind `fetch`.
//
// Ports: `cd` (clock domain, input), `memory_interface` (input) and `queue_debug` (output
// mirror of the internal request queue).
// Work in progress: the run loop below only mirrors and prints the queue; it does not yet
// accept or complete any request.
#[hdl_module(extern)]
|
||||
fn mock_memory(config: PhantomConst<CpuConfig>) {
|
||||
#[hdl]
|
||||
let cd: ClockDomain = m.input();
|
||||
#[hdl]
|
||||
let memory_interface: MemoryInterface<PhantomConst<CpuConfig>> =
|
||||
m.input(MemoryInterface[config]);
|
||||
#[hdl]
|
||||
let queue_debug: ArrayVec<MemoryQueueEntry, ConstUsize<{ MEMORY_QUEUE_SIZE }>> = m.output();
|
||||
m.register_clock_for_past(cd.clk);
|
||||
m.extern_module_simulation_fn(
|
||||
(cd, memory_interface, queue_debug),
|
||||
|(cd, memory_interface, queue_debug), mut sim| async move {
|
||||
// intentionally have a different sequence each time we're reset
// (the counter is created outside `resettable`, so it is not re-created on reset)
|
||||
let delay_sequence_index = Cell::new(0);
|
||||
sim.resettable(
|
||||
cd,
|
||||
// Reset handler: drive every output to its idle value.
async |mut sim| {
|
||||
sim.write(memory_interface.start.ready, false).await;
|
||||
sim.write(
|
||||
memory_interface.finish.data,
|
||||
memory_interface.ty().finish.data.HdlNone(),
|
||||
)
|
||||
.await;
|
||||
sim.write(
|
||||
queue_debug,
|
||||
queue_debug.ty().new_sim(MemoryQueueEntry.default_sim()),
|
||||
)
|
||||
.await;
|
||||
},
|
||||
// Run handler: delegates to `run_fn` below.
|sim, ()| {
|
||||
run_fn(
|
||||
cd,
|
||||
memory_interface,
|
||||
queue_debug,
|
||||
&delay_sequence_index,
|
||||
sim,
|
||||
)
|
||||
},
|
||||
)
|
||||
.await;
|
||||
},
|
||||
);
|
||||
// Main simulation loop of the mock memory.
// `delay_sequence_index` and `config` are not used by the visible code yet.
#[hdl]
|
||||
async fn run_fn(
|
||||
cd: Expr<ClockDomain>,
|
||||
memory_interface: Expr<MemoryInterface<PhantomConst<CpuConfig>>>,
|
||||
queue_debug: Expr<ArrayVec<MemoryQueueEntry, ConstUsize<{ MEMORY_QUEUE_SIZE }>>>,
|
||||
delay_sequence_index: &Cell<u64>,
|
||||
mut sim: ExternModuleSimulationState,
|
||||
) {
|
||||
let config = memory_interface.config.ty();
|
||||
// Nothing in the visible code pushes to or pops from `queue`, so it stays empty for now.
let mut queue: VecDeque<SimValue<MemoryQueueEntry>> = VecDeque::new();
|
||||
loop {
|
||||
// Rebuild the debug mirror of `queue` from scratch on every iteration.
let mut sim_queue = queue_debug.ty().new_sim(MemoryQueueEntry.default_sim());
|
||||
for entry in &queue {
|
||||
ArrayVec::try_push_sim(&mut sim_queue, entry)
|
||||
.ok()
|
||||
.expect("queue is known to be small enough");
|
||||
}
|
||||
sim.write(queue_debug, sim_queue).await;
|
||||
// TODO:
|
||||
sim.wait_for_clock_edge(cd.clk).await;
|
||||
// Print the address of every queued entry after each clock edge.
println!(
|
||||
"Dump mock memory queue: {:#?}",
|
||||
Vec::from_iter(
|
||||
queue
|
||||
.iter()
|
||||
.map(|v| { DebugAsDisplay(format!("addr={:#x}", v.addr.as_int())) })
|
||||
)
|
||||
);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Device under test: wires one `fetch` instance to one `mock_memory` instance.
//
// Ports: `cd` (clock domain, input) and `from_next_pc` (input).
#[hdl_module]
|
||||
fn dut(config: PhantomConst<CpuConfig>) {
|
||||
#[hdl]
|
||||
let cd: ClockDomain = m.input();
|
||||
#[hdl]
|
||||
let from_next_pc: NextPcToFetchInterface<PhantomConst<CpuConfig>> =
|
||||
m.input(NextPcToFetchInterface[config]);
|
||||
#[hdl]
|
||||
let fetch = instance(fetch(config));
|
||||
#[hdl]
|
||||
let fetch {
|
||||
cd: fetch_cd,
|
||||
memory_interface: fetch_memory_interface,
|
||||
from_next_pc: fetch_from_next_pc,
|
||||
} = fetch;
|
||||
// Drive the fetch unit from this module's clock domain and `from_next_pc` input.
connect(fetch_cd, cd);
|
||||
connect(fetch_from_next_pc, from_next_pc);
|
||||
#[hdl]
|
||||
let mock_memory = instance(mock_memory(config));
|
||||
#[hdl]
|
||||
let mock_memory {
|
||||
cd: mock_memory_cd,
|
||||
memory_interface: mock_memory_interface,
|
||||
// The debug output is not connected to anything here.
queue_debug: _,
|
||||
} = mock_memory;
|
||||
connect(mock_memory_cd, cd);
|
||||
// The mock memory's interface is driven from the fetch unit's memory interface.
connect(mock_memory_interface, fetch_memory_interface);
|
||||
}
|
||||
|
||||
/// Simulates `dut` for 2000 clock cycles with both `from_next_pc` inputs held at `HdlNone`
/// and compares the resulting VCD trace with `expected/fetch.vcd`.
#[test]
fn test_fetch() {
    let _n = SourceLocation::normalize_files_for_tests();
    let mut config = CpuConfig::new(
        vec![
            UnitConfig::new(UnitKind::AluBranch),
            UnitConfig::new(UnitKind::AluBranch),
        ],
        NonZeroUsize::new(20).unwrap(),
    );
    config.fetch_width = NonZeroUsize::new(2).unwrap();
    config.log2_fetch_width_in_bytes = 4;
    // `CpuConfig` stores the L1 I-cache line count as a log2 (`log2_l1_i_cache_line_count: u8`);
    // `l1_i_cache_line_count` is a derived method, not an assignable field.
    // 2^4 = 16 cache lines.
    config.log2_l1_i_cache_line_count = 4;
    let m = dut(PhantomConst::new_sized(config));
    let mut sim = Simulation::new(m);
    let writer = RcWriter::default();
    sim.add_trace_writer(VcdWriterDecls::new(writer.clone()));
    // Guard that prints the VCD collected so far if the test unwinds before the explicit
    // comparison at the end takes the writer out.
    struct DumpVcdOnDrop {
        writer: Option<RcWriter>,
    }
    impl Drop for DumpVcdOnDrop {
        fn drop(&mut self) {
            if let Some(mut writer) = self.writer.take() {
                let vcd = String::from_utf8(writer.take()).unwrap();
                println!("####### VCD:\n{vcd}\n#######");
            }
        }
    }
    let mut writer = DumpVcdOnDrop {
        writer: Some(writer),
    };
    let from_next_pc_ty = sim.io().from_next_pc.ty();
    // Start with the clock low and reset asserted; both `from_next_pc` inputs stay `HdlNone`.
    sim.write_clock(sim.io().cd.clk, false);
    sim.write_reset(sim.io().cd.rst, true);
    sim.write(
        sim.io().from_next_pc.cancel.data,
        from_next_pc_ty.cancel.data.HdlNone(),
    );
    sim.write(
        sim.io().from_next_pc.fetch.data,
        from_next_pc_ty.fetch.data.HdlNone(),
    );
    for cycle in 0..2000 {
        // TODO: drive from_next_pc
        sim.advance_time(SimDuration::from_nanos(500));
        println!("clock tick: {cycle}");
        sim.write_clock(sim.io().cd.clk, true);
        sim.advance_time(SimDuration::from_nanos(500));
        sim.write_clock(sim.io().cd.clk, false);
        // Reset is released after the first full clock cycle and stays low afterwards.
        sim.write_reset(sim.io().cd.rst, false);
    }
    // FIXME: vcd is just whatever fetch does now, which isn't known to be correct
    let vcd = String::from_utf8(writer.writer.take().unwrap().take()).unwrap();
    println!("####### VCD:\n{vcd}\n#######");
    if vcd != include_str!("expected/fetch.vcd") {
        panic!();
    }
}
|
||||
Loading…
Add table
Add a link
Reference in a new issue