WIP: splitting reg_alloc
This commit is contained in:
		
							parent
							
								
									3f94ec24a6
								
							
						
					
					
						commit
						de080a6d4a
					
				
					 15 changed files with 818 additions and 543 deletions
				
			
		|  | @ -16,3 +16,6 @@ version.workspace = true | |||
| 
 | ||||
| [dependencies] | ||||
| fayalite.workspace = true | ||||
| 
 | ||||
| [lints.rust] | ||||
| unexpected_cfgs = { level = "warn", check-cfg = ['cfg(todo)'] } | ||||
|  |  | |||
|  | @ -3,8 +3,9 @@ | |||
| use crate::{ | ||||
|     instruction::{MOpTrait, PRegNum, RenamedMOp, UnitNum, UnitOutRegNum, CONST_ZERO_UNIT_NUM}, | ||||
|     unit::{ | ||||
|         unit_base::{UnitForwardingInfo, UnitToRegAlloc}, | ||||
|         UnitCancelInput, UnitKind, UnitOutputWrite, | ||||
|         unit_base::{ExecuteEnd, ExecuteStart}, | ||||
|         RenamedInsnData, RetireQueueIndex, UnitForwardingInfo, UnitKind, UnitOutputWrite, | ||||
|         UnitToRegAlloc, | ||||
|     }, | ||||
| }; | ||||
| use fayalite::prelude::*; | ||||
|  | @ -35,7 +36,6 @@ pub struct CpuConfig { | |||
|     pub fetch_width: NonZeroUsize, | ||||
|     /// default value for [`UnitConfig::max_in_flight`]
 | ||||
|     pub default_unit_max_in_flight: NonZeroUsize, | ||||
|     pub rob_size: NonZeroUsize, | ||||
| } | ||||
| 
 | ||||
| impl CpuConfig { | ||||
|  | @ -52,13 +52,12 @@ impl CpuConfig { | |||
|         }; | ||||
|         v | ||||
|     }; | ||||
|     pub fn new(units: Vec<UnitConfig>, rob_size: NonZeroUsize) -> Self { | ||||
|     pub fn new(units: Vec<UnitConfig>) -> Self { | ||||
|         Self { | ||||
|             units, | ||||
|             out_reg_num_width: Self::DEFAULT_OUT_REG_NUM_WIDTH, | ||||
|             fetch_width: Self::DEFAULT_FETCH_WIDTH, | ||||
|             default_unit_max_in_flight: Self::DEFAULT_UNIT_MAX_IN_FLIGHT, | ||||
|             rob_size, | ||||
|         } | ||||
|     } | ||||
|     pub fn non_const_unit_nums(&self) -> std::ops::Range<usize> { | ||||
|  | @ -79,8 +78,8 @@ impl CpuConfig { | |||
|     pub fn p_reg_num_width(&self) -> usize { | ||||
|         self.unit_num_width() + self.out_reg_num_width | ||||
|     } | ||||
|     pub fn renamed_mop_in_unit(&self) -> RenamedMOp<UnitOutRegNum<DynSize>, DynSize> { | ||||
|         RenamedMOp[self.unit_out_reg_num()][self.p_reg_num_width()] | ||||
|     pub fn renamed_mop(&self) -> RenamedMOp<DynSize> { | ||||
|         RenamedMOp[self.p_reg_num_width()] | ||||
|     } | ||||
|     pub fn unit_output_write(&self) -> UnitOutputWrite<DynSize> { | ||||
|         UnitOutputWrite[self.out_reg_num_width] | ||||
|  | @ -88,9 +87,6 @@ impl CpuConfig { | |||
|     pub fn unit_output_writes(&self) -> Array<HdlOption<UnitOutputWrite<DynSize>>> { | ||||
|         Array[HdlOption[self.unit_output_write()]][self.non_const_unit_nums().len()] | ||||
|     } | ||||
|     pub fn unit_cancel_input(&self) -> UnitCancelInput<DynSize> { | ||||
|         UnitCancelInput[self.out_reg_num_width] | ||||
|     } | ||||
|     pub fn unit_forwarding_info(&self) -> UnitForwardingInfo<DynSize, DynSize, DynSize> { | ||||
|         UnitForwardingInfo[self.unit_num_width()][self.out_reg_num_width] | ||||
|             [self.non_const_unit_nums().len()] | ||||
|  | @ -101,19 +97,39 @@ impl CpuConfig { | |||
|             .unwrap_or(self.default_unit_max_in_flight) | ||||
|     } | ||||
|     pub fn unit_to_reg_alloc< | ||||
|         MOp: Type + MOpTrait<DestReg = UnitOutRegNum<DynSize>, SrcRegWidth = DynSize>, | ||||
|         MOp: Type + MOpTrait<DestReg = (), SrcRegWidth = DynSize>, | ||||
|         ExtraOut: Type, | ||||
|     >( | ||||
|         &self, | ||||
|         mop_ty: MOp, | ||||
|         extra_out_ty: ExtraOut, | ||||
|     ) -> UnitToRegAlloc<MOp, ExtraOut, DynSize, DynSize, DynSize> { | ||||
|         assert_eq!( | ||||
|             mop_ty.dest_reg_ty(), | ||||
|             self.unit_out_reg_num(), | ||||
|             "inconsistent types", | ||||
|         ); | ||||
|     ) -> UnitToRegAlloc<MOp, ExtraOut, DynSize, DynSize, DynSize, DynSize> { | ||||
|         UnitToRegAlloc[mop_ty][extra_out_ty][self.unit_num_width()][self.out_reg_num_width] | ||||
|             [self.non_const_unit_nums().len()] | ||||
|             [self.non_const_unit_nums().len()][self.retire_queue_index_width()] | ||||
|     } | ||||
|     pub fn retire_queue_index_width(&self) -> usize { | ||||
|         let max_in_flight: usize = (0..self.units.len()) | ||||
|             .map(|unit_index| self.unit_max_in_flight(unit_index).get()) | ||||
|             .sum(); | ||||
|         2 + max_in_flight.next_power_of_two().ilog2() as usize | ||||
|     } | ||||
|     pub fn retire_queue_index(&self) -> RetireQueueIndex<DynSize> { | ||||
|         RetireQueueIndex[self.retire_queue_index_width()] | ||||
|     } | ||||
|     pub fn renamed_insn_data<MOp: Type, DestReg: Type>( | ||||
|         &self, | ||||
|         mop: MOp, | ||||
|         dest: DestReg, | ||||
|     ) -> RenamedInsnData<MOp, DestReg, DynSize> { | ||||
|         RenamedInsnData[mop][dest][self.retire_queue_index_width()] | ||||
|     } | ||||
|     pub fn execute_start<MOp: Type>(&self, mop: MOp) -> ExecuteStart<MOp, DynSize, DynSize> { | ||||
|         ExecuteStart[mop][self.out_reg_num_width][self.retire_queue_index_width()] | ||||
|     } | ||||
|     pub fn execute_end<ExtraOut: Type>( | ||||
|         &self, | ||||
|         extra_out_ty: ExtraOut, | ||||
|     ) -> ExecuteEnd<DynSize, DynSize, ExtraOut> { | ||||
|         ExecuteEnd[self.out_reg_num_width][self.retire_queue_index_width()][extra_out_ty] | ||||
|     } | ||||
| } | ||||
|  |  | |||
|  | @ -910,11 +910,9 @@ impl MOpRegNum { | |||
|     //
 | ||||
|     // TODO: maybe add more registers later.
 | ||||
|     pub const FLAG_REG_NUMS: Range<u32> = 0xFE..0x100; | ||||
|     /// registers handled by a special small rename table (for flags and stuff, since it has more read/write ports)
 | ||||
|     pub const SPECIAL_REG_NUMS: Range<u32> = Self::FLAG_REG_NUMS; | ||||
|     /// registers handled by the large rename table for normal registers (has less read/write ports)
 | ||||
|     pub const NORMAL_REG_NUMS: Range<u32> = | ||||
|         Self::CONST_ZERO_REG_NUM + 1..Self::SPECIAL_REG_NUMS.start; | ||||
|     /// registers that aren't constants
 | ||||
|     pub const NON_CONST_REG_NUMS: Range<u32> = | ||||
|         Self::CONST_ZERO_REG_NUM + 1..Self::FLAG_REG_NUMS.end; | ||||
| } | ||||
| 
 | ||||
| #[hdl(cmp_eq)] | ||||
|  | @ -929,29 +927,6 @@ pub struct MOpDestReg { | |||
|     pub flag_regs: Array<HdlOption<()>, { range_u32_len(&MOpRegNum::FLAG_REG_NUMS) }>, | ||||
| } | ||||
| 
 | ||||
| #[derive(Copy, Clone, Eq, PartialEq, Ord, PartialOrd, Hash, Debug)] | ||||
| pub enum RenameTableName { | ||||
|     /// the large rename table for normal registers (has less read/write ports)
 | ||||
|     Normal, | ||||
|     /// a special small rename table (for flags and stuff, since it has more read/write ports)
 | ||||
|     Special, | ||||
| } | ||||
| 
 | ||||
| impl RenameTableName { | ||||
|     pub const fn reg_range(self) -> std::ops::Range<u32> { | ||||
|         match self { | ||||
|             Self::Normal => MOpRegNum::NORMAL_REG_NUMS, | ||||
|             Self::Special => MOpRegNum::SPECIAL_REG_NUMS, | ||||
|         } | ||||
|     } | ||||
|     pub const fn as_str(self) -> &'static str { | ||||
|         match self { | ||||
|             Self::Normal => "rename_table_normal", | ||||
|             Self::Special => "rename_table_special", | ||||
|         } | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[derive(Copy, Clone, Eq, PartialEq, Hash, Debug)] | ||||
| pub enum MOpDestRegKind { | ||||
|     NormalReg { | ||||
|  | @ -989,16 +964,13 @@ impl fmt::Display for MOpDestRegName { | |||
| } | ||||
| 
 | ||||
| impl MOpDestRegKind { | ||||
|     pub const fn reg_range(self) -> std::ops::Range<u32> { | ||||
|     pub const fn reg_num_range(self) -> std::ops::Range<u32> { | ||||
|         match self { | ||||
|             Self::NormalReg { .. } => MOpRegNum::NORMAL_REG_NUMS, | ||||
|             Self::FlagReg { .. } => MOpRegNum::FLAG_REG_NUMS, | ||||
|         } | ||||
|     } | ||||
|     pub const fn rename_table_names(self) -> &'static [RenameTableName] { | ||||
|         match self { | ||||
|             Self::NormalReg { .. } => &[RenameTableName::Normal, RenameTableName::Special], | ||||
|             Self::FlagReg { .. } => &[RenameTableName::Special], | ||||
|             Self::NormalReg { dest_reg_index: _ } => MOpRegNum::NON_CONST_REG_NUMS, | ||||
|             Self::FlagReg { | ||||
|                 reg_num, | ||||
|                 flag_reg_index: _, | ||||
|             } => reg_num..reg_num + 1, | ||||
|         } | ||||
|     } | ||||
|     pub fn fixed_reg_num(self) -> Option<u32> { | ||||
|  | @ -1091,5 +1063,5 @@ pub type MOp = UnitMOp< | |||
| >; | ||||
| 
 | ||||
| #[hdl] | ||||
| pub type RenamedMOp<DestReg: Type, SrcRegWidth: Size> = | ||||
|     UnitMOp<DestReg, SrcRegWidth, L2RegisterFileMOp<DestReg, SrcRegWidth>>; | ||||
| pub type RenamedMOp<SrcRegWidth: Size> = | ||||
|     UnitMOp<(), SrcRegWidth, L2RegisterFileMOp<(), SrcRegWidth>>; | ||||
|  |  | |||
							
								
								
									
										267
									
								
								crates/cpu/src/instruction_rename.rs
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										267
									
								
								crates/cpu/src/instruction_rename.rs
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,267 @@ | |||
| // SPDX-License-Identifier: LGPL-3.0-or-later
 | ||||
| // See Notices.txt for copyright information
 | ||||
| 
 | ||||
| use crate::{ | ||||
|     config::CpuConfig, | ||||
|     instruction::{MOp, MOpDestReg, MOpRegNum, MOpTrait, MoveRegMOp, PRegNum, RenamedMOp}, | ||||
|     rename_table::{rename_table, RenameTablePortConfig}, | ||||
|     unit::{RenamedInsnData, RetireQueueIndex, UnitMOp}, | ||||
|     util::array_vec::{ArrayVec, Length, ReadyValidArray}, | ||||
| }; | ||||
| use fayalite::{ | ||||
|     prelude::*, | ||||
|     util::{prefix_sum::PrefixSumAlgorithm, ready_valid::ReadyValid}, | ||||
| }; | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct InstructionRenameInputInsn<UnitNumWidth: Size, OutRegNumWidth: Size> { | ||||
|     pub mop: MOp, | ||||
|     pub pc: UInt<64>, | ||||
|     pub renamed_dest: PRegNum<UnitNumWidth, OutRegNumWidth>, | ||||
| } | ||||
| 
 | ||||
| impl CpuConfig { | ||||
|     pub fn instruction_rename_input_insn(&self) -> InstructionRenameInputInsn<DynSize, DynSize> { | ||||
|         InstructionRenameInputInsn[self.unit_num_width()][self.out_reg_num_width] | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| struct InsnsInPrefixSummary<FetchWidth: Size> { | ||||
|     all_ready: Bool, | ||||
|     ready_count: Length<FetchWidth>, | ||||
|     retire_queue_used: Length<FetchWidth>, | ||||
| } | ||||
| 
 | ||||
| #[hdl_module] | ||||
| pub fn instruction_rename(config: &CpuConfig) { | ||||
|     #[hdl] | ||||
|     let cd: ClockDomain = m.input(); | ||||
|     #[hdl] | ||||
|     let insns_in: ReadyValidArray<InstructionRenameInputInsn<DynSize, DynSize>, DynSize> = | ||||
|         m.input(ReadyValidArray[config.instruction_rename_input_insn()][config.fetch_width.get()]); | ||||
|     #[hdl] | ||||
|     let start_retire_queue_index: RetireQueueIndex<DynSize> = m.input(config.retire_queue_index()); | ||||
|     #[hdl] | ||||
|     let end_retire_queue_index: RetireQueueIndex<DynSize> = m.output(config.retire_queue_index()); | ||||
|     #[hdl] | ||||
|     let insns_out: Array< | ||||
|         ReadyValid<RenamedInsnData<RenamedMOp<DynSize>, PRegNum<DynSize, DynSize>, DynSize>>, | ||||
|     > = m.output( | ||||
|         Array[ReadyValid[config.renamed_insn_data(config.renamed_mop(), config.p_reg_num())]] | ||||
|             [config.fetch_width.get()], | ||||
|     ); | ||||
| 
 | ||||
|     // TODO: handle resetting table after cancelling instructions
 | ||||
| 
 | ||||
|     #[hdl] | ||||
|     let insns_ready_or_move = wire(Array[Bool][config.fetch_width.get()]); | ||||
| 
 | ||||
|     for (insn_ready_or_move, insn_out) in insns_ready_or_move.into_iter().zip(insns_out) { | ||||
|         connect(insn_ready_or_move, insn_out.ready); | ||||
|     } | ||||
| 
 | ||||
|     ArrayVec::for_each(insns_in.data, |fetch_index, input_insn| { | ||||
|         #[hdl] | ||||
|         match input_insn.mop { | ||||
|             UnitMOp::<_, _, _>::TransformedMove(_) => { | ||||
|                 connect(insns_ready_or_move[fetch_index], true); | ||||
|             } | ||||
|             UnitMOp::<_, _, _>::AluBranch(_) | UnitMOp::<_, _, _>::LoadStore(_) => {} | ||||
|         } | ||||
|     }); | ||||
| 
 | ||||
|     let insns_in_prefix_summary_ty = InsnsInPrefixSummary[config.fetch_width.get()]; | ||||
|     #[hdl] | ||||
|     let insns_in_prefix_summaries = | ||||
|         wire(Array[insns_in_prefix_summary_ty][config.fetch_width.get()]); | ||||
|     let insns_in_prefix_summaries_vec = PrefixSumAlgorithm::WorkEfficient.run( | ||||
|         (0..config.fetch_width.get()).map(|fetch_index| { | ||||
|             #[hdl] | ||||
|             let insns_in_prefix_summary_in = wire(insns_in_prefix_summary_ty); | ||||
|             #[hdl] | ||||
|             let InsnsInPrefixSummary::<_> { | ||||
|                 all_ready, | ||||
|                 ready_count, | ||||
|                 retire_queue_used, | ||||
|             } = insns_in_prefix_summary_in; | ||||
|             connect(all_ready, insns_out[fetch_index].ready); | ||||
|             connect( | ||||
|                 ready_count, | ||||
|                 Expr::ty(ready_count).cast_from_uint_unchecked(all_ready.cast_to(UInt[1])), | ||||
|             ); | ||||
|             connect(retire_queue_used, Expr::ty(retire_queue_used).zero()); | ||||
|             #[hdl] | ||||
|             if let HdlSome(input_insn) = ArrayVec::get(insns_in.data, fetch_index) { | ||||
|                 connect(retire_queue_used, ready_count); | ||||
|                 #[hdl] | ||||
|                 match input_insn.mop { | ||||
|                     UnitMOp::<_, _, _>::TransformedMove(_) => { | ||||
|                         connect(all_ready, true); | ||||
|                     } | ||||
|                     UnitMOp::<_, _, _>::AluBranch(_) | UnitMOp::<_, _, _>::LoadStore(_) => {} | ||||
|                 } | ||||
|             } | ||||
|             insns_in_prefix_summary_in | ||||
|         }), | ||||
|         |l, r| { | ||||
|             #[hdl] | ||||
|             let insns_in_prefix_summary_merge = wire(insns_in_prefix_summary_ty); | ||||
|             #[hdl] | ||||
|             let InsnsInPrefixSummary::<_> { | ||||
|                 all_ready, | ||||
|                 ready_count, | ||||
|                 retire_queue_used, | ||||
|             } = insns_in_prefix_summary_merge; | ||||
|             connect(all_ready, l.all_ready & r.all_ready); | ||||
|             #[hdl] | ||||
|             if l.all_ready { | ||||
|                 connect( | ||||
|                     ready_count, | ||||
|                     Expr::ty(ready_count).cast_from_uint_unchecked( | ||||
|                         Length::as_uint(l.ready_count) + Length::as_uint(r.ready_count), | ||||
|                     ), | ||||
|                 ); | ||||
|                 connect( | ||||
|                     retire_queue_used, | ||||
|                     Expr::ty(retire_queue_used).cast_from_uint_unchecked( | ||||
|                         Length::as_uint(l.retire_queue_used) + Length::as_uint(r.retire_queue_used), | ||||
|                     ), | ||||
|                 ); | ||||
|             } else { | ||||
|                 connect(ready_count, l.ready_count); | ||||
|                 connect(retire_queue_used, l.retire_queue_used); | ||||
|             } | ||||
|             insns_in_prefix_summary_merge | ||||
|         }, | ||||
|     ); | ||||
|     for (l, r) in insns_in_prefix_summaries | ||||
|         .into_iter() | ||||
|         .zip(insns_in_prefix_summaries_vec) | ||||
|     { | ||||
|         connect(l, r); | ||||
|     } | ||||
|     connect( | ||||
|         insns_in.ready, | ||||
|         insns_in_prefix_summaries[config.fetch_width.get() - 1].ready_count, | ||||
|     ); | ||||
| 
 | ||||
|     #[hdl] | ||||
|     let retire_queue_indexes = | ||||
|         wire(Array[config.retire_queue_index()][config.fetch_width.get() + 1]); | ||||
|     connect(retire_queue_indexes[0], start_retire_queue_index); | ||||
|     connect( | ||||
|         end_retire_queue_index, | ||||
|         retire_queue_indexes[config.fetch_width.get()], | ||||
|     ); | ||||
|     for (retire_queue_index, insns_in_prefix_summary) in retire_queue_indexes | ||||
|         .into_iter() | ||||
|         .skip(1) | ||||
|         .zip(insns_in_prefix_summaries) | ||||
|     { | ||||
|         connect_any( | ||||
|             retire_queue_index.index, | ||||
|             start_retire_queue_index.index | ||||
|                 + Length::as_uint(insns_in_prefix_summary.retire_queue_used), | ||||
|         ); | ||||
|     } | ||||
| 
 | ||||
|     let mut port_configs = Vec::new(); | ||||
|     let mut src_reg_count = 0; | ||||
|     MOpTrait::for_each_src_reg(MOp.uninit(), &mut |_, src_index| { | ||||
|         src_reg_count = src_reg_count.max(src_index + 1); | ||||
|     }); | ||||
|     for _ in 0..config.fetch_width.get() { | ||||
|         for _ in 0..src_reg_count { | ||||
|             port_configs.push(RenameTablePortConfig::Read { | ||||
|                 addr_range: MOpRegNum::NON_CONST_REG_NUMS, | ||||
|             }); | ||||
|         } | ||||
|         for dest_reg_kind in MOpDestReg::REG_KINDS { | ||||
|             port_configs.push(RenameTablePortConfig::Write { | ||||
|                 addr_range: dest_reg_kind.reg_num_range(), | ||||
|             }); | ||||
|         } | ||||
|     } | ||||
| 
 | ||||
|     #[hdl] | ||||
|     let rename_table = instance(rename_table(config, &port_configs)); | ||||
| 
 | ||||
|     connect(rename_table.cd, cd); | ||||
| 
 | ||||
|     for read_port in rename_table.read_ports { | ||||
|         connect_any(read_port.addr, 0_hdl_u0); | ||||
|     } | ||||
|     for write_port in rename_table.write_ports { | ||||
|         connect_any(write_port.addr, 0_hdl_u0); | ||||
|         connect_any(write_port.data, config.p_reg_num().const_zero()); | ||||
|     } | ||||
| 
 | ||||
|     ArrayVec::for_each( | ||||
|         ReadyValidArray::firing_data(insns_in), | ||||
|         |fetch_index, input_insn| { | ||||
|             let read_port_index = fetch_index * src_reg_count; | ||||
|             let write_port_index = fetch_index * MOpDestReg::REG_COUNT; | ||||
|             #[hdl] | ||||
|             let InstructionRenameInputInsn::<_, _> { | ||||
|                 mop, | ||||
|                 pc, | ||||
|                 renamed_dest, | ||||
|             } = input_insn; | ||||
|             let insn_out = MOpTrait::map_regs( | ||||
|                 mop, | ||||
|                 (), | ||||
|                 config.p_reg_num_width(), | ||||
|                 &mut |src_reg, src_index| { | ||||
|                     connect( | ||||
|                         rename_table.read_ports[read_port_index + src_index].addr, | ||||
|                         src_reg.cast_bits_to(MOpRegNum), | ||||
|                     ); | ||||
|                     rename_table.read_ports[read_port_index + src_index] | ||||
|                         .data | ||||
|                         .cast_to_bits() | ||||
|                 }, | ||||
|             ); | ||||
|             for (i, dest_reg) in MOpDestReg::regs(MOpTrait::dest_reg(mop)) | ||||
|                 .into_iter() | ||||
|                 .enumerate() | ||||
|             { | ||||
|                 connect( | ||||
|                     rename_table.write_ports[write_port_index + i].addr, | ||||
|                     dest_reg, | ||||
|                 ); | ||||
|                 connect( | ||||
|                     rename_table.write_ports[write_port_index + i].data, | ||||
|                     renamed_dest, | ||||
|                 ); | ||||
|             } | ||||
|             let insn_out = UnitMOp::try_with_transformed_move_op( | ||||
|                 insn_out, | ||||
|                 config.renamed_mop().TransformedMove, | ||||
|                 |insn_out: Expr<HdlOption<_>>, move_reg: Expr<MoveRegMOp<_, _>>| { | ||||
|                     for i in 0..MOpDestReg::REG_COUNT { | ||||
|                         // execute move by using same PRegNum as src[0] for dest
 | ||||
|                         connect( | ||||
|                             rename_table.write_ports[write_port_index + i].data, | ||||
|                             move_reg.common.src[0].cast_bits_to(config.p_reg_num()), | ||||
|                         ); | ||||
|                     } | ||||
|                     // move already executed, so remove it
 | ||||
|                     connect(insn_out, Expr::ty(insn_out).HdlNone()); | ||||
|                 }, | ||||
|             ); | ||||
|             connect( | ||||
|                 insns_out[fetch_index].data, | ||||
|                 HdlOption::map(insn_out, |insn_out| { | ||||
|                     #[hdl] | ||||
|                     RenamedInsnData::<_, _, _> { | ||||
|                         retire_queue_index: retire_queue_indexes[fetch_index], | ||||
|                         pc, | ||||
|                         dest: renamed_dest, | ||||
|                         mop: insn_out, | ||||
|                     } | ||||
|                 }), | ||||
|             ); | ||||
|         }, | ||||
|     ); | ||||
| } | ||||
|  | @ -2,7 +2,10 @@ | |||
| // See Notices.txt for copyright information
 | ||||
| pub mod config; | ||||
| pub mod instruction; | ||||
| pub mod instruction_rename; | ||||
| pub mod reg_alloc; | ||||
| pub mod register; | ||||
| pub mod rename_table; | ||||
| pub mod retire_queue; | ||||
| pub mod unit; | ||||
| pub mod util; | ||||
|  |  | |||
|  | @ -3,17 +3,17 @@ | |||
| use crate::{ | ||||
|     config::CpuConfig, | ||||
|     instruction::{ | ||||
|         MOp, MOpDestReg, MOpRegNum, MOpTrait, MoveRegMOp, PRegNum, RenameTableName, UnitOutRegNum, | ||||
|         MOp, MOpDestReg, MOpRegNum, MOpTrait, MoveRegMOp, PRegNum, UnitOutRegNum, | ||||
|         COMMON_MOP_SRC_LEN, | ||||
|     }, | ||||
|     unit::{ | ||||
|         unit_base::{UnitForwardingInfo, UnitInput}, | ||||
|         GlobalState, TrapData, UnitMOp, UnitOutput, UnitOutputWrite, UnitResult, | ||||
|         UnitResultCompleted, UnitTrait, | ||||
|     }, | ||||
|     util::tree_reduce::tree_reduce_with_state, | ||||
|     util::array_vec::ReadyValidArray, | ||||
| }; | ||||
| use fayalite::{ | ||||
|     int::BoolOrIntType, | ||||
|     memory::{splat_mask, WriteStruct}, | ||||
|     module::{instance_with_loc, memory_with_loc, wire_with_loc}, | ||||
|     prelude::*, | ||||
|  | @ -44,150 +44,12 @@ pub enum FetchDecodeSpecialOp { | |||
| 
 | ||||
| #[hdl] | ||||
| pub struct FetchDecodeInterface<FetchWidth: Size> { | ||||
|     pub decoded_insns: ArrayType<ReadyValid<FetchedDecodedMOp>, FetchWidth>, | ||||
|     pub decoded_insns: ReadyValidArray<FetchedDecodedMOp, FetchWidth>, | ||||
|     #[hdl(flip)] | ||||
|     pub fetch_decode_special_op: ReadyValid<FetchDecodeSpecialOp>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| struct ROBRenamedInsn<UnitNumWidth: Size, OutRegNumWidth: Size> { | ||||
|     mop_dest: MOpDestReg, | ||||
|     p_dest: PRegNum<UnitNumWidth, OutRegNumWidth>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| struct ROBEntry<UnitNumWidth: Size, OutRegNumWidth: Size> { | ||||
|     renamed_insn: ROBRenamedInsn<UnitNumWidth, OutRegNumWidth>, | ||||
|     dest_written: Bool, | ||||
| } | ||||
| 
 | ||||
| #[hdl_module] | ||||
| fn rob(config: &CpuConfig) { | ||||
|     #[hdl] | ||||
|     let cd: ClockDomain = m.input(); | ||||
|     #[hdl] | ||||
|     let renamed_insns_in: Array<ReadyValid<ROBRenamedInsn<DynSize, DynSize>>> = m.input( | ||||
|         Array[ReadyValid[ROBRenamedInsn[config.unit_num_width()][config.out_reg_num_width]]] | ||||
|             [config.fetch_width.get()], | ||||
|     ); | ||||
|     #[hdl] | ||||
|     let unit_forwarding_info: UnitForwardingInfo<DynSize, DynSize, DynSize> = | ||||
|         m.input(config.unit_forwarding_info()); | ||||
| 
 | ||||
|     let rob_entry_ty = ROBEntry[config.unit_num_width()][config.out_reg_num_width]; | ||||
|     #[hdl] | ||||
|     let rob = reg_builder() | ||||
|         .clock_domain(cd) | ||||
|         .no_reset(Array[rob_entry_ty][config.rob_size.get()]); | ||||
|     #[hdl] | ||||
|     let rob_valid_start = reg_builder() | ||||
|         .clock_domain(cd) | ||||
|         .reset(UInt::range(0..config.rob_size.get()).zero()); | ||||
|     #[hdl] | ||||
|     let rob_valid_end = reg_builder() | ||||
|         .clock_domain(cd) | ||||
|         .reset(UInt::range(0..config.rob_size.get()).zero()); | ||||
|     #[hdl] | ||||
|     let free_space = wire(UInt::range_inclusive(0..=config.rob_size.get())); | ||||
|     #[hdl] | ||||
|     if rob_valid_end.cmp_lt(rob_valid_start) { | ||||
|         // rob_valid_end wrapped around but start didn't
 | ||||
|         connect_any( | ||||
|             free_space, | ||||
|             rob_valid_end + config.rob_size.get() - rob_valid_start, | ||||
|         ); | ||||
|     } else { | ||||
|         connect_any(free_space, rob_valid_end - rob_valid_start); | ||||
|     } | ||||
| 
 | ||||
|     struct IndexAndRange { | ||||
|         index: Expr<UInt>, | ||||
|         range: std::ops::Range<usize>, | ||||
|     } | ||||
| 
 | ||||
|     let mut next_write_index = IndexAndRange { | ||||
|         index: rob_valid_end, | ||||
|         range: 0..config.rob_size.get(), | ||||
|     }; | ||||
|     for fetch_index in 0..config.fetch_width.get() { | ||||
|         let write_index = next_write_index; | ||||
|         let next_write_index_range = write_index.range.start..write_index.range.end + 1; | ||||
|         next_write_index = IndexAndRange { | ||||
|             index: wire_with_loc( | ||||
|                 &format!("next_write_index_{fetch_index}"), | ||||
|                 SourceLocation::caller(), | ||||
|                 UInt::range(next_write_index_range.clone()), | ||||
|             ), | ||||
|             range: next_write_index_range, | ||||
|         }; | ||||
|         connect( | ||||
|             renamed_insns_in[fetch_index].ready, | ||||
|             fetch_index.cmp_lt(free_space), | ||||
|         ); | ||||
|         #[hdl] | ||||
|         if let HdlSome(renamed_insn) = ReadyValid::firing_data(renamed_insns_in[fetch_index]) { | ||||
|             for i in write_index.range.clone() { | ||||
|                 #[hdl] | ||||
|                 if write_index.index.cmp_eq(i) { | ||||
|                     connect( | ||||
|                         rob[i % config.rob_size.get()], | ||||
|                         #[hdl] | ||||
|                         ROBEntry { | ||||
|                             renamed_insn, | ||||
|                             dest_written: false, | ||||
|                         }, | ||||
|                     ); | ||||
|                 } | ||||
|             } | ||||
|         } | ||||
|         // TODO: optimize write_index chain better
 | ||||
|         connect_any( | ||||
|             next_write_index.index, | ||||
|             write_index.index | ||||
|                 + ReadyValid::firing(renamed_insns_in[fetch_index]).cast_to_static::<UInt<1>>(), | ||||
|         ); | ||||
|     } | ||||
|     assert!( | ||||
|         config.rob_size >= config.fetch_width, | ||||
|         "rob_size ({}) is too small for fetch_width = {} -- next_write_index would overflow", | ||||
|         config.rob_size, | ||||
|         config.fetch_width, | ||||
|     ); | ||||
|     #[hdl] | ||||
|     if next_write_index.index.cmp_lt(config.rob_size.get()) { | ||||
|         connect_any(rob_valid_end, next_write_index.index); | ||||
|     } else { | ||||
|         connect_any( | ||||
|             rob_valid_end, | ||||
|             next_write_index.index - config.rob_size.get(), | ||||
|         ); | ||||
|     } | ||||
| 
 | ||||
|     // TODO: optimize better, O(rob_size * unit_count) is too big here
 | ||||
|     for rob_index in 0..config.rob_size.get() { | ||||
|         for unit_index in 0..config.non_const_unit_nums().len() { | ||||
|             #[hdl] | ||||
|             if let HdlSome(unit_output_write) = unit_forwarding_info.unit_output_writes[unit_index] | ||||
|             { | ||||
|                 #[hdl] | ||||
|                 let UnitOutputWrite::<_> { | ||||
|                     which: unit_out_reg, | ||||
|                     value: _, | ||||
|                 } = unit_output_write; | ||||
|                 let p_reg_num = #[hdl] | ||||
|                 PRegNum::<_, _> { | ||||
|                     unit_num: config.unit_num().from_index(unit_index), | ||||
|                     unit_out_reg, | ||||
|                 }; | ||||
|                 #[hdl] | ||||
|                 if rob[rob_index].renamed_insn.p_dest.cmp_eq(p_reg_num) { | ||||
|                     connect(rob[rob_index].dest_written, true); | ||||
|                 } | ||||
|             } | ||||
|         } | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[cfg(todo)] | ||||
| #[hdl_module] | ||||
| /// combination register allocator, register renaming, unit selection, and retire handling
 | ||||
| pub fn reg_alloc(config: &CpuConfig) { | ||||
|  | @ -205,10 +67,6 @@ pub fn reg_alloc(config: &CpuConfig) { | |||
|     ); | ||||
|     // TODO: finish
 | ||||
| 
 | ||||
|     #[hdl] | ||||
|     let rob = instance(rob(config)); | ||||
|     connect(rob.cd, cd); | ||||
| 
 | ||||
|     let mut rename_table_mems = BTreeMap::<RenameTableName, MemBuilder<_>>::new(); | ||||
| 
 | ||||
|     for reg_kind in MOpDestReg::REG_KINDS { | ||||
|  | @ -238,11 +96,6 @@ pub fn reg_alloc(config: &CpuConfig) { | |||
|     #[hdl] | ||||
|     let renamed_mops_out_reg = wire(Array[HdlOption[config.p_reg_num()]][config.fetch_width.get()]); | ||||
|     for fetch_index in 0..config.fetch_width.get() { | ||||
|         // TODO: finish
 | ||||
|         connect( | ||||
|             rob.renamed_insns_in[fetch_index].data, | ||||
|             Expr::ty(rob).renamed_insns_in.element().data.HdlNone(), | ||||
|         ); | ||||
|         // TODO: finish
 | ||||
|         connect( | ||||
|             fetch_decode_interface.decoded_insns[fetch_index].ready, | ||||
|  | @ -483,7 +336,6 @@ pub fn reg_alloc(config: &CpuConfig) { | |||
|     ); | ||||
|     #[hdl] | ||||
|     let unit_forwarding_info = wire(config.unit_forwarding_info()); | ||||
|     connect(rob.unit_forwarding_info, unit_forwarding_info); | ||||
|     for (unit_index, unit_config) in config.units.iter().enumerate() { | ||||
|         let dyn_unit = unit_config.kind.unit(config, unit_index); | ||||
|         let unit = instance_with_loc( | ||||
|  |  | |||
|  | @ -1,7 +1,10 @@ | |||
| // SPDX-License-Identifier: LGPL-3.0-or-later
 | ||||
| // See Notices.txt for copyright information
 | ||||
| use crate::util::tree_reduce::tree_reduce; | ||||
| use fayalite::{module::wire_with_loc, prelude::*, util::ready_valid::ReadyValid}; | ||||
| use fayalite::{ | ||||
|     module::wire_with_loc, | ||||
|     prelude::*, | ||||
|     util::{prefix_sum::reduce, ready_valid::ReadyValid}, | ||||
| }; | ||||
| use std::{num::NonZeroUsize, ops::Range}; | ||||
| 
 | ||||
| #[hdl_module] | ||||
|  | @ -44,7 +47,7 @@ pub fn unit_free_regs_tracker( | |||
|         count, | ||||
|         count_overflowed, | ||||
|         alloc_nums, | ||||
|     }) = tree_reduce( | ||||
|     }) = reduce( | ||||
|         (0..reg_count).map(|index| Summary { | ||||
|             range: index..index + 1, | ||||
|             count: (!allocated_reg[index]) | ||||
|  |  | |||
							
								
								
									
										187
									
								
								crates/cpu/src/rename_table.rs
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										187
									
								
								crates/cpu/src/rename_table.rs
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,187 @@ | |||
| // SPDX-License-Identifier: LGPL-3.0-or-later
 | ||||
| // See Notices.txt for copyright information
 | ||||
| 
 | ||||
| use crate::{ | ||||
|     config::CpuConfig, | ||||
|     instruction::{MOpRegNum, PRegNum}, | ||||
|     util::range_intersection, | ||||
| }; | ||||
| use fayalite::{ | ||||
|     memory::{splat_mask, ReadStruct, WriteStruct}, | ||||
|     module::memory_with_loc, | ||||
|     prelude::*, | ||||
| }; | ||||
| use std::{mem, ops::Range}; | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct RenameTableReadPort<UnitNumWidth: Size, OutRegNumWidth: Size> { | ||||
|     pub addr: MOpRegNum, | ||||
|     #[hdl(flip)] | ||||
|     pub data: PRegNum<UnitNumWidth, OutRegNumWidth>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct RenameTableWritePort<UnitNumWidth: Size, OutRegNumWidth: Size> { | ||||
|     pub addr: MOpRegNum, | ||||
|     pub data: PRegNum<UnitNumWidth, OutRegNumWidth>, | ||||
| } | ||||
| 
 | ||||
| #[derive(Clone, Debug)] | ||||
| pub enum RenameTablePortConfig { | ||||
|     Read { addr_range: Range<u32> }, | ||||
|     Write { addr_range: Range<u32> }, | ||||
| } | ||||
| 
 | ||||
| /// register rename table.
 | ||||
| /// all read/write operations are done in the order of `port_configs`.
 | ||||
| /// So if `port_configs[0]` is a write and `port_configs[1]` is a read,
 | ||||
| /// then the read port will combinatorially return data written by the
 | ||||
| /// write port in the *same* clock cycle. However, if `port_configs[0]`
 | ||||
| /// is a read and `port_configs[1]` is a write, then the read port will
 | ||||
| /// not see the data written by the write port until the *next* clock cycle.
 | ||||
| #[hdl_module] | ||||
| pub fn rename_table(config: &CpuConfig, port_configs: &[RenameTablePortConfig]) { | ||||
|     let read_count = port_configs | ||||
|         .iter() | ||||
|         .filter(|v| matches!(v, RenameTablePortConfig::Read { .. })) | ||||
|         .count(); | ||||
|     let write_count = port_configs | ||||
|         .iter() | ||||
|         .filter(|v| matches!(v, RenameTablePortConfig::Write { .. })) | ||||
|         .count(); | ||||
| 
 | ||||
|     #[hdl] | ||||
|     let cd: ClockDomain = m.input(); | ||||
|     #[hdl] | ||||
|     let read_ports: Array<RenameTableReadPort<DynSize, DynSize>> = m.input( | ||||
|         Array[RenameTableReadPort[config.unit_num_width()][config.out_reg_num_width]][read_count], | ||||
|     ); | ||||
|     #[hdl] | ||||
|     let write_ports: Array<RenameTableWritePort<DynSize, DynSize>> = m.input( | ||||
|         Array[RenameTableWritePort[config.unit_num_width()][config.out_reg_num_width]][write_count], | ||||
|     ); | ||||
| 
 | ||||
|     for read_port in read_ports { | ||||
|         connect(read_port.data, config.p_reg_num().const_zero()); | ||||
|     } | ||||
| 
 | ||||
|     let port_configs_and_indexes = port_configs.iter().scan( | ||||
|         (0usize, 0), | ||||
|         |(read_port_index, write_port_index), port_config| { | ||||
|             Some(( | ||||
|                 port_config, | ||||
|                 match port_config { | ||||
|                     RenameTablePortConfig::Read { .. } => { | ||||
|                         mem::replace(read_port_index, *read_port_index + 1) | ||||
|                     } | ||||
|                     RenameTablePortConfig::Write { .. } => { | ||||
|                         mem::replace(write_port_index, *write_port_index + 1) | ||||
|                     } | ||||
|                 }, | ||||
|             )) | ||||
|         }, | ||||
|     ); | ||||
| 
 | ||||
|     let mut range_transitions = Vec::with_capacity(port_configs.len() * 2); | ||||
|     for port_config in port_configs { | ||||
|         let (RenameTablePortConfig::Read { addr_range } | ||||
|         | RenameTablePortConfig::Write { addr_range }) = port_config; | ||||
|         range_transitions.push(addr_range.start); | ||||
|         range_transitions.push(addr_range.end); | ||||
|     } | ||||
|     range_transitions.sort_unstable(); | ||||
|     range_transitions.dedup(); | ||||
|     let mut last_range_transition = None; | ||||
|     for range_transition in range_transitions { | ||||
|         let Some(last_range_transition) = last_range_transition.replace(range_transition) else { | ||||
|             continue; | ||||
|         }; | ||||
|         let cur_addr_range = last_range_transition..range_transition; | ||||
|         let mut mem = memory_with_loc( | ||||
|             &if cur_addr_range.len() == 1 { | ||||
|                 format!("mem_{:#x}", cur_addr_range.start) | ||||
|             } else { | ||||
|                 format!("mem_{:#x}_{:#x}", cur_addr_range.start, cur_addr_range.end) | ||||
|             }, | ||||
|             config.p_reg_num(), | ||||
|             SourceLocation::caller(), | ||||
|         ); | ||||
|         mem.depth(cur_addr_range.len()); | ||||
|         let addr_in_range = |addr: Expr<MOpRegNum>| { | ||||
|             if cur_addr_range.len() == 1 { | ||||
|                 addr.value.cmp_eq(cur_addr_range.start) | ||||
|             } else { | ||||
|                 addr.value.cmp_ge(cur_addr_range.start) & addr.value.cmp_lt(cur_addr_range.end) | ||||
|             } | ||||
|         }; | ||||
|         for (port_config, port_index) in port_configs_and_indexes.clone() { | ||||
|             match port_config { | ||||
|                 RenameTablePortConfig::Read { addr_range } => { | ||||
|                     if range_intersection(&addr_range, &cur_addr_range).is_none() { | ||||
|                         continue; | ||||
|                     } | ||||
|                     let port = read_ports[port_index]; | ||||
|                     #[hdl] | ||||
|                     let ReadStruct::<_, _> { | ||||
|                         addr, | ||||
|                         en, | ||||
|                         clk, | ||||
|                         data, | ||||
|                     } = mem.new_read_port(); | ||||
|                     connect_any(addr, port.addr.value - cur_addr_range.start); | ||||
|                     connect(en, addr_in_range(port.addr)); | ||||
|                     connect(clk, cd.clk); | ||||
|                     #[hdl] | ||||
|                     if en { | ||||
|                         connect(port.data, data); | ||||
|                     } | ||||
|                 } | ||||
|                 RenameTablePortConfig::Write { addr_range } => { | ||||
|                     if range_intersection(&addr_range, &cur_addr_range).is_none() { | ||||
|                         continue; | ||||
|                     } | ||||
|                     let port = write_ports[port_index]; | ||||
|                     #[hdl] | ||||
|                     let WriteStruct::<_, _> { | ||||
|                         addr, | ||||
|                         en, | ||||
|                         clk, | ||||
|                         data, | ||||
|                         mask, | ||||
|                     } = mem.new_write_port(); | ||||
|                     connect_any(addr, port.addr.value - cur_addr_range.start); | ||||
|                     connect(en, addr_in_range(port.addr)); | ||||
|                     connect(clk, cd.clk); | ||||
|                     connect(data, port.data); | ||||
|                     connect(mask, splat_mask(Expr::ty(port).data, true.to_expr())); | ||||
|                 } | ||||
|             } | ||||
|         } | ||||
|     } | ||||
|     for (port_config_index, (port_config, port_index)) in | ||||
|         port_configs_and_indexes.clone().enumerate() | ||||
|     { | ||||
|         let RenameTablePortConfig::Read { addr_range } = port_config else { | ||||
|             continue; | ||||
|         }; | ||||
|         let port = read_ports[port_index]; | ||||
|         for (prev_port_config, prev_port_index) in | ||||
|             port_configs_and_indexes.clone().take(port_config_index) | ||||
|         { | ||||
|             let RenameTablePortConfig::Write { | ||||
|                 addr_range: prev_addr_range, | ||||
|             } = prev_port_config | ||||
|             else { | ||||
|                 continue; | ||||
|             }; | ||||
|             if range_intersection(addr_range, prev_addr_range).is_none() { | ||||
|                 continue; | ||||
|             } | ||||
|             let prev_port = write_ports[prev_port_index]; | ||||
|             #[hdl] | ||||
|             if prev_port.addr.cmp_eq(port.addr) { | ||||
|                 connect(port.data, prev_port.data); | ||||
|             } | ||||
|         } | ||||
|     } | ||||
| } | ||||
							
								
								
									
										12
									
								
								crates/cpu/src/retire_queue.rs
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										12
									
								
								crates/cpu/src/retire_queue.rs
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,12 @@ | |||
| // SPDX-License-Identifier: LGPL-3.0-or-later
 | ||||
| // See Notices.txt for copyright information
 | ||||
| 
 | ||||
| use crate::config::CpuConfig; | ||||
| use fayalite::prelude::*; | ||||
| 
 | ||||
| #[hdl_module] | ||||
| pub fn retire_queue(config: &CpuConfig) { | ||||
|     #[hdl] | ||||
|     let cd: ClockDomain = m.input(); | ||||
|     todo!(); | ||||
| } | ||||
|  | @ -8,13 +8,15 @@ use crate::{ | |||
|         RenamedMOp, UnitOutRegNum, | ||||
|     }, | ||||
|     register::{FlagsMode, PRegValue}, | ||||
|     unit::unit_base::UnitToRegAlloc, | ||||
| }; | ||||
| use fayalite::{ | ||||
|     bundle::{Bundle, BundleType}, | ||||
|     int::BoolOrIntType, | ||||
|     intern::{Intern, Interned}, | ||||
|     prelude::*, | ||||
|     util::ready_valid::ReadyValid, | ||||
| }; | ||||
| use std::marker::PhantomData; | ||||
| 
 | ||||
| pub mod alu_branch; | ||||
| pub mod unit_base; | ||||
|  | @ -204,23 +206,28 @@ macro_rules! all_units { | |||
|             })* | ||||
|         }; | ||||
| 
 | ||||
|         $(impl<$DestReg: Type, $SrcRegWidth: Size> MOpInto<RenamedMOp<$DestReg, $SrcRegWidth>> for $BeforeOp { | ||||
|             fn mop_into_ty(self) -> RenamedMOp<$DestReg, $SrcRegWidth> { | ||||
|                 RenamedMOp[MOpTrait::dest_reg_ty(self)][MOpTrait::src_reg_width(self)] | ||||
|             } | ||||
|             fn mop_into(this: Expr<Self>) -> Expr<RenamedMOp<$DestReg, $SrcRegWidth>> { | ||||
|                 MOpInto::<RenamedMOp<$DestReg, $SrcRegWidth>>::mop_into_ty(Expr::ty(this)).$BeforeUnit(this) | ||||
|             } | ||||
|         })* | ||||
|         const _: () = { | ||||
|             #[hdl] | ||||
|             type $DestReg = (); | ||||
| 
 | ||||
|         $(impl<$DestReg: Type, $SrcRegWidth: Size> MOpInto<RenamedMOp<$DestReg, $SrcRegWidth>> for $AfterOp { | ||||
|             fn mop_into_ty(self) -> RenamedMOp<$DestReg, $SrcRegWidth> { | ||||
|                 RenamedMOp[MOpTrait::dest_reg_ty(self)][MOpTrait::src_reg_width(self)] | ||||
|             } | ||||
|             fn mop_into(this: Expr<Self>) -> Expr<RenamedMOp<$DestReg, $SrcRegWidth>> { | ||||
|                 MOpInto::<RenamedMOp<$DestReg, $SrcRegWidth>>::mop_into_ty(Expr::ty(this)).$AfterUnit(this) | ||||
|             } | ||||
|         })* | ||||
|             $(impl<$SrcRegWidth: Size> MOpInto<RenamedMOp<$SrcRegWidth>> for $BeforeOp { | ||||
|                 fn mop_into_ty(self) -> RenamedMOp<$SrcRegWidth> { | ||||
|                     RenamedMOp[MOpTrait::src_reg_width(self)] | ||||
|                 } | ||||
|                 fn mop_into(this: Expr<Self>) -> Expr<RenamedMOp<$SrcRegWidth>> { | ||||
|                     MOpInto::<RenamedMOp<$SrcRegWidth>>::mop_into_ty(Expr::ty(this)).$BeforeUnit(this) | ||||
|                 } | ||||
|             })* | ||||
| 
 | ||||
|             $(impl<$SrcRegWidth: Size> MOpInto<RenamedMOp<$SrcRegWidth>> for $AfterOp { | ||||
|                 fn mop_into_ty(self) -> RenamedMOp<$SrcRegWidth> { | ||||
|                     RenamedMOp[MOpTrait::src_reg_width(self)] | ||||
|                 } | ||||
|                 fn mop_into(this: Expr<Self>) -> Expr<RenamedMOp<$SrcRegWidth>> { | ||||
|                     MOpInto::<RenamedMOp<$SrcRegWidth>>::mop_into_ty(Expr::ty(this)).$AfterUnit(this) | ||||
|                 } | ||||
|             })* | ||||
|         }; | ||||
|     }; | ||||
| } | ||||
| 
 | ||||
|  | @ -253,6 +260,80 @@ pub struct GlobalState { | |||
|     pub flags_mode: FlagsMode, | ||||
| } | ||||
| 
 | ||||
| /// index into the retire queue (the queue of instructions that haven't yet retired)
 | ||||
| #[hdl(cmp_eq)] | ||||
| pub struct RetireQueueIndex<Width: Size> { | ||||
|     /// increases by one for each instruction added to the retire queue.
 | ||||
|     ///
 | ||||
|     /// this wraps around, so you must not compare it using `cmp_lt`/`cmp_gt`
 | ||||
|     /// but instead must use [`Self::insns_until`] and compare the output with zero.
 | ||||
|     pub index: UIntType<Width>, | ||||
| } | ||||
| 
 | ||||
| impl<Width: Size> RetireQueueIndex<Width> { | ||||
|     pub fn insns_until( | ||||
|         this: impl ToExpr<Type = Self>, | ||||
|         target: impl ToExpr<Type = Self>, | ||||
|     ) -> Expr<SIntType<Width>> { | ||||
|         let this = this.to_expr(); | ||||
|         let target = target.to_expr(); | ||||
|         assert_eq!(Expr::ty(this), Expr::ty(target)); | ||||
|         (this.index - target.index).cast_to(Expr::ty(this).index.as_same_width_sint()) | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct RenamedInsnData<MOp, DestReg, RetireQueueIndexWidth: Size> { | ||||
|     pub retire_queue_index: RetireQueueIndex<RetireQueueIndexWidth>, | ||||
|     pub pc: UInt<64>, | ||||
|     pub dest: DestReg, | ||||
|     pub mop: MOp, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct UnitForwardingInfo<UnitNumWidth: Size, OutRegNumWidth: Size, UnitCount: Size> { | ||||
|     pub unit_output_writes: ArrayType<HdlOption<UnitOutputWrite<OutRegNumWidth>>, UnitCount>, | ||||
|     pub unit_reg_frees: ArrayType<HdlOption<UnitOutRegNum<OutRegNumWidth>>, UnitCount>, | ||||
|     pub _phantom: PhantomData<UnitNumWidth>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct UnitToRegAlloc< | ||||
|     MOp: Type, | ||||
|     ExtraOut: Type, | ||||
|     UnitNumWidth: Size, | ||||
|     OutRegNumWidth: Size, | ||||
|     UnitCount: Size, | ||||
|     RetireQueueIndexWidth: Size, | ||||
| > { | ||||
|     #[hdl(flip)] | ||||
|     pub unit_forwarding_info: UnitForwardingInfo<UnitNumWidth, OutRegNumWidth, UnitCount>, | ||||
|     #[hdl(flip)] | ||||
|     pub input: | ||||
|         ReadyValid<RenamedInsnData<MOp, UnitOutRegNum<OutRegNumWidth>, RetireQueueIndexWidth>>, | ||||
|     #[hdl(flip)] | ||||
|     pub cancel_input: HdlOption<UnitCancelInput<OutRegNumWidth>>, | ||||
|     pub output: HdlOption<UnitOutput<OutRegNumWidth, RetireQueueIndexWidth, ExtraOut>>, | ||||
| } | ||||
| 
 | ||||
| impl< | ||||
|         MOp: Type, | ||||
|         ExtraOut: Type, | ||||
|         UnitNumWidth: Size, | ||||
|         OutRegNumWidth: Size, | ||||
|         UnitCount: Size, | ||||
|         RetireQueueIndexWidth: Size, | ||||
|     > | ||||
|     UnitToRegAlloc<MOp, ExtraOut, UnitNumWidth, OutRegNumWidth, UnitCount, RetireQueueIndexWidth> | ||||
| { | ||||
|     pub fn mop_ty(self) -> MOp { | ||||
|         self.input.data.HdlSome.mop | ||||
|     } | ||||
|     pub fn extra_out_ty(self) -> ExtraOut { | ||||
|         self.output.HdlSome.extra_out_ty() | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[hdl(cmp_eq)] | ||||
| pub struct UnitResultCompleted<ExtraOut> { | ||||
|     pub value: PRegValue, | ||||
|  | @ -261,7 +342,7 @@ pub struct UnitResultCompleted<ExtraOut> { | |||
| 
 | ||||
| #[hdl(cmp_eq)] | ||||
| pub struct UnitOutputWrite<OutRegNumWidth: Size> { | ||||
|     pub which: UnitOutRegNum<OutRegNumWidth>, | ||||
|     pub dest: UnitOutRegNum<OutRegNumWidth>, | ||||
|     pub value: PRegValue, | ||||
| } | ||||
| 
 | ||||
|  | @ -283,20 +364,32 @@ impl<ExtraOut: Type> UnitResult<ExtraOut> { | |||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct UnitOutput<OutRegNumWidth: Size, ExtraOut> { | ||||
|     pub which: UnitOutRegNum<OutRegNumWidth>, | ||||
| pub struct UnitOutput<OutRegNumWidth: Size, RetireQueueIndexWidth: Size, ExtraOut> { | ||||
|     pub dest: UnitOutRegNum<OutRegNumWidth>, | ||||
|     pub retire_queue_index: RetireQueueIndex<RetireQueueIndexWidth>, | ||||
|     pub result: UnitResult<ExtraOut>, | ||||
| } | ||||
| 
 | ||||
| impl<OutRegNumWidth: Size, ExtraOut: Type> UnitOutput<OutRegNumWidth, ExtraOut> { | ||||
| impl<OutRegNumWidth: Size, RetireQueueIndexWidth: Size, ExtraOut: Type> | ||||
|     UnitOutput<OutRegNumWidth, RetireQueueIndexWidth, ExtraOut> | ||||
| { | ||||
|     pub fn extra_out_ty(self) -> ExtraOut { | ||||
|         self.result.extra_out_ty() | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[hdl(cmp_eq)] | ||||
| pub struct UnitCancelInput<OutRegNumWidth: Size> { | ||||
|     pub which: UnitOutRegNum<OutRegNumWidth>, | ||||
| pub struct UnitCancelInput<RetireQueueIndexWidth: Size> { | ||||
|     pub target: RetireQueueIndex<RetireQueueIndexWidth>, | ||||
| } | ||||
| 
 | ||||
| impl<RetireQueueIndexWidth: Size> UnitCancelInput<RetireQueueIndexWidth> { | ||||
|     pub fn is_canceled( | ||||
|         this: impl ToExpr<Type = Self>, | ||||
|         insn_retire_queue_index: impl ToExpr<Type = RetireQueueIndex<RetireQueueIndexWidth>>, | ||||
|     ) -> Expr<Bool> { | ||||
|         RetireQueueIndex::insns_until(insn_retire_queue_index, this.to_expr().target).cmp_ge(0i8) | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| pub trait UnitTrait: | ||||
|  | @ -312,17 +405,14 @@ pub trait UnitTrait: | |||
| 
 | ||||
|     fn unit_kind(&self) -> UnitKind; | ||||
| 
 | ||||
|     fn extract_mop( | ||||
|         &self, | ||||
|         mop: Expr<RenamedMOp<UnitOutRegNum<DynSize>, DynSize>>, | ||||
|     ) -> Expr<HdlOption<Self::MOp>>; | ||||
|     fn extract_mop(&self, mop: Expr<RenamedMOp<DynSize>>) -> Expr<HdlOption<Self::MOp>>; | ||||
| 
 | ||||
|     fn module(&self) -> Interned<Module<Self::Type>>; | ||||
| 
 | ||||
|     fn unit_to_reg_alloc( | ||||
|         &self, | ||||
|         this: Expr<Self::Type>, | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize>>; | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize, DynSize>>; | ||||
| 
 | ||||
|     fn cd(&self, this: Expr<Self::Type>) -> Expr<ClockDomain>; | ||||
| 
 | ||||
|  | @ -370,10 +460,7 @@ impl UnitTrait for DynUnit { | |||
|         self.unit_kind | ||||
|     } | ||||
| 
 | ||||
|     fn extract_mop( | ||||
|         &self, | ||||
|         mop: Expr<RenamedMOp<UnitOutRegNum<DynSize>, DynSize>>, | ||||
|     ) -> Expr<HdlOption<Self::MOp>> { | ||||
|     fn extract_mop(&self, mop: Expr<RenamedMOp<DynSize>>) -> Expr<HdlOption<Self::MOp>> { | ||||
|         self.unit.extract_mop(mop) | ||||
|     } | ||||
| 
 | ||||
|  | @ -384,7 +471,7 @@ impl UnitTrait for DynUnit { | |||
|     fn unit_to_reg_alloc( | ||||
|         &self, | ||||
|         this: Expr<Self::Type>, | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize>> { | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize, DynSize>> { | ||||
|         self.unit.unit_to_reg_alloc(this) | ||||
|     } | ||||
| 
 | ||||
|  | @ -425,10 +512,7 @@ impl<T: UnitTrait + Clone + std::hash::Hash + Eq> UnitTrait for DynUnitWrapper<T | |||
|         self.0.unit_kind() | ||||
|     } | ||||
| 
 | ||||
|     fn extract_mop( | ||||
|         &self, | ||||
|         mop: Expr<RenamedMOp<UnitOutRegNum<DynSize>, DynSize>>, | ||||
|     ) -> Expr<HdlOption<Self::MOp>> { | ||||
|     fn extract_mop(&self, mop: Expr<RenamedMOp<DynSize>>) -> Expr<HdlOption<Self::MOp>> { | ||||
|         Expr::from_enum(Expr::as_enum(self.0.extract_mop(mop))) | ||||
|     } | ||||
| 
 | ||||
|  | @ -439,7 +523,7 @@ impl<T: UnitTrait + Clone + std::hash::Hash + Eq> UnitTrait for DynUnitWrapper<T | |||
|     fn unit_to_reg_alloc( | ||||
|         &self, | ||||
|         this: Expr<Self::Type>, | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize>> { | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize, DynSize>> { | ||||
|         Expr::from_bundle(Expr::as_bundle( | ||||
|             self.0.unit_to_reg_alloc(Expr::from_bundle(this)), | ||||
|         )) | ||||
|  |  | |||
|  | @ -4,14 +4,14 @@ | |||
| use crate::{ | ||||
|     config::CpuConfig, | ||||
|     instruction::{ | ||||
|         AddSubMOp, AluBranchMOp, AluCommonMOp, CommonMOp, LogicalMOp, MOpTrait, OutputIntegerMode, | ||||
|         RenamedMOp, UnitOutRegNum, COMMON_MOP_SRC_LEN, | ||||
|         AddSubMOp, AluBranchMOp, AluCommonMOp, CommonMOp, LogicalMOp, OutputIntegerMode, | ||||
|         RenamedMOp, COMMON_MOP_SRC_LEN, | ||||
|     }, | ||||
|     register::{FlagsMode, PRegFlagsPowerISA, PRegFlagsX86, PRegValue}, | ||||
|     unit::{ | ||||
|         unit_base::{unit_base, ExecuteEnd, ExecuteStart, UnitToRegAlloc}, | ||||
|         unit_base::{unit_base, ExecuteEnd, ExecuteStart}, | ||||
|         DynUnit, DynUnitWrapper, GlobalState, UnitKind, UnitMOp, UnitOutput, UnitResult, | ||||
|         UnitResultCompleted, UnitTrait, | ||||
|         UnitResultCompleted, UnitToRegAlloc, UnitTrait, | ||||
|     }, | ||||
| }; | ||||
| use fayalite::{ | ||||
|  | @ -24,7 +24,7 @@ use std::{collections::HashMap, ops::RangeTo}; | |||
| 
 | ||||
| #[hdl] | ||||
| fn add_sub<SrcCount: KnownSize>( | ||||
|     mop: Expr<AddSubMOp<UnitOutRegNum<DynSize>, DynSize, SrcCount>>, | ||||
|     mop: Expr<AddSubMOp<(), DynSize, SrcCount>>, | ||||
|     pc: Expr<UInt<64>>, | ||||
|     flags_mode: Expr<FlagsMode>, | ||||
|     src_values: Expr<Array<PRegValue, { COMMON_MOP_SRC_LEN }>>, | ||||
|  | @ -232,7 +232,7 @@ fn add_sub<SrcCount: KnownSize>( | |||
| 
 | ||||
| #[hdl] | ||||
| fn logical( | ||||
|     mop: Expr<LogicalMOp<UnitOutRegNum<DynSize>, DynSize>>, | ||||
|     mop: Expr<LogicalMOp<(), DynSize>>, | ||||
|     flags_mode: Expr<FlagsMode>, | ||||
|     src_values: Expr<Array<PRegValue, { COMMON_MOP_SRC_LEN }>>, | ||||
| ) -> Expr<UnitResultCompleted<()>> { | ||||
|  | @ -250,15 +250,13 @@ pub fn alu_branch(config: &CpuConfig, unit_index: usize) { | |||
|     let cd: ClockDomain = m.input(); | ||||
|     #[hdl] | ||||
|     let unit_to_reg_alloc: UnitToRegAlloc< | ||||
|         AluBranchMOp<UnitOutRegNum<DynSize>, DynSize>, | ||||
|         AluBranchMOp<(), DynSize>, | ||||
|         (), | ||||
|         DynSize, | ||||
|         DynSize, | ||||
|         DynSize, | ||||
|     > = m.output(config.unit_to_reg_alloc( | ||||
|         AluBranchMOp[config.unit_out_reg_num()][config.p_reg_num_width()], | ||||
|         (), | ||||
|     )); | ||||
|         DynSize, | ||||
|     > = m.output(config.unit_to_reg_alloc(AluBranchMOp[()][config.p_reg_num_width()], ())); | ||||
|     #[hdl] | ||||
|     let global_state: GlobalState = m.input(); | ||||
| 
 | ||||
|  | @ -279,24 +277,21 @@ pub fn alu_branch(config: &CpuConfig, unit_index: usize) { | |||
|     #[hdl] | ||||
|     if let HdlSome(execute_start) = ReadyValid::firing_data(unit_base.execute_start) { | ||||
|         #[hdl] | ||||
|         let ExecuteStart::<_> { | ||||
|             mop, | ||||
|             pc, | ||||
|             src_values, | ||||
|         } = execute_start; | ||||
|         let ExecuteStart::<_, _, _> { insn, src_values } = execute_start; | ||||
|         #[hdl] | ||||
|         match mop { | ||||
|         match insn.mop { | ||||
|             AluBranchMOp::<_, _>::AddSub(mop) => connect( | ||||
|                 unit_base.execute_end, | ||||
|                 HdlSome( | ||||
|                     #[hdl] | ||||
|                     ExecuteEnd::<_, _> { | ||||
|                     ExecuteEnd::<_, _, _> { | ||||
|                         unit_output: #[hdl] | ||||
|                         UnitOutput::<_, _> { | ||||
|                             which: MOpTrait::dest_reg(mop), | ||||
|                         UnitOutput::<_, _, _> { | ||||
|                             dest: insn.dest, | ||||
|                             retire_queue_index: insn.retire_queue_index, | ||||
|                             result: UnitResult[()].Completed(add_sub( | ||||
|                                 mop, | ||||
|                                 pc, | ||||
|                                 insn.pc, | ||||
|                                 global_state.flags_mode, | ||||
|                                 src_values, | ||||
|                             )), | ||||
|  | @ -308,13 +303,14 @@ pub fn alu_branch(config: &CpuConfig, unit_index: usize) { | |||
|                 unit_base.execute_end, | ||||
|                 HdlSome( | ||||
|                     #[hdl] | ||||
|                     ExecuteEnd::<_, _> { | ||||
|                     ExecuteEnd::<_, _, _> { | ||||
|                         unit_output: #[hdl] | ||||
|                         UnitOutput::<_, _> { | ||||
|                             which: MOpTrait::dest_reg(mop), | ||||
|                         UnitOutput::<_, _, _> { | ||||
|                             dest: insn.dest, | ||||
|                             retire_queue_index: insn.retire_queue_index, | ||||
|                             result: UnitResult[()].Completed(add_sub( | ||||
|                                 mop, | ||||
|                                 pc, | ||||
|                                 insn.pc, | ||||
|                                 global_state.flags_mode, | ||||
|                                 src_values, | ||||
|                             )), | ||||
|  | @ -326,10 +322,11 @@ pub fn alu_branch(config: &CpuConfig, unit_index: usize) { | |||
|                 unit_base.execute_end, | ||||
|                 HdlSome( | ||||
|                     #[hdl] | ||||
|                     ExecuteEnd::<_, _> { | ||||
|                     ExecuteEnd::<_, _, _> { | ||||
|                         unit_output: #[hdl] | ||||
|                         UnitOutput::<_, _> { | ||||
|                             which: MOpTrait::dest_reg(mop), | ||||
|                         UnitOutput::<_, _, _> { | ||||
|                             dest: insn.dest, | ||||
|                             retire_queue_index: insn.retire_queue_index, | ||||
|                             result: UnitResult[()].Completed(logical( | ||||
|                                 mop, | ||||
|                                 global_state.flags_mode, | ||||
|  | @ -361,7 +358,7 @@ impl AluBranch { | |||
| impl UnitTrait for AluBranch { | ||||
|     type Type = alu_branch; | ||||
|     type ExtraOut = (); | ||||
|     type MOp = AluBranchMOp<UnitOutRegNum<DynSize>, DynSize>; | ||||
|     type MOp = AluBranchMOp<(), DynSize>; | ||||
| 
 | ||||
|     fn ty(&self) -> Self::Type { | ||||
|         self.module.io_ty() | ||||
|  | @ -379,10 +376,7 @@ impl UnitTrait for AluBranch { | |||
|         UnitKind::AluBranch | ||||
|     } | ||||
| 
 | ||||
|     fn extract_mop( | ||||
|         &self, | ||||
|         mop: Expr<RenamedMOp<UnitOutRegNum<DynSize>, DynSize>>, | ||||
|     ) -> Expr<HdlOption<Self::MOp>> { | ||||
|     fn extract_mop(&self, mop: Expr<RenamedMOp<DynSize>>) -> Expr<HdlOption<Self::MOp>> { | ||||
|         UnitMOp::alu_branch_mop(mop) | ||||
|     } | ||||
| 
 | ||||
|  | @ -393,7 +387,7 @@ impl UnitTrait for AluBranch { | |||
|     fn unit_to_reg_alloc( | ||||
|         &self, | ||||
|         this: Expr<Self::Type>, | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize>> { | ||||
|     ) -> Expr<UnitToRegAlloc<Self::MOp, Self::ExtraOut, DynSize, DynSize, DynSize, DynSize>> { | ||||
|         this.unit_to_reg_alloc | ||||
|     } | ||||
| 
 | ||||
|  |  | |||
|  | @ -5,69 +5,28 @@ use crate::{ | |||
|     config::CpuConfig, | ||||
|     instruction::{MOpTrait, PRegNum, UnitNum, UnitOutRegNum, COMMON_MOP_SRC_LEN}, | ||||
|     register::PRegValue, | ||||
|     unit::{UnitCancelInput, UnitOutput, UnitOutputWrite}, | ||||
|     util::tree_reduce::tree_reduce, | ||||
|     unit::{ | ||||
|         RenamedInsnData, UnitCancelInput, UnitForwardingInfo, UnitOutput, UnitOutputWrite, | ||||
|         UnitToRegAlloc, | ||||
|     }, | ||||
| }; | ||||
| use fayalite::{ | ||||
|     memory::splat_mask, | ||||
|     module::{memory_with_loc, wire_with_loc}, | ||||
|     prelude::*, | ||||
|     ty::StaticType, | ||||
|     util::ready_valid::ReadyValid, | ||||
|     util::{prefix_sum::reduce, ready_valid::ReadyValid}, | ||||
| }; | ||||
| use std::marker::PhantomData; | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct UnitForwardingInfo<UnitNumWidth: Size, OutRegNumWidth: Size, UnitCount: Size> { | ||||
|     pub unit_output_writes: ArrayType<HdlOption<UnitOutputWrite<OutRegNumWidth>>, UnitCount>, | ||||
|     pub unit_reg_frees: ArrayType<HdlOption<UnitOutRegNum<OutRegNumWidth>>, UnitCount>, | ||||
|     pub _phantom: PhantomData<UnitNumWidth>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct UnitInput<MOp: Type> { | ||||
|     pub mop: MOp, | ||||
|     pub pc: UInt<64>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct UnitToRegAlloc< | ||||
|     MOp: Type, | ||||
|     ExtraOut: Type, | ||||
|     UnitNumWidth: Size, | ||||
|     OutRegNumWidth: Size, | ||||
|     UnitCount: Size, | ||||
| > { | ||||
|     #[hdl(flip)] | ||||
|     pub unit_forwarding_info: UnitForwardingInfo<UnitNumWidth, OutRegNumWidth, UnitCount>, | ||||
|     #[hdl(flip)] | ||||
|     pub input: ReadyValid<UnitInput<MOp>>, | ||||
|     #[hdl(flip)] | ||||
|     pub cancel_input: HdlOption<UnitCancelInput<OutRegNumWidth>>, | ||||
|     pub output: HdlOption<UnitOutput<OutRegNumWidth, ExtraOut>>, | ||||
| } | ||||
| 
 | ||||
| impl<MOp: Type, ExtraOut: Type, UnitNumWidth: Size, OutRegNumWidth: Size, UnitCount: Size> | ||||
|     UnitToRegAlloc<MOp, ExtraOut, UnitNumWidth, OutRegNumWidth, UnitCount> | ||||
| { | ||||
|     pub fn mop_ty(self) -> MOp { | ||||
|         self.input.data.HdlSome.mop | ||||
|     } | ||||
|     pub fn extra_out_ty(self) -> ExtraOut { | ||||
|         self.output.HdlSome.extra_out_ty() | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct ExecuteStart<MOp: Type + MOpTrait<DestReg = UnitOutRegNum<DynSize>>> { | ||||
|     pub mop: MOp, | ||||
|     pub pc: UInt<64>, | ||||
| pub struct ExecuteStart<MOp: Type, OutRegNumWidth: Size, RetireQueueIndexWidth: Size> { | ||||
|     pub insn: RenamedInsnData<MOp, UnitOutRegNum<OutRegNumWidth>, RetireQueueIndexWidth>, | ||||
|     pub src_values: Array<PRegValue, { COMMON_MOP_SRC_LEN }>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct ExecuteEnd<OutRegNumWidth: Size, ExtraOut> { | ||||
|     pub unit_output: UnitOutput<OutRegNumWidth, ExtraOut>, | ||||
| pub struct ExecuteEnd<OutRegNumWidth: Size, RetireQueueIndexWidth: Size, ExtraOut> { | ||||
|     pub unit_output: UnitOutput<OutRegNumWidth, RetireQueueIndexWidth, ExtraOut>, | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
|  | @ -148,10 +107,9 @@ impl InFlightOpState { | |||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| struct InFlightOp<MOp: Type> { | ||||
| struct InFlightOp<MOp: Type, OutRegNumWidth: Size, RetireQueueIndexWidth: Size> { | ||||
|     state: InFlightOpState, | ||||
|     mop: MOp, | ||||
|     pc: UInt<64>, | ||||
|     insn: RenamedInsnData<MOp, UnitOutRegNum<OutRegNumWidth>, RetireQueueIndexWidth>, | ||||
|     src_ready_flags: Array<Bool, { COMMON_MOP_SRC_LEN }>, | ||||
| } | ||||
| 
 | ||||
|  | @ -166,7 +124,7 @@ impl<OpIndexWidth: Size> InFlightOpsSummary<OpIndexWidth> { | |||
|     fn new<MOp: Type>( | ||||
|         op_index: usize, | ||||
|         op_index_ty: UIntType<OpIndexWidth>, | ||||
|         in_flight_op: impl ToExpr<Type = HdlOption<InFlightOp<MOp>>>, | ||||
|         in_flight_op: impl ToExpr<Type = HdlOption<InFlightOp<MOp, DynSize, DynSize>>>, | ||||
|     ) -> Expr<Self> { | ||||
|         let empty_op_index = wire_with_loc( | ||||
|             &format!("empty_op_index_{op_index}"), | ||||
|  | @ -183,10 +141,9 @@ impl<OpIndexWidth: Size> InFlightOpsSummary<OpIndexWidth> { | |||
|         #[hdl] | ||||
|         if let HdlSome(in_flight_op) = in_flight_op { | ||||
|             #[hdl] | ||||
|             let InFlightOp::<_> { | ||||
|             let InFlightOp::<_, _, _> { | ||||
|                 state, | ||||
|                 mop: _, | ||||
|                 pc: _, | ||||
|                 insn: _, | ||||
|                 src_ready_flags, | ||||
|             } = in_flight_op; | ||||
|             connect(ready_op_index, HdlOption[op_index_ty].HdlNone()); | ||||
|  | @ -224,13 +181,15 @@ impl<OpIndexWidth: Size> InFlightOpsSummary<OpIndexWidth> { | |||
| 
 | ||||
| impl InFlightOpsSummary<DynSize> { | ||||
|     fn summarize<MOp: Type, MaxInFlight: Size>( | ||||
|         in_flight_ops: impl ToExpr<Type = ArrayType<HdlOption<InFlightOp<MOp>>, MaxInFlight>>, | ||||
|         in_flight_ops: impl ToExpr< | ||||
|             Type = ArrayType<HdlOption<InFlightOp<MOp, DynSize, DynSize>>, MaxInFlight>, | ||||
|         >, | ||||
|     ) -> Expr<Self> { | ||||
|         let in_flight_ops = in_flight_ops.to_expr(); | ||||
|         let max_in_flight = Expr::ty(in_flight_ops).len(); | ||||
|         let index_range = 0..max_in_flight; | ||||
|         let index_ty = UInt::range(index_range.clone()); | ||||
|         tree_reduce( | ||||
|         reduce( | ||||
|             index_range.map(|i| Self::new(i, index_ty, in_flight_ops[i])), | ||||
|             Self::combine, | ||||
|         ) | ||||
|  | @ -239,10 +198,7 @@ impl InFlightOpsSummary<DynSize> { | |||
| } | ||||
| 
 | ||||
| #[hdl_module] | ||||
| pub fn unit_base< | ||||
|     MOp: Type + MOpTrait<DestReg = UnitOutRegNum<DynSize>, SrcRegWidth = DynSize>, | ||||
|     ExtraOut: Type, | ||||
| >( | ||||
| pub fn unit_base<MOp: Type + MOpTrait<DestReg = (), SrcRegWidth = DynSize>, ExtraOut: Type>( | ||||
|     config: &CpuConfig, | ||||
|     unit_index: usize, | ||||
|     mop_ty: MOp, | ||||
|  | @ -251,18 +207,20 @@ pub fn unit_base< | |||
|     #[hdl] | ||||
|     let cd: ClockDomain = m.input(); | ||||
|     #[hdl] | ||||
|     let unit_to_reg_alloc: UnitToRegAlloc<MOp, ExtraOut, DynSize, DynSize, DynSize> = | ||||
|     let unit_to_reg_alloc: UnitToRegAlloc<MOp, ExtraOut, DynSize, DynSize, DynSize, DynSize> = | ||||
|         m.output(config.unit_to_reg_alloc(mop_ty, extra_out_ty)); | ||||
|     #[hdl] | ||||
|     let execute_start: ReadyValid<ExecuteStart<MOp>> = m.output(ReadyValid[ExecuteStart[mop_ty]]); | ||||
|     let execute_start: ReadyValid<ExecuteStart<MOp, DynSize, DynSize>> = | ||||
|         m.output(ReadyValid[config.execute_start(mop_ty)]); | ||||
|     #[hdl] | ||||
|     let execute_end: HdlOption<ExecuteEnd<DynSize, ExtraOut>> = | ||||
|         m.input(HdlOption[ExecuteEnd[config.out_reg_num_width][extra_out_ty]]); | ||||
|     let execute_end: HdlOption<ExecuteEnd<DynSize, DynSize, ExtraOut>> = | ||||
|         m.input(HdlOption[config.execute_end(extra_out_ty)]); | ||||
| 
 | ||||
|     connect(execute_start.data, Expr::ty(execute_start).data.HdlNone()); | ||||
| 
 | ||||
|     let max_in_flight = config.unit_max_in_flight(unit_index).get(); | ||||
|     let in_flight_op_ty = InFlightOp[mop_ty]; | ||||
|     let in_flight_op_ty = | ||||
|         InFlightOp[mop_ty][config.out_reg_num_width][config.retire_queue_index_width()]; | ||||
|     #[hdl] | ||||
|     let in_flight_ops = reg_builder() | ||||
|         .clock_domain(cd) | ||||
|  | @ -361,15 +319,15 @@ pub fn unit_base< | |||
|         connect(ready_write_port.mask, true); | ||||
|         #[hdl] | ||||
|         if let HdlSome(unit_output_write) = unit_output_writes[unit_index] { | ||||
|             connect_any(write_port.addr, unit_output_write.which.value); | ||||
|             connect_any(write_port.addr, unit_output_write.dest.value); | ||||
|             connect(write_port.data, unit_output_write.value); | ||||
|             connect(write_port.en, true); | ||||
|             connect_any(ready_write_port.addr, unit_output_write.which.value); | ||||
|             connect_any(ready_write_port.addr, unit_output_write.dest.value); | ||||
|             connect(ready_write_port.en, true); | ||||
|             let p_reg_num = #[hdl] | ||||
|             PRegNum::<_, _> { | ||||
|                 unit_num: config.unit_num().from_index(unit_index), | ||||
|                 unit_out_reg: unit_output_write.which, | ||||
|                 unit_out_reg: unit_output_write.dest, | ||||
|             }; | ||||
|             for src_index in 0..COMMON_MOP_SRC_LEN { | ||||
|                 #[hdl] | ||||
|  | @ -399,9 +357,8 @@ pub fn unit_base< | |||
|                 execute_start.data, | ||||
|                 HdlSome( | ||||
|                     #[hdl] | ||||
|                     ExecuteStart::<_> { | ||||
|                         mop: in_flight_op.mop, | ||||
|                         pc: in_flight_op.pc, | ||||
|                     ExecuteStart::<_, _, _> { | ||||
|                         insn: in_flight_op.insn, | ||||
|                         src_values: read_src_values, | ||||
|                     }, | ||||
|                 ), | ||||
|  | @ -420,7 +377,12 @@ pub fn unit_base< | |||
|     #[hdl] | ||||
|     if let HdlSome(input) = ReadyValid::firing_data(unit_to_reg_alloc.input) { | ||||
|         #[hdl] | ||||
|         let UnitInput::<_> { mop, pc } = input; | ||||
|         let RenamedInsnData::<_, _, _> { | ||||
|             retire_queue_index, | ||||
|             pc: _, | ||||
|             dest: _, | ||||
|             mop, | ||||
|         } = input; | ||||
|         #[hdl] | ||||
|         let input_mop_src_regs = wire(mop_ty.src_regs_ty()); | ||||
|         connect( | ||||
|  | @ -436,20 +398,24 @@ pub fn unit_base< | |||
|         connect(src_ready_flags, input_src_regs_valid); | ||||
|         connect(input_src_regs, input_mop_src_regs); | ||||
|         #[hdl] | ||||
|         if unit_to_reg_alloc.cancel_input.cmp_ne(HdlSome( | ||||
|             #[hdl] | ||||
|             UnitCancelInput::<_> { | ||||
|                 which: MOp::dest_reg(mop), | ||||
|             }, | ||||
|         )) { | ||||
|         let input_is_canceled = wire(); | ||||
|         connect(input_is_canceled, false); | ||||
|         #[hdl] | ||||
|         if let HdlSome(cancel_input) = unit_to_reg_alloc.cancel_input { | ||||
|             connect( | ||||
|                 input_is_canceled, | ||||
|                 UnitCancelInput::is_canceled(cancel_input, retire_queue_index), | ||||
|             ); | ||||
|         } | ||||
|         #[hdl] | ||||
|         if !input_is_canceled { | ||||
|             connect( | ||||
|                 input_in_flight_op, | ||||
|                 HdlSome( | ||||
|                     #[hdl] | ||||
|                     InFlightOp::<_> { | ||||
|                     InFlightOp::<_, _, _> { | ||||
|                         state: InFlightOpState.Ready(), | ||||
|                         mop, | ||||
|                         pc, | ||||
|                         insn: input, | ||||
|                         src_ready_flags, | ||||
|                     }, | ||||
|                 ), | ||||
|  | @ -483,13 +449,11 @@ pub fn unit_base< | |||
|         #[hdl] | ||||
|         if let HdlSome(in_flight_op) = in_flight_ops[in_flight_op_index] { | ||||
|             #[hdl] | ||||
|             let InFlightOp::<_> { | ||||
|             let InFlightOp::<_, _, _> { | ||||
|                 state, | ||||
|                 mop, | ||||
|                 pc, | ||||
|                 insn, | ||||
|                 src_ready_flags, | ||||
|             } = in_flight_op; | ||||
|             let which = MOp::dest_reg(mop); | ||||
|             let src_regs = wire_with_loc( | ||||
|                 &format!("in_flight_op_src_regs_{in_flight_op_index}"), | ||||
|                 SourceLocation::caller(), | ||||
|  | @ -499,7 +463,7 @@ pub fn unit_base< | |||
|                 src_regs, | ||||
|                 repeat(config.p_reg_num().const_zero().cast_to_bits(), ConstUsize), | ||||
|             ); | ||||
|             MOp::connect_src_regs(mop, src_regs); | ||||
|             MOp::connect_src_regs(insn.mop, src_regs); | ||||
| 
 | ||||
|             #[hdl] | ||||
|             if in_flight_ops_summary.ready_op_index.cmp_eq(HdlSome( | ||||
|  | @ -517,7 +481,7 @@ pub fn unit_base< | |||
|                 if let HdlSome(unit_output_write) = unit_output_writes[unit_index] { | ||||
|                     #[hdl] | ||||
|                     let UnitOutputWrite::<_> { | ||||
|                         which: unit_out_reg, | ||||
|                         dest: unit_out_reg, | ||||
|                         value: _, | ||||
|                     } = unit_output_write; | ||||
|                     let p_reg_num = #[hdl] | ||||
|  | @ -537,20 +501,21 @@ pub fn unit_base< | |||
|                 } | ||||
|             } | ||||
| 
 | ||||
|             connect( | ||||
|                 in_flight_op_canceling[in_flight_op_index], | ||||
|                 unit_to_reg_alloc.cancel_input.cmp_eq(HdlSome( | ||||
|                     #[hdl] | ||||
|                     UnitCancelInput::<_> { which }, | ||||
|                 )), | ||||
|             ); | ||||
|             connect(in_flight_op_canceling[in_flight_op_index], false); | ||||
|             #[hdl] | ||||
|             if let HdlSome(cancel_input) = unit_to_reg_alloc.cancel_input { | ||||
|                 connect( | ||||
|                     in_flight_op_canceling[in_flight_op_index], | ||||
|                     UnitCancelInput::is_canceled(cancel_input, insn.retire_queue_index), | ||||
|                 ); | ||||
|             } | ||||
| 
 | ||||
|             #[hdl] | ||||
|             if let HdlSome(execute_end) = execute_end { | ||||
|                 #[hdl] | ||||
|                 let ExecuteEnd::<_, _> { unit_output } = execute_end; | ||||
|                 let ExecuteEnd::<_, _, _> { unit_output } = execute_end; | ||||
|                 #[hdl] | ||||
|                 if which.cmp_eq(unit_output.which) { | ||||
|                 if insn.dest.cmp_eq(unit_output.dest) { | ||||
|                     connect(in_flight_op_execute_ending[in_flight_op_index], true); | ||||
|                     #[hdl] | ||||
|                     if !in_flight_op_canceling[in_flight_op_index] { | ||||
|  | @ -567,7 +532,7 @@ pub fn unit_base< | |||
|             #[hdl] | ||||
|             if let HdlSome(execute_start) = ReadyValid::firing_data(execute_start) { | ||||
|                 #[hdl] | ||||
|                 if which.cmp_eq(MOp::dest_reg(execute_start.mop)) { | ||||
|                 if insn.dest.cmp_eq(execute_start.insn.dest) { | ||||
|                     connect(in_flight_op_execute_starting[in_flight_op_index], true); | ||||
|                 } | ||||
|             } | ||||
|  | @ -594,10 +559,9 @@ pub fn unit_base< | |||
|                     in_flight_ops[in_flight_op_index], | ||||
|                     HdlSome( | ||||
|                         #[hdl] | ||||
|                         InFlightOp::<_> { | ||||
|                         InFlightOp::<_, _, _> { | ||||
|                             state, | ||||
|                             mop, | ||||
|                             pc, | ||||
|                             insn, | ||||
|                             src_ready_flags: in_flight_op_next_src_ready_flags[in_flight_op_index], | ||||
|                         }, | ||||
|                     ), | ||||
|  |  | |||
|  | @ -2,7 +2,6 @@ | |||
| // See Notices.txt for copyright information
 | ||||
| 
 | ||||
| pub mod array_vec; | ||||
| pub mod tree_reduce; | ||||
| 
 | ||||
| pub(crate) const fn range_u32_len(range: &std::ops::Range<u32>) -> usize { | ||||
|     let retval = range.end.saturating_sub(range.start); | ||||
|  | @ -25,3 +24,16 @@ pub(crate) const fn range_u32_nth_or_panic(range: &std::ops::Range<u32>, index: | |||
|         panic!("index out of range") | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| pub(crate) const fn range_intersection( | ||||
|     a: &std::ops::Range<u32>, | ||||
|     b: &std::ops::Range<u32>, | ||||
| ) -> Option<std::ops::Range<u32>> { | ||||
|     let start = if a.start > b.start { a.start } else { b.start }; | ||||
|     let end = if a.end < b.end { a.end } else { b.end }; | ||||
|     if start < end { | ||||
|         Some(start..end) | ||||
|     } else { | ||||
|         None | ||||
|     } | ||||
| } | ||||
|  |  | |||
|  | @ -2,8 +2,11 @@ | |||
| // See Notices.txt for copyright information
 | ||||
| 
 | ||||
| use fayalite::{ | ||||
|     expr::ops::{ExprCastTo, ExprIndex, ExprPartialEq, ExprPartialOrd}, | ||||
|     int::SizeType, | ||||
|     expr::{ | ||||
|         ops::{ExprCastTo, ExprIndex, ExprPartialEq, ExprPartialOrd}, | ||||
|         ToLiteralBits, | ||||
|     }, | ||||
|     int::{IntType, SizeType}, | ||||
|     intern::{Intern, Interned}, | ||||
|     prelude::*, | ||||
|     ty::{MatchVariantWithoutScope, StaticType, TypeProperties}, | ||||
|  | @ -249,6 +252,29 @@ impl<T: Type, N: Size> ArrayVec<T, N> { | |||
|         }); | ||||
|         array_vec_as_array_of_options | ||||
|     } | ||||
|     #[hdl] | ||||
|     pub fn get<Idx: IntType<Dyn = UInt>>( | ||||
|         this: impl ToExpr<Type = Self>, | ||||
|         index: impl ToExpr<Type = Idx>, | ||||
|     ) -> Expr<HdlOption<T>> { | ||||
|         let this = this.to_expr(); | ||||
|         let index = Expr::as_dyn_int(index.to_expr()); | ||||
|         let never_in_bounds = index.cmp_ge(Expr::ty(this).capacity()); | ||||
|         if let Ok(never_in_bounds) = never_in_bounds.to_literal_bits() { | ||||
|             if never_in_bounds[0] { | ||||
|                 // avoid error from out-of-bounds constant index
 | ||||
|                 return HdlOption[Expr::ty(this).element()].HdlNone(); | ||||
|             } | ||||
|         } | ||||
|         #[hdl] | ||||
|         let array_vec_get = wire(HdlOption[Expr::ty(this).element()]); | ||||
|         connect(array_vec_get, Expr::ty(array_vec_get).HdlNone()); | ||||
|         #[hdl] | ||||
|         if index.cmp_lt(Length::as_uint(Self::len(this))) { | ||||
|             connect(array_vec_get, HdlSome(this.elements[index])); | ||||
|         } | ||||
|         array_vec_get | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| impl<T: Type, N: Size, Idx, IdxWidth: Size> ExprIndex<Idx> for ArrayVec<T, N> | ||||
|  | @ -263,3 +289,35 @@ where | |||
|         <ArrayType<T, N> as ExprIndex<Idx>>::expr_index(&this.elements, index) | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[hdl] | ||||
| pub struct ReadyValidArray<T: Type, N: Size> { | ||||
|     pub data: ArrayVec<T, N>, | ||||
|     #[hdl(flip)] | ||||
|     pub ready: Length<N>, | ||||
| } | ||||
| 
 | ||||
| impl<T: Type, N: Size> ReadyValidArray<T, N> { | ||||
|     #[hdl] | ||||
|     pub fn firing_len(this: impl ToExpr<Type = Self>) -> Expr<Length<N>> { | ||||
|         let this = this.to_expr(); | ||||
|         assert_eq!(Expr::ty(this).data.len_ty(), Expr::ty(this).ready); | ||||
|         #[hdl] | ||||
|         let firing_len = wire(Expr::ty(this).data.len); | ||||
|         connect(firing_len, this.data.len); | ||||
|         #[hdl] | ||||
|         if this.data.len.cmp_gt(this.ready) { | ||||
|             connect(firing_len, this.ready); | ||||
|         } | ||||
|         firing_len | ||||
|     } | ||||
|     #[hdl] | ||||
|     pub fn firing_data(this: impl ToExpr<Type = Self>) -> Expr<ArrayVec<T, N>> { | ||||
|         let this = this.to_expr(); | ||||
|         #[hdl] | ||||
|         let firing_data = wire(Expr::ty(this).data); | ||||
|         connect(firing_data, this.data); | ||||
|         connect(firing_data.len, Self::firing_len(this)); | ||||
|         firing_data | ||||
|     } | ||||
| } | ||||
|  |  | |||
|  | @ -1,152 +0,0 @@ | |||
| // SPDX-License-Identifier: LGPL-3.0-or-later
 | ||||
| // See Notices.txt for copyright information
 | ||||
| #[derive(Copy, Clone, PartialEq, Eq, Hash, Debug)] | ||||
| pub enum TreeReduceOp { | ||||
|     Input, | ||||
|     Reduce, | ||||
| } | ||||
| 
 | ||||
| #[derive(Copy, Clone, Debug)] | ||||
| struct Entry { | ||||
|     start: usize, | ||||
|     depth: u32, | ||||
| } | ||||
| 
 | ||||
| #[derive(Clone, Debug)] | ||||
| pub struct TreeReduceOps { | ||||
|     len: usize, | ||||
|     stack: Vec<Entry>, | ||||
| } | ||||
| 
 | ||||
| impl TreeReduceOps { | ||||
|     pub fn new(len: usize) -> Self { | ||||
|         TreeReduceOps { | ||||
|             len, | ||||
|             stack: Vec::new(), | ||||
|         } | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| impl Iterator for TreeReduceOps { | ||||
|     type Item = TreeReduceOp; | ||||
|     fn next(&mut self) -> Option<Self::Item> { | ||||
|         match *self.stack { | ||||
|             [] if self.len != 0 => { | ||||
|                 self.stack.push(Entry { start: 0, depth: 0 }); | ||||
|                 Some(TreeReduceOp::Input) | ||||
|             } | ||||
|             [.., ref mut second_last, last] if second_last.depth == last.depth => { | ||||
|                 second_last.depth += 1; | ||||
|                 self.stack.pop(); | ||||
|                 Some(TreeReduceOp::Reduce) | ||||
|             } | ||||
|             [.., last] if self.len - last.start > 1 << last.depth => { | ||||
|                 let start = last.start + (1 << last.depth); | ||||
|                 self.stack.push(Entry { start, depth: 0 }); | ||||
|                 Some(TreeReduceOp::Input) | ||||
|             } | ||||
|             [.., ref mut second_last, _] => { | ||||
|                 second_last.depth += 1; | ||||
|                 self.stack.pop(); | ||||
|                 Some(TreeReduceOp::Reduce) | ||||
|             } | ||||
|             _ => None, | ||||
|         } | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| #[track_caller] | ||||
| pub fn tree_reduce_with_state<S, I, R>( | ||||
|     iter: impl IntoIterator<IntoIter: ExactSizeIterator, Item = I>, | ||||
|     state: &mut S, | ||||
|     mut input: impl FnMut(&mut S, I) -> R, | ||||
|     mut reduce: impl FnMut(&mut S, R, R) -> R, | ||||
| ) -> Option<R> { | ||||
|     let mut stack = Vec::new(); | ||||
|     let mut iter = iter.into_iter(); | ||||
|     for op in TreeReduceOps::new(iter.len()) { | ||||
|         match op { | ||||
|             TreeReduceOp::Input => stack.push(input( | ||||
|                 state, | ||||
|                 iter.next().expect("inconsistent iterator len() and next()"), | ||||
|             )), | ||||
|             TreeReduceOp::Reduce => { | ||||
|                 let Some(r) = stack.pop() else { | ||||
|                     unreachable!(); | ||||
|                 }; | ||||
|                 let Some(l) = stack.pop() else { | ||||
|                     unreachable!(); | ||||
|                 }; | ||||
|                 stack.push(reduce(state, l, r)); | ||||
|             } | ||||
|         } | ||||
|     } | ||||
|     stack.pop() | ||||
| } | ||||
| 
 | ||||
| pub fn tree_reduce<T>( | ||||
|     iter: impl IntoIterator<Item = T, IntoIter: ExactSizeIterator>, | ||||
|     mut reduce: impl FnMut(T, T) -> T, | ||||
| ) -> Option<T> { | ||||
|     tree_reduce_with_state(iter, &mut (), |_, v| v, move |_, l, r| reduce(l, r)) | ||||
| } | ||||
| 
 | ||||
| #[cfg(test)] | ||||
| mod tests { | ||||
|     use super::*; | ||||
|     use std::ops::Range; | ||||
| 
 | ||||
|     fn recursive_tree_reduce(range: Range<usize>, ops: &mut Vec<TreeReduceOp>) { | ||||
|         if range.len() == 1 { | ||||
|             ops.push(TreeReduceOp::Input); | ||||
|             return; | ||||
|         } | ||||
|         if range.is_empty() { | ||||
|             return; | ||||
|         } | ||||
|         let pow2_len = range.len().next_power_of_two(); | ||||
|         let split = range.start + pow2_len / 2; | ||||
|         recursive_tree_reduce(range.start..split, ops); | ||||
|         recursive_tree_reduce(split..range.end, ops); | ||||
|         ops.push(TreeReduceOp::Reduce); | ||||
|     } | ||||
| 
 | ||||
|     #[test] | ||||
|     fn test_tree_reduce() { | ||||
|         const EXPECTED: &'static [&'static [TreeReduceOp]] = { | ||||
|             use TreeReduceOp::{Input as I, Reduce as R}; | ||||
|             &[ | ||||
|                 &[], | ||||
|                 &[I], | ||||
|                 &[I, I, R], | ||||
|                 &[I, I, R, I, R], | ||||
|                 &[I, I, R, I, I, R, R], | ||||
|                 &[I, I, R, I, I, R, R, I, R], | ||||
|                 &[I, I, R, I, I, R, R, I, I, R, R], | ||||
|                 &[I, I, R, I, I, R, R, I, I, R, I, R, R], | ||||
|                 &[I, I, R, I, I, R, R, I, I, R, I, I, R, R, R], | ||||
|             ] | ||||
|         }; | ||||
|         for len in 0..64 { | ||||
|             let mut expected = vec![]; | ||||
|             recursive_tree_reduce(0..len, &mut expected); | ||||
|             if let Some(&expected2) = EXPECTED.get(len) { | ||||
|                 assert_eq!(*expected, *expected2, "len={len}"); | ||||
|             } | ||||
|             assert_eq!( | ||||
|                 TreeReduceOps::new(len).collect::<Vec<_>>(), | ||||
|                 expected, | ||||
|                 "len={len}" | ||||
|             ); | ||||
|             let seq: Vec<_> = (0..len).collect(); | ||||
|             assert_eq!( | ||||
|                 seq, | ||||
|                 tree_reduce(seq.iter().map(|&v| vec![v]), |mut l, r| { | ||||
|                     l.extend_from_slice(&r); | ||||
|                     l | ||||
|                 }) | ||||
|                 .unwrap_or_default() | ||||
|             ); | ||||
|         } | ||||
|     } | ||||
| } | ||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue