Add a GEMV layer bin

This commit is contained in:
2024-02-22 22:28:43 +01:00
parent ba74572989
commit a13de61081
3 changed files with 101 additions and 2 deletions

View File

@@ -0,0 +1,24 @@
#![no_std]
#![no_main]
extern crate alloc;
use core::fmt::Write;
use nalgebra::{SMatrix, SVector};
use pim_os::{pim::vector::F16x1, uart::Uart0};
const ROWS: usize = 128;
const COLUMNS: usize = 128;
/// Entry point of the CPU-only GEMV layer benchmark.
///
/// Multiplies a `ROWS` x `COLUMNS` matrix with a vector five times, feeding
/// each result back in as the next input, and then writes `Done` to `Uart0`.
#[no_mangle]
pub extern "C" fn main() {
    // Both operands are compile-time constants (all zeros). Routing them
    // through `black_box` makes their contents opaque to the optimizer, so the
    // matrix-vector products below cannot be constant-folded away.
    let matrix = core::hint::black_box(SMatrix::<F16x1, ROWS, COLUMNS>::zeros());
    let mut input_vector = core::hint::black_box(SVector::<F16x1, COLUMNS>::zeros());

    for _ in 0..5 {
        // The product is `ROWS` long and is stored back into a `COLUMNS`-long
        // vector, which type-checks only because the two constants are equal.
        // Using the value returned by `black_box` keeps every iteration's
        // input opaque as well, not just the final result.
        input_vector = core::hint::black_box(matrix * input_vector);
    }

    writeln!(Uart0, "Done").unwrap();
}

View File

@@ -77,7 +77,7 @@ pub extern "C" fn main() {
pim::state::set_bank_mode(BankMode::SingleBank);
}
writeln!(Uart0, "{output_partial_sum_vector}").unwrap();
// writeln!(Uart0, "{output_partial_sum_vector}").unwrap();
let output_vector = SVector::<F16x1, ROWS>::from_fn(|r, _| {
output_partial_sum_vector[r]
@@ -86,5 +86,8 @@ pub extern "C" fn main() {
.fold(F16x1::zero(), |acc, val| acc + *val)
});
writeln!(Uart0, "{output_vector}").unwrap();
core::hint::black_box(output_vector);
// writeln!(Uart0, "{output_vector}").unwrap();
writeln!(Uart0, "Done").unwrap();
}

View File

@@ -0,0 +1,72 @@
#![no_std]
#![no_main]
extern crate alloc;
use aarch64_cpu::asm::barrier;
use alloc::boxed::Box;
use core::fmt::Write;
use nalgebra::{SMatrix, SVector};
use num_traits::{One, Zero};
use pim_isa::BankMode;
use pim_os::{
kernel::gemv,
pim::{
self, interleaved_array,
vector::{F16x1, F16x16},
},
uart::Uart0,
};
const ROWS: usize = 128;
const COLUMNS: usize = 128;
const X16_ROWS: usize = ROWS / 16;
const X16_COLUMNS: usize = COLUMNS / 16;
/// Entry point of the PIM GEMV layer benchmark.
///
/// Selects the `gemv::KERNEL_X4` kernel, builds a `ROWS` x `COLUMNS` matrix
/// whose lower triangle (diagonal included) is filled with ones, and runs the
/// GEMV kernel five times against an all-ones input vector. After each run the
/// lanes of every partial-sum element are added up into a scalar output
/// vector. Finally `Done` is written to `Uart0`.
#[no_mangle]
pub extern "C" fn main() {
    /// Number of times the GEMV layer is executed.
    const LAYER_RUNS: usize = 5;

    pim::state::set_kernel(&gemv::KERNEL_X4);

    // Weights: ones on and below the main diagonal, zeros above it.
    let mut weights = SMatrix::<_, ROWS, COLUMNS>::zeros();
    weights.fill_lower_triangle(F16x1::one(), 0);
    let pim_weights = Box::new(pim::continuous_array::Matrix::<X16_ROWS, X16_COLUMNS>::from(
        weights,
    ));

    let activations = SVector::<_, X16_COLUMNS>::from_element(F16x16::one());
    let mut partial_sums = Box::new(SVector::<F16x16, ROWS>::zeros());
    let dummy = Box::new(0);

    for _ in 0..LAYER_RUNS {
        // The interleaved copy of the input is rebuilt on every run.
        let interleaved_activations =
            Box::new(interleaved_array::Vector::from(activations.clone()));

        // Full-system data synchronization barrier, issued after the operands
        // have been set up and before the PIM operation starts.
        barrier::dsb(barrier::SY);

        // Run the kernel in all-bank PIM mode, then return to single-bank mode.
        pim::state::set_bank_mode(BankMode::PimAllBank);
        gemv::execute(
            pim_weights.as_ref(),
            interleaved_activations.as_ref(),
            partial_sums.as_mut(),
            dummy.as_ref(),
        );
        pim::state::set_bank_mode(BankMode::SingleBank);

        // Collapse each partial-sum element into a single scalar by summing
        // its lanes.
        let reduced = SVector::<F16x1, ROWS>::from_fn(|row, _| {
            let lanes = &partial_sums[row].0;
            lanes.iter().fold(F16x1::zero(), |sum, lane| sum + *lane)
        });

        // Keep the reduction from being optimized away.
        core::hint::black_box(reduced);
    }

    writeln!(Uart0, "Done").unwrap();
}