use lamellar::array::prelude::*; use lamellar::memregion::prelude::*; fn initialize_mem_region( memregion: &LamellarMemoryRegion, init_val: T, inc_val: T, ) { unsafe { let mut i = init_val; //(len_per_pe * my_pe as f32).round() as usize; for elem in memregion.as_mut_slice().unwrap() { *elem = i; i += inc_val; } } } macro_rules! initialize_array { (UnsafeArray,$array:ident,$init_val:ident) => { unsafe { $array .dist_iter_mut() .for_each(move |x| *x = $init_val) .block(); } }; (AtomicArray,$array:ident,$init_val:ident) => { $array .dist_iter() .for_each(move |x| x.store($init_val)) .block(); }; (LocalLockArray,$array:ident,$init_val:ident) => { $array .dist_iter_mut() .for_each(move |x| *x = $init_val) .block(); }; (GlobalLockArray,$array:ident,$init_val:ident) => { $array .dist_iter_mut() .for_each(move |x| *x = $init_val) .block(); }; } macro_rules! onesided_iter { (GlobalLockArray,$array:ident) => { $array.read_lock().block().onesided_iter() }; ($arraytype:ident,$array:ident) => { $array.onesided_iter() }; } macro_rules! put_test{ ($array:ident, $t:ty, $len:expr, $dist:ident) =>{ { let world = lamellar::LamellarWorldBuilder::new().build(); let num_pes = world.num_pes(); let my_pe = world.my_pe(); let array_total_len = $len; let mem_seg_len = array_total_len; let mut success = true; let array: $array::<$t> = $array::<$t>::new(world.team(), array_total_len, $dist).block().into(); //convert into abstract LamellarArray, distributed len is total_len let shared_mem_region: LamellarMemoryRegion<$t> = world.alloc_shared_mem_region(mem_seg_len).block().into(); //Convert into abstract LamellarMemoryRegion, each local segment is total_len //initialize array let init_val = my_pe as $t; initialize_array!($array, array, init_val); array.wait_all(); array.barrier(); initialize_mem_region(&shared_mem_region,0 as $t,1 as $t); // world.barrier(); for tx_size in 1..=mem_seg_len{ let num_txs = mem_seg_len/tx_size; for tx in (my_pe..num_txs).step_by(num_pes){ // unsafe{println!("tx_size {:?} tx {:?} sindex: {:?} eindex: {:?} {:?}",tx_size,tx, tx*tx_size,std::cmp::min(mem_seg_len,(tx+1)*tx_size),&shared_mem_region.sub_region(tx*tx_size..std::cmp::min(mem_seg_len,(tx+1)*tx_size)).as_slice());} #[allow(unused_unsafe)] unsafe {let _ = array.put(tx*tx_size,&shared_mem_region.sub_region(tx*tx_size..std::cmp::min(mem_seg_len,(tx+1)*tx_size))).spawn();} } array.wait_all(); array.barrier(); #[allow(unused_unsafe)] for (i,elem) in unsafe { onesided_iter!($array,array).into_iter().enumerate().take( num_txs * tx_size) }{ if ((i as $t - *elem) as f32).abs() > 0.0001 { eprintln!("{:?} {:?} {:?}",i as $t,*elem,((i as $t - *elem) as f32).abs()); success = false; } } array.barrier(); // array.print(); initialize_array!($array, array, init_val); array.wait_all(); array.barrier(); } array.barrier(); world.wait_all(); world.barrier(); let half_len = array_total_len/2; let start_i = half_len/2; let end_i = start_i + half_len; let sub_array = array.sub_array(start_i..end_i); world.barrier(); // sub_array.print(); for tx_size in 1..=half_len{ let num_txs = half_len/tx_size; for tx in (my_pe..num_txs).step_by(num_pes){ // unsafe{println!("tx_size {:?} tx {:?} sindex: {:?} eindex: {:?} {:?}",tx_size,tx, tx*tx_size,std::cmp::min(half_len,(tx+1)*tx_size),&shared_mem_region.sub_region(tx*tx_size..std::cmp::min(half_len,(tx+1)*tx_size)).as_slice());} #[allow(unused_unsafe)] unsafe {let _ = sub_array.put(tx*tx_size,&shared_mem_region.sub_region(tx*tx_size..std::cmp::min(half_len,(tx+1)*tx_size))).spawn();} } array.wait_all(); sub_array.barrier(); #[allow(unused_unsafe)] for (i,elem) in unsafe {onesided_iter!($array,sub_array).into_iter().enumerate().take( num_txs * tx_size)}{ if ((i as $t - *elem) as f32).abs() > 0.0001 { eprintln!("{:?} {:?} {:?}",i as $t,*elem,((i as $t - *elem) as f32).abs()); success = false; } } sub_array.barrier(); // sub_array.print(); initialize_array!($array, array, init_val); sub_array.wait_all(); sub_array.barrier(); // sub_array.print(); } array.barrier(); world.wait_all(); world.barrier(); let pe_len = array_total_len/num_pes; for pe in 0..num_pes{ let len = pe_len/2; let start_i = (pe*pe_len)+ len/2; let end_i = start_i+len; let sub_array = array.sub_array(start_i..end_i); world.barrier(); for tx_size in 1..len{ let num_txs = len/tx_size; for tx in (my_pe..num_txs).step_by(num_pes){ // unsafe{println!("tx_size {:?} tx {:?} sindex: {:?} eindex: {:?} {:?}",tx_size,tx, tx*tx_size,std::cmp::min(len,(tx+1)*tx_size),&shared_mem_region.sub_region(tx*tx_size..std::cmp::min(mem_seg_len,(tx+1)*tx_size)).as_slice());} #[allow(unused_unsafe)] unsafe {let _ = sub_array.put(tx*tx_size,&shared_mem_region.sub_region(tx*tx_size..std::cmp::min(len,(tx+1)*tx_size))).spawn();} } array.wait_all(); sub_array.barrier(); #[allow(unused_unsafe)] for (i,elem) in unsafe {onesided_iter!($array,sub_array).into_iter().enumerate().take( num_txs * tx_size)}{ if ((i as $t - *elem) as f32).abs() > 0.0001 { eprintln!("{:?} {:?} {:?}",i as $t,*elem,((i as $t - *elem) as f32).abs()); success = false; } } sub_array.barrier(); // sub_array.print(); initialize_array!($array, array, init_val); sub_array.wait_all(); sub_array.barrier(); } array.barrier(); world.wait_all(); world.barrier(); } if !success{ eprintln!("failed"); } } } } fn main() { let args: Vec = std::env::args().collect(); let array = args[1].clone(); let dist = args[2].clone(); let elem = args[3].clone(); let len = args[4].parse::().unwrap(); let dist_type = match dist.as_str() { "Block" => Distribution::Block, "Cyclic" => Distribution::Cyclic, _ => panic!("unsupported dist type"), }; match array.as_str() { "UnsafeArray" => match elem.as_str() { "u8" => put_test!(UnsafeArray, u8, len, dist_type), "u16" => put_test!(UnsafeArray, u16, len, dist_type), "u32" => put_test!(UnsafeArray, u32, len, dist_type), "u64" => put_test!(UnsafeArray, u64, len, dist_type), "u128" => put_test!(UnsafeArray, u128, len, dist_type), "usize" => put_test!(UnsafeArray, usize, len, dist_type), "i8" => put_test!(UnsafeArray, i8, len, dist_type), "i16" => put_test!(UnsafeArray, i16, len, dist_type), "i32" => put_test!(UnsafeArray, i32, len, dist_type), "i64" => put_test!(UnsafeArray, i64, len, dist_type), "i128" => put_test!(UnsafeArray, i128, len, dist_type), "isize" => put_test!(UnsafeArray, isize, len, dist_type), "f32" => put_test!(UnsafeArray, f32, len, dist_type), "f64" => put_test!(UnsafeArray, f64, len, dist_type), _ => eprintln!("unsupported element type"), }, "AtomicArray" => match elem.as_str() { "u8" => put_test!(AtomicArray, u8, len, dist_type), "u16" => put_test!(AtomicArray, u16, len, dist_type), "u32" => put_test!(AtomicArray, u32, len, dist_type), "u64" => put_test!(AtomicArray, u64, len, dist_type), "u128" => put_test!(AtomicArray, u128, len, dist_type), "usize" => put_test!(AtomicArray, usize, len, dist_type), "i8" => put_test!(AtomicArray, i8, len, dist_type), "i16" => put_test!(AtomicArray, i16, len, dist_type), "i32" => put_test!(AtomicArray, i32, len, dist_type), "i64" => put_test!(AtomicArray, i64, len, dist_type), "i128" => put_test!(AtomicArray, i128, len, dist_type), "isize" => put_test!(AtomicArray, isize, len, dist_type), "f32" => put_test!(AtomicArray, f32, len, dist_type), "f64" => put_test!(AtomicArray, f64, len, dist_type), _ => eprintln!("unsupported element type"), }, "LocalLockArray" => match elem.as_str() { "u8" => put_test!(LocalLockArray, u8, len, dist_type), "u16" => put_test!(LocalLockArray, u16, len, dist_type), "u32" => put_test!(LocalLockArray, u32, len, dist_type), "u64" => put_test!(LocalLockArray, u64, len, dist_type), "u128" => put_test!(LocalLockArray, u128, len, dist_type), "usize" => put_test!(LocalLockArray, usize, len, dist_type), "i8" => put_test!(LocalLockArray, i8, len, dist_type), "i16" => put_test!(LocalLockArray, i16, len, dist_type), "i32" => put_test!(LocalLockArray, i32, len, dist_type), "i64" => put_test!(LocalLockArray, i64, len, dist_type), "i128" => put_test!(LocalLockArray, i128, len, dist_type), "isize" => put_test!(LocalLockArray, isize, len, dist_type), "f32" => put_test!(LocalLockArray, f32, len, dist_type), "f64" => put_test!(LocalLockArray, f64, len, dist_type), _ => eprintln!("unsupported element type"), }, "GlobalLockArray" => match elem.as_str() { "u8" => put_test!(GlobalLockArray, u8, len, dist_type), "u16" => put_test!(GlobalLockArray, u16, len, dist_type), "u32" => put_test!(GlobalLockArray, u32, len, dist_type), "u64" => put_test!(GlobalLockArray, u64, len, dist_type), "u128" => put_test!(GlobalLockArray, u128, len, dist_type), "usize" => put_test!(GlobalLockArray, usize, len, dist_type), "i8" => put_test!(GlobalLockArray, i8, len, dist_type), "i16" => put_test!(GlobalLockArray, i16, len, dist_type), "i32" => put_test!(GlobalLockArray, i32, len, dist_type), "i64" => put_test!(GlobalLockArray, i64, len, dist_type), "i128" => put_test!(GlobalLockArray, i128, len, dist_type), "isize" => put_test!(GlobalLockArray, isize, len, dist_type), "f32" => put_test!(GlobalLockArray, f32, len, dist_type), "f64" => put_test!(GlobalLockArray, f64, len, dist_type), _ => {} //eprintln!("unsupported element type"), }, _ => eprintln!("unsupported array type"), } }