Make calibration autodetect the CPU microarchitecture (the number of cores is still hard-coded, which is a hack)

This commit is contained in:
GuillaumeDIDIER 2020-05-28 11:22:50 +02:00
parent 80c6a556bf
commit c84aefa2e8
2 changed files with 61 additions and 43 deletions

View File

@ -1,11 +1,21 @@
#![allow(clippy::missing_safety_doc)]
use crate::complex_addressing::{cache_slicing, CacheSlicing};
use crate::{flush, maccess, rdtsc_fence};
use cpuid::MicroArchitecture;
use core::arch::x86_64 as arch_x86;
#[cfg(feature = "no_std")]
use polling_serial::{serial_print as print, serial_println as println};
extern crate alloc;
use crate::calibration::Verbosity::*;
use alloc::vec;
use alloc::vec::Vec;
use core::cmp::min;
use itertools::Itertools;
#[derive(Ord, PartialOrd, Eq, PartialEq)]
pub enum Verbosity {
NoOutput,
@ -20,14 +30,6 @@ pub struct HistParams {
bucket_number: usize,
}
extern crate alloc;
use crate::calibration::Verbosity::*;
use crate::complex_addressing::AddressHasher;
use alloc::vec;
use alloc::vec::Vec;
use core::cmp::min;
use itertools::Itertools;
pub unsafe fn only_reload(p: *const u8) -> u64 {
let t = rdtsc_fence();
maccess(p);
@ -194,7 +196,6 @@ pub fn calibrate_flush(
iterations: CFLUSH_NUM_ITER,
},
verbose_level,
None,
)
}
@ -234,7 +235,6 @@ pub unsafe fn calibrate(
iterations: num_iterations,
},
verbosity_level,
None,
)
}
@ -246,18 +246,7 @@ fn calibrate_impl_fixed_freq(
operations: &[CalibrateOperation],
hist_params: HistParams,
verbosity_level: Verbosity,
hasher: Option<&AddressHasher>,
) -> Vec<CalibrateResult> {
// TODO : adapt this to detect CPU generation and grab the correct masks.
// These are the skylake masks.
/*let masks: [usize; 3] = [
0b1111_0011_0011_0011_0010_0100_1100_0100_000000,
0b1011_1010_1101_0111_1110_1010_1010_0010_000000,
0b0110_1101_0111_1101_0101_1101_0101_0001_000000,
];
let hasher = AddressHasher::new(&masks);
*/
if verbosity_level >= Thresholds {
println!(
"Calibrating {}...",
@ -270,10 +259,28 @@ fn calibrate_impl_fixed_freq(
let to_bucket = |time: u64| -> usize { time as usize / hist_params.bucket_size };
let from_bucket = |bucket: usize| -> u64 { (bucket * hist_params.bucket_size) as u64 };
let slicing = if let Some(uarch) = MicroArchitecture::get_micro_architecture() {
Some(cache_slicing(uarch, 8))
} else {
None
};
let h = if let Some(s) = slicing {
if s.can_hash() {
Some(|addr: usize| -> usize { slicing.unwrap().hash(addr).unwrap() })
} else {
None
}
} else {
None
};
// TODO: fix the gross hack of passing a hard-coded 8 (the maximum supported core count) to cache_slicing instead of the real number of physical cores
let mut ret = Vec::new();
if verbosity_level >= Thresholds {
print!("CSV: address, ");
if hasher.is_some() {
if h.is_some() {
print!("hash, ");
}
println!(
@ -294,7 +301,7 @@ fn calibrate_impl_fixed_freq(
}
if verbosity_level >= RawResult {
print!("RESULT:address,");
if hasher.is_some() {
if h.is_some() {
print!("hash,");
}
println!(
@ -308,7 +315,7 @@ fn calibrate_impl_fixed_freq(
for i in (0..len).step_by(increment) {
let pointer = unsafe { p.offset(i) };
let hash = hasher.map(|h| h.hash(pointer as usize));
let hash = h.map(|h| h(pointer as usize));
if verbosity_level >= Thresholds {
print!("Calibration for {:p}", pointer);
@ -437,7 +444,6 @@ pub fn calibrate_L3_miss_hit(
iterations: 1 << 11,
},
verbose_level,
None,
);
r.into_iter().next().unwrap()

View File

@ -1,16 +1,20 @@
use crate::complex_addressing::CacheSlicing::{ComplexAddressing, Unsupported};
use crate::complex_addressing::CacheSlicing::{
ComplexAddressing, NoSlice, SimpleAddressing, Unsupported,
};
use cpuid::MicroArchitecture;
/// Cache slice addressing scheme, as returned by `cache_slicing` for a given
/// micro-architecture and physical core count.
///
/// Use `can_hash` to check whether `hash` can map an address to a value.
#[derive(Debug, Copy, Clone)]
pub enum CacheSlicing {
/// Fallback returned by `cache_slicing` for micro-architectures it has no
/// entry for; `can_hash` is false and `hash` returns `None`.
Unsupported,
/// A list of bit masks. `hash` produces one parity bit per mask (parity of
/// `addr & mask`), with the first mask ending up in the most significant bit.
ComplexAddressing(&'static [usize]),
/// A single bit mask; `hash` returns `addr & mask` unchanged.
SimpleAddressing(&'static usize),
/// `can_hash` is false and `hash` returns `None` for this variant.
/// NOTE(review): presumably denotes a cache that is not sliced at all — confirm.
NoSlice,
}
const SANDYBRIDGE_TO_SKYLAKE_FUNCTIONS: [usize; 3] = [
const SANDYBRIDGE_TO_SKYLAKE_FUNCTIONS: [usize; 4] = [
0b0110_1101_0111_1101_0101_1101_0101_0001_000000,
0b1011_1010_1101_0111_1110_1010_1010_0010_000000,
0b1111_0011_0011_0011_0010_0100_1100_0100_000000,
0b0, // TODO
];
// missing functions for more than 8 cores.
@ -26,28 +30,36 @@ pub fn cache_slicing(uarch: MicroArchitecture, physical_cores: u8) -> CacheSlici
| MicroArchitecture::CoffeeLake => {
ComplexAddressing(&SANDYBRIDGE_TO_SKYLAKE_FUNCTIONS[0..((trailing_zeros + 1) as usize)])
}
MicroArchitecture::SandyBridge => {
ComplexAddressing(&SANDYBRIDGE_TO_SKYLAKE_FUNCTIONS[0..((trailing_zeros) as usize)])
}
_ => Unsupported,
}
}
pub struct AddressHasher<'a> {
masks: &'a [usize],
/// Returns the parity (0 or 1) of the bits of `addr` selected by `mask`.
///
/// The result is 1 when an odd number of the selected bits are set, 0 otherwise.
fn hash(addr: usize, mask: usize) -> usize {
    let selected_bits = addr & mask;
    let odd_popcount = selected_bits.count_ones() % 2 == 1;
    usize::from(odd_popcount)
}
/// Returns the parity (0 or 1) of the bits of `addr` selected by `mask`, as a `u32`.
fn hash(addr: usize, mask: usize) -> u32 {
    let masked = addr & mask;
    // An odd population count yields 1, an even one yields 0.
    masked.count_ones() % 2
}
impl AddressHasher<'_> {
pub fn new(masks: &[usize]) -> AddressHasher {
AddressHasher { masks }
impl CacheSlicing {
pub fn can_hash(&self) -> bool {
match self {
Unsupported | NoSlice => false,
ComplexAddressing(_) | SimpleAddressing(_) => true,
}
pub fn hash(&self, addr: usize) -> u32 {
}
pub fn hash(&self, addr: usize) -> Option<usize> {
match self {
SimpleAddressing(&mask) => Some((addr & mask)),
ComplexAddressing(masks) => {
let mut res = 0;
for mask in self.masks {
for mask in *masks {
res <<= 1;
res |= hash(addr, *mask);
}
res
Some(res)
}
_ => None,
}
}
}