fn memset_element_unordered_atomic<T>(s: *mut T, c: u8, bytes: usize)where
    T: Copy + From<u8> + Shl<u32, Output = T> + BitOr<T, Output = T>,