pub const fn simd_aligned_size(size: usize) -> usize
Calculates the SIMD-aligned buffer size for `size` elements: a multiple of 4, matching the four lanes of an `f64x4` vector.