pub fn axpy_f64(a: &mut [f64], alpha: f64, b: &[f64])
Computes a[i] = a[i] + alpha * b[i] for each index i, updating a in place (axpy operation, f64 version).