diff options
Diffstat (limited to 'src/f32/sse2/mat2.rs')
-rw-r--r-- | src/f32/sse2/mat2.rs | 505 |
1 files changed, 505 insertions, 0 deletions
diff --git a/src/f32/sse2/mat2.rs b/src/f32/sse2/mat2.rs new file mode 100644 index 0000000..0222bdd --- /dev/null +++ b/src/f32/sse2/mat2.rs @@ -0,0 +1,505 @@ +// Generated from mat.rs.tera template. Edit the template, not the generated file. + +use crate::{swizzles::*, DMat2, Mat3, Mat3A, Vec2}; +#[cfg(not(target_arch = "spirv"))] +use core::fmt; +use core::iter::{Product, Sum}; +use core::ops::{Add, AddAssign, Mul, MulAssign, Neg, Sub, SubAssign}; + +#[cfg(target_arch = "x86")] +use core::arch::x86::*; +#[cfg(target_arch = "x86_64")] +use core::arch::x86_64::*; + +#[cfg(feature = "libm")] +#[allow(unused_imports)] +use num_traits::Float; + +union UnionCast { + a: [f32; 4], + v: Mat2, +} + +/// Creates a 2x2 matrix from column vectors. +#[inline(always)] +pub const fn mat2(x_axis: Vec2, y_axis: Vec2) -> Mat2 { + Mat2::from_cols(x_axis, y_axis) +} + +/// A 2x2 column major matrix. +#[derive(Clone, Copy)] +#[repr(transparent)] +pub struct Mat2(pub(crate) __m128); + +impl Mat2 { + /// A 2x2 matrix with all elements set to `0.0`. + pub const ZERO: Self = Self::from_cols(Vec2::ZERO, Vec2::ZERO); + + /// A 2x2 identity matrix, where all diagonal elements are `1`, and all off-diagonal elements are `0`. + pub const IDENTITY: Self = Self::from_cols(Vec2::X, Vec2::Y); + + /// All NAN:s. + pub const NAN: Self = Self::from_cols(Vec2::NAN, Vec2::NAN); + + #[allow(clippy::too_many_arguments)] + #[inline(always)] + const fn new(m00: f32, m01: f32, m10: f32, m11: f32) -> Self { + unsafe { + UnionCast { + a: [m00, m01, m10, m11], + } + .v + } + } + + /// Creates a 2x2 matrix from two column vectors. + #[inline(always)] + pub const fn from_cols(x_axis: Vec2, y_axis: Vec2) -> Self { + unsafe { + UnionCast { + a: [x_axis.x, x_axis.y, y_axis.x, y_axis.y], + } + .v + } + } + + /// Creates a 2x2 matrix from a `[f32; 4]` array stored in column major order. + /// If your data is stored in row major you will need to `transpose` the returned + /// matrix. + #[inline] + pub const fn from_cols_array(m: &[f32; 4]) -> Self { + Self::new(m[0], m[1], m[2], m[3]) + } + + /// Creates a `[f32; 4]` array storing data in column major order. + /// If you require data in row major order `transpose` the matrix first. + #[inline] + pub const fn to_cols_array(&self) -> [f32; 4] { + unsafe { *(self as *const Self as *const [f32; 4]) } + } + + /// Creates a 2x2 matrix from a `[[f32; 2]; 2]` 2D array stored in column major order. + /// If your data is in row major order you will need to `transpose` the returned + /// matrix. + #[inline] + pub const fn from_cols_array_2d(m: &[[f32; 2]; 2]) -> Self { + Self::from_cols(Vec2::from_array(m[0]), Vec2::from_array(m[1])) + } + + /// Creates a `[[f32; 2]; 2]` 2D array storing data in column major order. + /// If you require data in row major order `transpose` the matrix first. + #[inline] + pub const fn to_cols_array_2d(&self) -> [[f32; 2]; 2] { + unsafe { *(self as *const Self as *const [[f32; 2]; 2]) } + } + + /// Creates a 2x2 matrix with its diagonal set to `diagonal` and all other entries set to 0. + #[doc(alias = "scale")] + #[inline] + pub const fn from_diagonal(diagonal: Vec2) -> Self { + Self::new(diagonal.x, 0.0, 0.0, diagonal.y) + } + + /// Creates a 2x2 matrix containing the combining non-uniform `scale` and rotation of + /// `angle` (in radians). + #[inline] + pub fn from_scale_angle(scale: Vec2, angle: f32) -> Self { + let (sin, cos) = angle.sin_cos(); + Self::new(cos * scale.x, sin * scale.x, -sin * scale.y, cos * scale.y) + } + + /// Creates a 2x2 matrix containing a rotation of `angle` (in radians). + #[inline] + pub fn from_angle(angle: f32) -> Self { + let (sin, cos) = angle.sin_cos(); + Self::new(cos, sin, -sin, cos) + } + + /// Creates a 2x2 matrix from a 3x3 matrix, discarding the 2nd row and column. + #[inline] + pub fn from_mat3(m: Mat3) -> Self { + Self::from_cols(m.x_axis.xy(), m.y_axis.xy()) + } + + /// Creates a 2x2 matrix from a 3x3 matrix, discarding the 2nd row and column. + #[inline] + pub fn from_mat3a(m: Mat3A) -> Self { + Self::from_cols(m.x_axis.xy(), m.y_axis.xy()) + } + + /// Creates a 2x2 matrix from the first 4 values in `slice`. + /// + /// # Panics + /// + /// Panics if `slice` is less than 4 elements long. + #[inline] + pub const fn from_cols_slice(slice: &[f32]) -> Self { + Self::new(slice[0], slice[1], slice[2], slice[3]) + } + + /// Writes the columns of `self` to the first 4 elements in `slice`. + /// + /// # Panics + /// + /// Panics if `slice` is less than 4 elements long. + #[inline] + pub fn write_cols_to_slice(self, slice: &mut [f32]) { + slice[0] = self.x_axis.x; + slice[1] = self.x_axis.y; + slice[2] = self.y_axis.x; + slice[3] = self.y_axis.y; + } + + /// Returns the matrix column for the given `index`. + /// + /// # Panics + /// + /// Panics if `index` is greater than 1. + #[inline] + pub fn col(&self, index: usize) -> Vec2 { + match index { + 0 => self.x_axis, + 1 => self.y_axis, + _ => panic!("index out of bounds"), + } + } + + /// Returns a mutable reference to the matrix column for the given `index`. + /// + /// # Panics + /// + /// Panics if `index` is greater than 1. + #[inline] + pub fn col_mut(&mut self, index: usize) -> &mut Vec2 { + match index { + 0 => &mut self.x_axis, + 1 => &mut self.y_axis, + _ => panic!("index out of bounds"), + } + } + + /// Returns the matrix row for the given `index`. + /// + /// # Panics + /// + /// Panics if `index` is greater than 1. + #[inline] + pub fn row(&self, index: usize) -> Vec2 { + match index { + 0 => Vec2::new(self.x_axis.x, self.y_axis.x), + 1 => Vec2::new(self.x_axis.y, self.y_axis.y), + _ => panic!("index out of bounds"), + } + } + + /// Returns `true` if, and only if, all elements are finite. + /// If any element is either `NaN`, positive or negative infinity, this will return `false`. + #[inline] + pub fn is_finite(&self) -> bool { + self.x_axis.is_finite() && self.y_axis.is_finite() + } + + /// Returns `true` if any elements are `NaN`. + #[inline] + pub fn is_nan(&self) -> bool { + self.x_axis.is_nan() || self.y_axis.is_nan() + } + + /// Returns the transpose of `self`. + #[must_use] + #[inline] + pub fn transpose(&self) -> Self { + Self(unsafe { _mm_shuffle_ps(self.0, self.0, 0b11_01_10_00) }) + } + + /// Returns the determinant of `self`. + #[inline] + pub fn determinant(&self) -> f32 { + unsafe { + let abcd = self.0; + let dcba = _mm_shuffle_ps(abcd, abcd, 0b00_01_10_11); + let prod = _mm_mul_ps(abcd, dcba); + let det = _mm_sub_ps(prod, _mm_shuffle_ps(prod, prod, 0b01_01_01_01)); + _mm_cvtss_f32(det) + } + } + + /// Returns the inverse of `self`. + /// + /// If the matrix is not invertible the returned matrix will be invalid. + /// + /// # Panics + /// + /// Will panic if the determinant of `self` is zero when `glam_assert` is enabled. + #[must_use] + #[inline] + pub fn inverse(&self) -> Self { + unsafe { + const SIGN: __m128 = crate::sse2::m128_from_f32x4([1.0, -1.0, -1.0, 1.0]); + let abcd = self.0; + let dcba = _mm_shuffle_ps(abcd, abcd, 0b00_01_10_11); + let prod = _mm_mul_ps(abcd, dcba); + let sub = _mm_sub_ps(prod, _mm_shuffle_ps(prod, prod, 0b01_01_01_01)); + let det = _mm_shuffle_ps(sub, sub, 0b00_00_00_00); + let tmp = _mm_div_ps(SIGN, det); + glam_assert!(Mat2(tmp).is_finite()); + let dbca = _mm_shuffle_ps(abcd, abcd, 0b00_10_01_11); + Self(_mm_mul_ps(dbca, tmp)) + } + } + + /// Transforms a 2D vector. + #[inline] + pub fn mul_vec2(&self, rhs: Vec2) -> Vec2 { + unsafe { + use crate::Align16; + use core::mem::MaybeUninit; + let abcd = self.0; + let xxyy = _mm_set_ps(rhs.y, rhs.y, rhs.x, rhs.x); + let axbxcydy = _mm_mul_ps(abcd, xxyy); + let cydyaxbx = _mm_shuffle_ps(axbxcydy, axbxcydy, 0b01_00_11_10); + let result = _mm_add_ps(axbxcydy, cydyaxbx); + let mut out: MaybeUninit<Align16<Vec2>> = MaybeUninit::uninit(); + _mm_store_ps(out.as_mut_ptr().cast(), result); + out.assume_init().0 + } + } + + /// Multiplies two 2x2 matrices. + #[inline] + pub fn mul_mat2(&self, rhs: &Self) -> Self { + unsafe { + let abcd = self.0; + let rhs = rhs.0; + let xxyy0 = _mm_shuffle_ps(rhs, rhs, 0b01_01_00_00); + let xxyy1 = _mm_shuffle_ps(rhs, rhs, 0b11_11_10_10); + let axbxcydy0 = _mm_mul_ps(abcd, xxyy0); + let axbxcydy1 = _mm_mul_ps(abcd, xxyy1); + let cydyaxbx0 = _mm_shuffle_ps(axbxcydy0, axbxcydy0, 0b01_00_11_10); + let cydyaxbx1 = _mm_shuffle_ps(axbxcydy1, axbxcydy1, 0b01_00_11_10); + let result0 = _mm_add_ps(axbxcydy0, cydyaxbx0); + let result1 = _mm_add_ps(axbxcydy1, cydyaxbx1); + Self(_mm_shuffle_ps(result0, result1, 0b01_00_01_00)) + } + } + + /// Adds two 2x2 matrices. + #[inline] + pub fn add_mat2(&self, rhs: &Self) -> Self { + Self(unsafe { _mm_add_ps(self.0, rhs.0) }) + } + + /// Subtracts two 2x2 matrices. + #[inline] + pub fn sub_mat2(&self, rhs: &Self) -> Self { + Self(unsafe { _mm_sub_ps(self.0, rhs.0) }) + } + + /// Multiplies a 2x2 matrix by a scalar. + #[inline] + pub fn mul_scalar(&self, rhs: f32) -> Self { + Self(unsafe { _mm_mul_ps(self.0, _mm_set_ps1(rhs)) }) + } + + /// Returns true if the absolute difference of all elements between `self` and `rhs` + /// is less than or equal to `max_abs_diff`. + /// + /// This can be used to compare if two matrices contain similar elements. It works best + /// when comparing with a known value. The `max_abs_diff` that should be used used + /// depends on the values being compared against. + /// + /// For more see + /// [comparing floating point numbers](https://randomascii.wordpress.com/2012/02/25/comparing-floating-point-numbers-2012-edition/). + #[inline] + pub fn abs_diff_eq(&self, rhs: Self, max_abs_diff: f32) -> bool { + self.x_axis.abs_diff_eq(rhs.x_axis, max_abs_diff) + && self.y_axis.abs_diff_eq(rhs.y_axis, max_abs_diff) + } + + #[inline] + pub fn as_dmat2(&self) -> DMat2 { + DMat2::from_cols(self.x_axis.as_dvec2(), self.y_axis.as_dvec2()) + } +} + +impl Default for Mat2 { + #[inline] + fn default() -> Self { + Self::IDENTITY + } +} + +impl Add<Mat2> for Mat2 { + type Output = Self; + #[inline] + fn add(self, rhs: Self) -> Self::Output { + self.add_mat2(&rhs) + } +} + +impl AddAssign<Mat2> for Mat2 { + #[inline] + fn add_assign(&mut self, rhs: Self) { + *self = self.add_mat2(&rhs); + } +} + +impl Sub<Mat2> for Mat2 { + type Output = Self; + #[inline] + fn sub(self, rhs: Self) -> Self::Output { + self.sub_mat2(&rhs) + } +} + +impl SubAssign<Mat2> for Mat2 { + #[inline] + fn sub_assign(&mut self, rhs: Self) { + *self = self.sub_mat2(&rhs); + } +} + +impl Neg for Mat2 { + type Output = Self; + #[inline] + fn neg(self) -> Self::Output { + Self(unsafe { _mm_xor_ps(self.0, _mm_set1_ps(-0.0)) }) + } +} + +impl Mul<Mat2> for Mat2 { + type Output = Self; + #[inline] + fn mul(self, rhs: Self) -> Self::Output { + self.mul_mat2(&rhs) + } +} + +impl MulAssign<Mat2> for Mat2 { + #[inline] + fn mul_assign(&mut self, rhs: Self) { + *self = self.mul_mat2(&rhs); + } +} + +impl Mul<Vec2> for Mat2 { + type Output = Vec2; + #[inline] + fn mul(self, rhs: Vec2) -> Self::Output { + self.mul_vec2(rhs) + } +} + +impl Mul<Mat2> for f32 { + type Output = Mat2; + #[inline] + fn mul(self, rhs: Mat2) -> Self::Output { + rhs.mul_scalar(self) + } +} + +impl Mul<f32> for Mat2 { + type Output = Self; + #[inline] + fn mul(self, rhs: f32) -> Self::Output { + self.mul_scalar(rhs) + } +} + +impl MulAssign<f32> for Mat2 { + #[inline] + fn mul_assign(&mut self, rhs: f32) { + *self = self.mul_scalar(rhs); + } +} + +impl Sum<Self> for Mat2 { + fn sum<I>(iter: I) -> Self + where + I: Iterator<Item = Self>, + { + iter.fold(Self::ZERO, Self::add) + } +} + +impl<'a> Sum<&'a Self> for Mat2 { + fn sum<I>(iter: I) -> Self + where + I: Iterator<Item = &'a Self>, + { + iter.fold(Self::ZERO, |a, &b| Self::add(a, b)) + } +} + +impl Product for Mat2 { + fn product<I>(iter: I) -> Self + where + I: Iterator<Item = Self>, + { + iter.fold(Self::IDENTITY, Self::mul) + } +} + +impl<'a> Product<&'a Self> for Mat2 { + fn product<I>(iter: I) -> Self + where + I: Iterator<Item = &'a Self>, + { + iter.fold(Self::IDENTITY, |a, &b| Self::mul(a, b)) + } +} + +impl PartialEq for Mat2 { + #[inline] + fn eq(&self, rhs: &Self) -> bool { + self.x_axis.eq(&rhs.x_axis) && self.y_axis.eq(&rhs.y_axis) + } +} + +#[cfg(not(target_arch = "spirv"))] +impl AsRef<[f32; 4]> for Mat2 { + #[inline] + fn as_ref(&self) -> &[f32; 4] { + unsafe { &*(self as *const Self as *const [f32; 4]) } + } +} + +#[cfg(not(target_arch = "spirv"))] +impl AsMut<[f32; 4]> for Mat2 { + #[inline] + fn as_mut(&mut self) -> &mut [f32; 4] { + unsafe { &mut *(self as *mut Self as *mut [f32; 4]) } + } +} + +impl core::ops::Deref for Mat2 { + type Target = crate::deref::Cols2<Vec2>; + #[inline] + fn deref(&self) -> &Self::Target { + unsafe { &*(self as *const Self as *const Self::Target) } + } +} + +impl core::ops::DerefMut for Mat2 { + #[inline] + fn deref_mut(&mut self) -> &mut Self::Target { + unsafe { &mut *(self as *mut Self as *mut Self::Target) } + } +} + +#[cfg(not(target_arch = "spirv"))] +impl fmt::Debug for Mat2 { + fn fmt(&self, fmt: &mut fmt::Formatter<'_>) -> fmt::Result { + fmt.debug_struct(stringify!(Mat2)) + .field("x_axis", &self.x_axis) + .field("y_axis", &self.y_axis) + .finish() + } +} + +#[cfg(not(target_arch = "spirv"))] +impl fmt::Display for Mat2 { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + write!(f, "[{}, {}]", self.x_axis, self.y_axis) + } +} |