18void Vec3::CheckW()
const
20#ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
28#ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
29 #if defined(JPH_USE_SSE)
30 return _mm_shuffle_ps(inValue, inValue, _MM_SHUFFLE(2, 2, 1, 0));
31 #elif defined(JPH_USE_NEON)
32 return JPH_NEON_SHUFFLE_F32x4(inValue, inValue, 0, 1, 2, 2);
33 #elif defined(JPH_USE_RVV)
35 const vfloat32m1_t v = __riscv_vle32_v_f32m1(inValue.mData, 3);
36 __riscv_vse32_v_f32m1(value.mData, v, 3);
37 value.mData[3] = value.mData[2];
41 value.mData[0] = inValue.mData[0];
42 value.mData[1] = inValue.mData[1];
43 value.mData[2] = inValue.mData[2];
44 value.mData[3] = inValue.mData[2];
53 mValue(sFixW(inRHS.mValue))
59#if defined(JPH_USE_SSE)
60 Type x = _mm_load_ss(&inV.
x);
61 Type y = _mm_load_ss(&inV.
y);
62 Type z = _mm_load_ss(&inV.
z);
63 Type xy = _mm_unpacklo_ps(x, y);
64 mValue = _mm_shuffle_ps(
xy, z, _MM_SHUFFLE(0, 0, 1, 0));
65#elif defined(JPH_USE_NEON)
66 float32x2_t
xy = vld1_f32(&inV.
x);
67 float32x2_t zz = vdup_n_f32(inV.
z);
69#elif defined(JPH_USE_RVV)
70 const vfloat32m1_t v = __riscv_vle32_v_f32m1(&inV.
x, 3);
71 __riscv_vse32_v_f32m1(
mF32, v, 3);
83#if defined(JPH_USE_SSE)
84 mValue = _mm_set_ps(inZ, inZ, inY, inX);
85#elif defined(JPH_USE_NEON)
87 uint32x2_t zz = vreinterpret_u32_f32(vdup_n_f32(inZ));
88 mValue = vreinterpretq_f32_u32(vcombine_u32(
xy, zz));
89#elif defined(JPH_USE_RVV)
90 const float aggregated[4] = { inX, inY, inZ, inZ };
91 const vfloat32m1_t v = __riscv_vle32_v_f32m1(aggregated, 4);
92 __riscv_vse32_v_f32m1(
mF32, v, 4);
101template<u
int32 SwizzleX, u
int32 SwizzleY, u
int32 SwizzleZ>
104 static_assert(SwizzleX <= 3,
"SwizzleX template parameter out of range");
105 static_assert(SwizzleY <= 3,
"SwizzleY template parameter out of range");
106 static_assert(SwizzleZ <= 3,
"SwizzleZ template parameter out of range");
108#if defined(JPH_USE_SSE)
109 return _mm_shuffle_ps(
mValue,
mValue, _MM_SHUFFLE(SwizzleZ, SwizzleZ, SwizzleY, SwizzleX));
110#elif defined(JPH_USE_NEON)
111 return JPH_NEON_SHUFFLE_F32x4(
mValue,
mValue, SwizzleX, SwizzleY, SwizzleZ, SwizzleZ);
112#elif defined(JPH_USE_RVV)
114 const vfloat32m1_t data = __riscv_vle32_v_f32m1(
mF32, 4);
115 const uint32 stored_indices[4] = { SwizzleX, SwizzleY, SwizzleZ, SwizzleZ };
116 const vuint32m1_t index = __riscv_vle32_v_u32m1(stored_indices, 4);
117 const vfloat32m1_t swizzled = __riscv_vrgather_vv_f32m1(data, index, 4);
118 __riscv_vse32_v_f32m1(v.
mF32, swizzled, 4);
127#if defined(JPH_USE_SSE)
128 return _mm_setzero_ps();
129#elif defined(JPH_USE_NEON)
130 return vdupq_n_f32(0);
131#elif defined(JPH_USE_RVV)
133 const vfloat32m1_t zero_vec = __riscv_vfmv_v_f_f32m1(0.0f, 3);
134 __riscv_vse32_v_f32m1(v.
mF32, zero_vec, 3);
137 return Vec3(0, 0, 0);
143#if defined(JPH_USE_SSE)
144 return _mm_set1_ps(inV);
145#elif defined(JPH_USE_NEON)
146 return vdupq_n_f32(inV);
147#elif defined(JPH_USE_RVV)
149 const vfloat32m1_t v = __riscv_vfmv_v_f_f32m1(inV, 3);
150 __riscv_vse32_v_f32m1(vec.
mF32, v, 3);
153 return Vec3(inV, inV, inV);
164 return sReplicate(numeric_limits<float>::quiet_NaN());
169#if defined(JPH_USE_SSE)
170 Type v = _mm_loadu_ps(&inV.
x);
171#elif defined(JPH_USE_NEON)
172 Type v = vld1q_f32(&inV.
x);
173#elif defined(JPH_USE_RVV)
175 const vfloat32m1_t rvv = __riscv_vle32_v_f32m1(&inV.
x, 3);
176 __riscv_vse32_v_f32m1(v.mData, rvv, 3);
178 Type v = { inV.
x, inV.
y, inV.
z };
185#if defined(JPH_USE_SSE)
187#elif defined(JPH_USE_NEON)
189#elif defined(JPH_USE_RVV)
191 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
192 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
193 const vfloat32m1_t min = __riscv_vfmin_vv_f32m1(v1, v2, 3);
194 __riscv_vse32_v_f32m1(res.
mF32, min, 3);
205#if defined(JPH_USE_SSE)
207#elif defined(JPH_USE_NEON)
209#elif defined(JPH_USE_RVV)
211 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
212 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
213 const vfloat32m1_t max = __riscv_vfmax_vv_f32m1(v1, v2, 3);
214 __riscv_vse32_v_f32m1(res.
mF32, max, 3);
225 return sMax(
sMin(inV, inMax), inMin);
230#if defined(JPH_USE_SSE)
231 return _mm_castps_si128(_mm_cmpeq_ps(inV1.
mValue, inV2.
mValue));
232#elif defined(JPH_USE_NEON)
234#elif defined(JPH_USE_RVV)
236 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
237 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
238 const vbool32_t mask = __riscv_vmfeq_vv_f32m1_b32(v1, v2, 3);
239 const vuint32m1_t zeros = __riscv_vmv_v_x_u32m1(0x0, 3);
240 const vuint32m1_t merged = __riscv_vmerge_vxm_u32m1(zeros, 0xFFFFFFFF, mask, 3);
241 __riscv_vse32_v_u32m1(res.
mU32, merged, 3);
247 inV1.
mF32[1] == inV2.
mF32[1]? 0xffffffffu : 0,
255#if defined(JPH_USE_SSE)
256 return _mm_castps_si128(_mm_cmplt_ps(inV1.
mValue, inV2.
mValue));
257#elif defined(JPH_USE_NEON)
259#elif defined(JPH_USE_RVV)
261 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
262 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
263 const vbool32_t mask = __riscv_vmflt_vv_f32m1_b32(v1, v2, 3);
264 const vuint32m1_t zeros = __riscv_vmv_v_x_u32m1(0x0, 3);
265 const vuint32m1_t merged = __riscv_vmerge_vxm_u32m1(zeros, 0xFFFFFFFF, mask, 3);
266 __riscv_vse32_v_u32m1(res.
mU32, merged, 3);
272 inV1.
mF32[1] < inV2.
mF32[1]? 0xffffffffu : 0,
280#if defined(JPH_USE_SSE)
281 return _mm_castps_si128(_mm_cmple_ps(inV1.
mValue, inV2.
mValue));
282#elif defined(JPH_USE_NEON)
284#elif defined(JPH_USE_RVV)
286 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
287 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
288 const vbool32_t mask = __riscv_vmfle_vv_f32m1_b32(v1, v2, 3);
289 const vuint32m1_t zeros = __riscv_vmv_v_x_u32m1(0x0, 3);
290 const vuint32m1_t merged = __riscv_vmerge_vxm_u32m1(zeros, 0xFFFFFFFF, mask, 3);
291 __riscv_vse32_v_u32m1(res.
mU32, merged, 3);
297 inV1.
mF32[1] <= inV2.
mF32[1]? 0xffffffffu : 0,
305#if defined(JPH_USE_SSE)
306 return _mm_castps_si128(_mm_cmpgt_ps(inV1.
mValue, inV2.
mValue));
307#elif defined(JPH_USE_NEON)
309#elif defined(JPH_USE_RVV)
311 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
312 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
313 const vbool32_t mask = __riscv_vmfgt_vv_f32m1_b32(v1, v2, 3);
314 const vuint32m1_t zeros = __riscv_vmv_v_x_u32m1(0x0, 3);
315 const vuint32m1_t merged = __riscv_vmerge_vxm_u32m1(zeros, 0xFFFFFFFF, mask, 3);
316 __riscv_vse32_v_u32m1(res.
mU32, merged, 3);
322 inV1.
mF32[1] > inV2.
mF32[1]? 0xffffffffu : 0,
330#if defined(JPH_USE_SSE)
331 return _mm_castps_si128(_mm_cmpge_ps(inV1.
mValue, inV2.
mValue));
332#elif defined(JPH_USE_NEON)
334#elif defined(JPH_USE_RVV)
336 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV1.
mF32, 3);
337 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
338 const vbool32_t mask = __riscv_vmfge_vv_f32m1_b32(v1, v2, 3);
339 const vuint32m1_t zeros = __riscv_vmv_v_x_u32m1(0x0, 3);
340 const vuint32m1_t merged = __riscv_vmerge_vxm_u32m1(zeros, 0xFFFFFFFF, mask, 3);
341 __riscv_vse32_v_u32m1(res.
mU32, merged, 3);
347 inV1.
mF32[1] >= inV2.
mF32[1]? 0xffffffffu : 0,
358 #elif defined(JPH_USE_NEON)
360 #elif defined(JPH_USE_RVV)
362 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inMul1.
mF32, 3);
363 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inMul2.
mF32, 3);
364 const vfloat32m1_t rvv_add = __riscv_vle32_v_f32m1(inAdd.
mF32, 3);
365 const vfloat32m1_t fmadd = __riscv_vfmacc_vv_f32m1(rvv_add, v1, v2, 3);
366 __riscv_vse32_v_f32m1(res.
mF32, fmadd, 3);
369 return inMul1 * inMul2 + inAdd;
372 return inMul1 * inMul2 + inAdd;
378#if defined(JPH_USE_SSE4_1) && !defined(JPH_PLATFORM_WASM)
381#elif defined(JPH_USE_SSE)
382 __m128 is_set = _mm_castsi128_ps(_mm_srai_epi32(inControl.
mValue, 31));
383 Type v = _mm_or_ps(_mm_and_ps(is_set, inSet.
mValue), _mm_andnot_ps(is_set, inNotSet.
mValue));
385#elif defined(JPH_USE_NEON)
386 Type v = vbslq_f32(vreinterpretq_u32_s32(vshrq_n_s32(vreinterpretq_s32_u32(inControl.
mValue), 31)), inSet.
mValue, inNotSet.
mValue);
388#elif defined(JPH_USE_RVV)
390 const vuint32m1_t control = __riscv_vle32_v_u32m1(inControl.
mU32, 3);
391 const vfloat32m1_t not_set = __riscv_vle32_v_f32m1(inNotSet.
mF32, 3);
392 const vfloat32m1_t set = __riscv_vle32_v_f32m1(inSet.
mF32, 3);
395 const vuint32m1_t r = __riscv_vand_vx_u32m1(control, 0x80000000u, 3);
396 const vbool32_t rvv_mask = __riscv_vmsne_vx_u32m1_b32(r, 0x0, 3);
397 const vfloat32m1_t merged = __riscv_vmerge_vvm_f32m1(not_set, set, rvv_mask, 3);
398 __riscv_vse32_v_f32m1(masked.
mF32, merged, 3);
402 for (
int i = 0; i < 3; i++)
403 result.
mF32[i] = (inControl.
mU32[i] & 0x80000000u) ? inSet.
mF32[i] : inNotSet.
mF32[i];
404#ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
413#if defined(JPH_USE_SSE)
415#elif defined(JPH_USE_NEON)
416 return vreinterpretq_f32_u32(vorrq_u32(vreinterpretq_u32_f32(inV1.
mValue), vreinterpretq_u32_f32(inV2.
mValue)));
417#elif defined(JPH_USE_RVV)
419 const vuint32m1_t v1 = __riscv_vle32_v_u32m1(
reinterpret_cast<const uint32 *
>(inV1.
mF32), 3);
420 const vuint32m1_t v2 = __riscv_vle32_v_u32m1(
reinterpret_cast<const uint32 *
>(inV2.
mF32), 3);
421 const vuint32m1_t res = __riscv_vor_vv_u32m1(v1, v2, 3);
422 __riscv_vse32_v_u32m1(
reinterpret_cast<uint32 *
>(or_result.
mF32), res, 3);
431#if defined(JPH_USE_SSE)
433#elif defined(JPH_USE_NEON)
434 return vreinterpretq_f32_u32(veorq_u32(vreinterpretq_u32_f32(inV1.
mValue), vreinterpretq_u32_f32(inV2.
mValue)));
435#elif defined(JPH_USE_RVV)
437 const vuint32m1_t v1 = __riscv_vle32_v_u32m1(
reinterpret_cast<const uint32 *
>(inV1.
mF32), 3);
438 const vuint32m1_t v2 = __riscv_vle32_v_u32m1(
reinterpret_cast<const uint32 *
>(inV2.
mF32), 3);
439 const vuint32m1_t res = __riscv_vxor_vv_u32m1(v1, v2, 3);
440 __riscv_vse32_v_u32m1(
reinterpret_cast<uint32 *
>(xor_result.
mF32), res, 3);
449#if defined(JPH_USE_SSE)
451#elif defined(JPH_USE_NEON)
452 return vreinterpretq_f32_u32(vandq_u32(vreinterpretq_u32_f32(inV1.
mValue), vreinterpretq_u32_f32(inV2.
mValue)));
453#elif defined(JPH_USE_RVV)
455 const vuint32m1_t v1 = __riscv_vle32_v_u32m1(
reinterpret_cast<const uint32 *
>(inV1.
mF32), 3);
456 const vuint32m1_t v2 = __riscv_vle32_v_u32m1(
reinterpret_cast<const uint32 *
>(inV2.
mF32), 3);
457 const vuint32m1_t res = __riscv_vand_vv_u32m1(v1, v2, 3);
458 __riscv_vse32_v_u32m1(
reinterpret_cast<uint32 *
>(and_result.
mF32), res, 3);
472template <
class Random>
475 std::uniform_real_distribution<float> zero_to_one(0.0f, 1.0f);
476 float theta = JPH_PI * zero_to_one(inRandom);
477 float phi = 2.0f * JPH_PI * zero_to_one(inRandom);
488 return (inV2 - *
this).LengthSq() <= inMaxDistSq;
498#if defined(JPH_USE_SSE)
500#elif defined(JPH_USE_NEON)
502#elif defined(JPH_USE_RVV)
504 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
505 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
506 const vfloat32m1_t mul = __riscv_vfmul_vv_f32m1(v1, v2, 3);
507 __riscv_vse32_v_f32m1(res.
mF32, mul, 3);
516#if defined(JPH_USE_SSE)
517 return _mm_mul_ps(
mValue, _mm_set1_ps(inV2));
518#elif defined(JPH_USE_NEON)
519 return vmulq_n_f32(
mValue, inV2);
520#elif defined(JPH_USE_RVV)
522 const vfloat32m1_t src = __riscv_vle32_v_f32m1(
mF32, 3);
523 const vfloat32m1_t mul = __riscv_vfmul_vf_f32m1(src, inV2, 3);
524 __riscv_vse32_v_f32m1(res.
mF32, mul, 3);
533#if defined(JPH_USE_SSE)
534 return _mm_mul_ps(_mm_set1_ps(inV1), inV2.
mValue);
535#elif defined(JPH_USE_NEON)
536 return vmulq_n_f32(inV2.
mValue, inV1);
537#elif defined(JPH_USE_RVV)
539 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
540 const vfloat32m1_t mul = __riscv_vfmul_vf_f32m1(v1, inV1, 3);
541 __riscv_vse32_v_f32m1(res.
mF32, mul, 3);
550#if defined(JPH_USE_SSE)
551 return _mm_div_ps(
mValue, _mm_set1_ps(inV2));
552#elif defined(JPH_USE_NEON)
553 return vdivq_f32(
mValue, vdupq_n_f32(inV2));
554#elif defined(JPH_USE_RVV)
556 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
557 const vfloat32m1_t div = __riscv_vfdiv_vf_f32m1(v1, inV2, 3);
558 __riscv_vse32_v_f32m1(res.
mF32, div, 3);
567#if defined(JPH_USE_SSE)
569#elif defined(JPH_USE_NEON)
571#elif defined(JPH_USE_RVV)
572 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
573 const vfloat32m1_t res = __riscv_vfmul_vf_f32m1(v1, inV2, 3);
574 __riscv_vse32_v_f32m1(
mF32, res, 3);
576 for (
int i = 0; i < 3; ++i)
578 #ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
587#if defined(JPH_USE_SSE)
589#elif defined(JPH_USE_NEON)
591#elif defined(JPH_USE_RVV)
592 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
593 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
594 const vfloat32m1_t rvv_res = __riscv_vfmul_vv_f32m1(v1, v2, 3);
595 __riscv_vse32_v_f32m1(
mF32, rvv_res, 3);
597 for (
int i = 0; i < 3; ++i)
599 #ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
608#if defined(JPH_USE_SSE)
610#elif defined(JPH_USE_NEON)
612#elif defined(JPH_USE_RVV)
613 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
614 const vfloat32m1_t res = __riscv_vfdiv_vf_f32m1(v, inV2, 3);
615 __riscv_vse32_v_f32m1(
mF32, res, 3);
617 for (
int i = 0; i < 3; ++i)
619 #ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
628#if defined(JPH_USE_SSE)
630#elif defined(JPH_USE_NEON)
632#elif defined(JPH_USE_RVV)
634 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
635 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
636 const vfloat32m1_t rvv_add = __riscv_vfadd_vv_f32m1(v1, v2, 3);
637 __riscv_vse32_v_f32m1(res.
mF32, rvv_add, 3);
646#if defined(JPH_USE_SSE)
648#elif defined(JPH_USE_NEON)
650#elif defined(JPH_USE_RVV)
651 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
652 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
653 const vfloat32m1_t rvv_add = __riscv_vfadd_vv_f32m1(v1, v2, 3);
654 __riscv_vse32_v_f32m1(
mF32, rvv_add, 3);
656 for (
int i = 0; i < 3; ++i)
658 #ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
667#if defined(JPH_USE_SSE)
668 return _mm_sub_ps(_mm_setzero_ps(),
mValue);
669#elif defined(JPH_USE_NEON)
670 #ifdef JPH_CROSS_PLATFORM_DETERMINISTIC
671 return vsubq_f32(vdupq_n_f32(0),
mValue);
675#elif defined(JPH_USE_RVV)
676 #ifdef JPH_CROSS_PLATFORM_DETERMINISTIC
678 const vfloat32m1_t rvv_zero = __riscv_vfmv_v_f_f32m1(0.0f, 3);
679 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
680 const vfloat32m1_t rvv_neg = __riscv_vfsub_vv_f32m1(rvv_zero, v, 3);
681 __riscv_vse32_v_f32m1(res.
mF32, rvv_neg, 3);
685 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
686 const vfloat32m1_t rvv_neg = __riscv_vfsgnjn_vv_f32m1(v, v, 3);
687 __riscv_vse32_v_f32m1(res.
mF32, rvv_neg, 3);
691 #ifdef JPH_CROSS_PLATFORM_DETERMINISTIC
701#if defined(JPH_USE_SSE)
703#elif defined(JPH_USE_NEON)
705#elif defined(JPH_USE_RVV)
707 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
708 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
709 const vfloat32m1_t rvv_sub = __riscv_vfsub_vv_f32m1(v1, v2, 3);
710 __riscv_vse32_v_f32m1(res.
mF32, rvv_sub, 3);
719#if defined(JPH_USE_SSE)
721#elif defined(JPH_USE_NEON)
723#elif defined(JPH_USE_RVV)
724 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
725 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
726 const vfloat32m1_t rvv_sub = __riscv_vfsub_vv_f32m1(v1, v2, 3);
727 __riscv_vse32_v_f32m1(
mF32, rvv_sub, 3);
729 for (
int i = 0; i < 3; ++i)
731 #ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
741#if defined(JPH_USE_SSE)
743#elif defined(JPH_USE_NEON)
745#elif defined(JPH_USE_RVV)
747 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(
mF32, 3);
748 const vfloat32m1_t v2 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
749 const vfloat32m1_t rvv_div = __riscv_vfdiv_vv_f32m1(v1, v2, 3);
750 __riscv_vse32_v_f32m1(res.
mF32, rvv_div, 3);
759#if defined(JPH_USE_SSE)
760 return _mm_shuffle_ps(
mValue,
mValue, _MM_SHUFFLE(0, 0, 0, 0));
761#elif defined(JPH_USE_NEON)
762 return vdupq_laneq_f32(
mValue, 0);
763#elif defined(JPH_USE_RVV)
765 const vfloat32m1_t splat = __riscv_vfmv_v_f_f32m1(
mF32[0], 4);
766 __riscv_vse32_v_f32m1(vec.
mF32, splat, 4);
775#if defined(JPH_USE_SSE)
776 return _mm_shuffle_ps(
mValue,
mValue, _MM_SHUFFLE(1, 1, 1, 1));
777#elif defined(JPH_USE_NEON)
778 return vdupq_laneq_f32(
mValue, 1);
779#elif defined(JPH_USE_RVV)
781 const vfloat32m1_t splat = __riscv_vfmv_v_f_f32m1(
mF32[1], 4);
782 __riscv_vse32_v_f32m1(vec.
mF32, splat, 4);
791#if defined(JPH_USE_SSE)
792 return _mm_shuffle_ps(
mValue,
mValue, _MM_SHUFFLE(2, 2, 2, 2));
793#elif defined(JPH_USE_NEON)
794 return vdupq_laneq_f32(
mValue, 2);
795#elif defined(JPH_USE_RVV)
797 const vfloat32m1_t splat = __riscv_vfmv_v_f_f32m1(
mF32[2], 4);
798 __riscv_vse32_v_f32m1(vec.
mF32, splat, 4);
817#if defined(JPH_USE_AVX512)
819#elif defined(JPH_USE_SSE)
820 return _mm_max_ps(_mm_sub_ps(_mm_setzero_ps(),
mValue),
mValue);
821#elif defined(JPH_USE_NEON)
823#elif defined(JPH_USE_RVV)
825 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
826 const vfloat32m1_t rvv_abs = __riscv_vfsgnj_vf_f32m1(v, 1.0, 3);
827 __riscv_vse32_v_f32m1(res.
mF32, rvv_abs, 3);
847 return inA * inB - inC * inD;
853#if defined(JPH_USE_SSE)
854 Type t1 = _mm_shuffle_ps(inV2.
mValue, inV2.
mValue, _MM_SHUFFLE(0, 0, 2, 1));
855 t1 = _mm_mul_ps(t1,
mValue);
857 t2 = _mm_mul_ps(t2, inV2.
mValue);
858 Type t3 = _mm_sub_ps(t1, t2);
859 return _mm_shuffle_ps(t3, t3, _MM_SHUFFLE(0, 0, 2, 1));
860#elif defined(JPH_USE_NEON)
862 t1 = vmulq_f32(t1,
mValue);
864 t2 = vmulq_f32(t2, inV2.
mValue);
865 Type t3 = vsubq_f32(t1, t2);
866 return JPH_NEON_SHUFFLE_F32x4(t3, t3, 1, 2, 0, 0);
867#elif defined(JPH_USE_RVV)
868 const uint32 indices[3] = { 1, 2, 0 };
869 const vuint32m1_t gather_indices = __riscv_vle32_v_u32m1(indices, 3);
870 const vfloat32m1_t v0 = __riscv_vle32_v_f32m1(
mF32, 3);
871 const vfloat32m1_t v1 = __riscv_vle32_v_f32m1(inV2.
mF32, 3);
872 vfloat32m1_t t0 = __riscv_vrgather_vv_f32m1(v1, gather_indices, 3);
873 t0 = __riscv_vfmul_vv_f32m1(t0, v0, 3);
874 vfloat32m1_t t1 = __riscv_vrgather_vv_f32m1(v0, gather_indices, 3);
875 t1 = __riscv_vfmul_vv_f32m1(t1, v1, 3);
876 const vfloat32m1_t sub = __riscv_vfsub_vv_f32m1(t0, t1, 3);
877 const vfloat32m1_t cross = __riscv_vrgather_vv_f32m1(sub, gather_indices, 3);
880 __riscv_vse32_v_f32m1(cross_result.
mF32, cross, 3);
897#if defined(JPH_USE_SSE4_1)
898 #ifdef JPH_CROSS_PLATFORM_DETERMINISTIC
899 Type val = _mm_blend_ps(
mValue, _mm_setzero_ps(), 0x8);
900 Type shuf = _mm_movehdup_ps(val);
901 Type sums = _mm_add_ps(val, shuf);
902 shuf = _mm_movehl_ps(shuf, sums);
908 sums = _mm_add_ps(sums, shuf);
909 return _mm_cvtss_f32(sums);
910#elif defined(JPH_USE_NEON)
912 return vaddvq_f32(v);
913#elif defined(JPH_USE_RVV)
914 const vfloat32m1_t zeros = __riscv_vfmv_v_f_f32m1(0.0f, 3);
915 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
916 const vfloat32m1_t sum = __riscv_vfredosum_vs_f32m1_f32m1(v, zeros, 3);
917 return __riscv_vfmv_f_s_f32m1_f32(sum);
919 #ifdef JPH_CROSS_PLATFORM_DETERMINISTIC
929 return (*
this * inV2).ReduceSum();
954#if defined(JPH_USE_SSE)
955 return _mm_sqrt_ps(
mValue);
956#elif defined(JPH_USE_NEON)
957 return vsqrtq_f32(
mValue);
958#elif defined(JPH_USE_RVV)
960 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
961 const vfloat32m1_t rvv_sqrt = __riscv_vfsqrt_v_f32m1(v, 3);
962 __riscv_vse32_v_f32m1(res.
mF32, rvv_sqrt, 3);
976#if defined(JPH_USE_SSE4_1) && !defined(JPH_PLATFORM_WASM)
978 Type shuf = _mm_movehdup_ps(mul);
979 Type sums = _mm_add_ps(mul, shuf);
980 shuf = _mm_movehl_ps(mul, mul);
981 sums = _mm_add_ps(sums, shuf);
982 Type len_sq = _mm_shuffle_ps(sums, sums, _MM_SHUFFLE(0, 0, 0, 0));
986 Type is_zero = _mm_cmple_ps(len_sq, _mm_set1_ps(FLT_MIN));
987#ifdef JPH_FLOATING_POINT_EXCEPTIONS_ENABLED
988 if (_mm_movemask_ps(is_zero) == 0xf)
991 return _mm_div_ps(
mValue, _mm_sqrt_ps(len_sq));
993 return _mm_blendv_ps(_mm_div_ps(
mValue, _mm_sqrt_ps(len_sq)), inZeroValue.
mValue, is_zero);
995#elif defined(JPH_USE_NEON)
997 mul = vsetq_lane_f32(0, mul, 3);
998 float32x4_t len_sq = vdupq_n_f32(vaddvq_f32(mul));
999 uint32x4_t is_zero = vcleq_f32(len_sq, vdupq_n_f32(FLT_MIN));
1000 return vbslq_f32(is_zero, inZeroValue.
mValue, vdivq_f32(
mValue, vsqrtq_f32(len_sq)));
1001#elif defined(JPH_USE_RVV)
1002 const vfloat32m1_t src = __riscv_vle32_v_f32m1(
mF32, 3);
1003 const vfloat32m1_t zeros = __riscv_vfmv_v_f_f32m1(0.0f, 3);
1004 const vfloat32m1_t mul = __riscv_vfmul_vv_f32m1(src, src, 3);
1005 const vfloat32m1_t sum = __riscv_vfredosum_vs_f32m1_f32m1(mul, zeros, 3);
1006 const float dot = __riscv_vfmv_f_s_f32m1_f32(sum);
1010 const vfloat32m1_t splat = __riscv_vrgather_vx_f32m1(sum, 0, 3);
1011 const vfloat32m1_t length = __riscv_vfsqrt_v_f32m1(splat, 3);
1014 const vfloat32m1_t norm = __riscv_vfdiv_vv_f32m1(src, length, 3);
1015 __riscv_vse32_v_f32m1(v.
mF32, norm, 3);
1019 if (len_sq <= FLT_MIN)
1022 return *
this / JPH::Sqrt(len_sq);
1028 return abs(
LengthSq() - 1.0f) <= inTolerance;
1033#if defined(JPH_USE_AVX512)
1034 return (_mm_fpclass_ps_mask(
mValue, 0b10000001) & 0x7) != 0;
1035#elif defined(JPH_USE_SSE)
1036 return (_mm_movemask_ps(_mm_cmpunord_ps(
mValue,
mValue)) & 0x7) != 0;
1037#elif defined(JPH_USE_NEON)
1038 uint32x4_t mask = JPH_NEON_UINT32x4(1, 1, 1, 0);
1040 return vaddvq_u32(vandq_u32(is_equal, mask)) != 3;
1041#elif defined(JPH_USE_RVV)
1042 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
1043 const vbool32_t mask = __riscv_vmfeq_vv_f32m1_b32(v, v, 3);
1044 const uint32 eq = __riscv_vcpop_m_b32(mask, 3);
1047 return isnan(
mF32[0]) || isnan(
mF32[1]) || isnan(
mF32[2]);
1053#if defined(JPH_USE_SSE)
1054 _mm_store_ss(&outV->
x,
mValue);
1056 _mm_store_ss(&outV->
y, t.
mValue);
1058 _mm_store_ss(&outV->
z, t.
mValue);
1059#elif defined(JPH_USE_NEON)
1060 float32x2_t
xy = vget_low_f32(
mValue);
1061 vst1_f32(&outV->
x,
xy);
1062 vst1q_lane_f32(&outV->
z,
mValue, 2);
1063#elif defined(JPH_USE_RVV)
1064 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 3);
1065 __riscv_vse32_v_f32m1(&outV->
x, v, 3);
1075#if defined(JPH_USE_SSE)
1076 return _mm_cvttps_epi32(
mValue);
1077#elif defined(JPH_USE_NEON)
1078 return vcvtq_u32_f32(
mValue);
1079#elif defined(JPH_USE_RVV)
1081 const vfloat32m1_t v = __riscv_vle32_v_f32m1(
mF32, 4);
1082 const vuint32m1_t cast = __riscv_vfcvt_rtz_xu_f_v_u32m1(v, 4);
1083 __riscv_vse32_v_u32m1(res.
mU32, cast, 4);
1092#if defined(JPH_USE_SSE)
1094#elif defined(JPH_USE_NEON)
1095 return vreinterpretq_u32_f32(
mValue);
1097 return *
reinterpret_cast<const UVec4 *
>(
this);
1117#if defined(JPH_USE_SSE)
1121 __m128 zero = _mm_setzero_ps();
1122 __m128 neg = _mm_sub_ps(zero,
mValue);
1123 __m128 perp_x = _mm_shuffle_ps(_mm_unpackhi_ps(
mValue, zero), neg, _MM_SHUFFLE(0, 0, 1, 0));
1124 __m128 perp_y = _mm_shuffle_ps(_mm_unpackhi_ps(zero,
mValue), neg, _MM_SHUFFLE(1, 1, 1, 0));
1128 __m128 xx = _mm_shuffle_ps(sq, sq, _MM_SHUFFLE(0, 0, 0, 0));
1129 __m128 yy = _mm_shuffle_ps(sq, sq, _MM_SHUFFLE(1, 1, 1, 1));
1130 __m128 zz = _mm_shuffle_ps(sq, sq, _MM_SHUFFLE(2, 2, 2, 2));
1131 __m128 x_gt_y = _mm_cmpgt_ps(xx, yy);
1134#if defined(JPH_USE_SSE4_1) && !defined(JPH_PLATFORM_WASM)
1135 __m128 result = _mm_blendv_ps(perp_y, perp_x, x_gt_y);
1137 __m128 result = _mm_or_ps(_mm_and_ps(x_gt_y, perp_x), _mm_andnot_ps(x_gt_y, perp_y));
1141 __m128 len = _mm_sqrt_ps(_mm_add_ps(_mm_max_ps(xx, yy), zz));
1142 return _mm_div_ps(result, len);
1145 float xx = x * x, yy = y * y, zz = z * z;
1146#ifdef JPH_CROSS_PLATFORM_DETERMINISTIC
1147 Vec3 perp_x(z, 0.0f, 0.0f - x);
1148 Vec3 perp_y(0.0f, z, 0.0f - y);
1150 Vec3 perp_x(z, 0.0f, -x);
1151 Vec3 perp_y(0.0f, z, -y);
1153 return (xx > yy ? perp_x : perp_y) / JPH::Sqrt(max(xx, yy) + zz);
1159#if defined(JPH_USE_AVX512)
1160 Type one = _mm_set1_ps(1.0f);
1161 return _mm_or_ps(_mm_fixupimm_ps(
mValue,
mValue, _mm_set1_epi32(0xA9A90100), 0), one);
1162#elif defined(JPH_USE_SSE)
1163 Type minus_one = _mm_set1_ps(-1.0f);
1164 Type one = _mm_set1_ps(1.0f);
1165 return _mm_or_ps(_mm_and_ps(
mValue, minus_one), one);
1166#elif defined(JPH_USE_NEON)
1167 Type minus_one = vdupq_n_f32(-1.0f);
1168 Type one = vdupq_n_f32(1.0f);
1169 return vreinterpretq_f32_u32(vorrq_u32(vandq_u32(vreinterpretq_u32_f32(
mValue), vreinterpretq_u32_f32(minus_one)), vreinterpretq_u32_f32(one)));
1170#elif defined(JPH_USE_RVV)
1172 const vfloat32m1_t rvv_in = __riscv_vle32_v_f32m1(
mF32, 3);
1173 const vfloat32m1_t rvv_one = __riscv_vfmv_v_f_f32m1(1.0, 3);
1174 const vfloat32m1_t rvv_signs = __riscv_vfsgnj_vv_f32m1(rvv_one, rvv_in, 3);
1175 __riscv_vse32_v_f32m1(res.
mF32, rvv_signs, 3);
1178 return Vec3(std::signbit(
mF32[0])? -1.0f : 1.0f,
1179 std::signbit(
mF32[1])? -1.0f : 1.0f,
1180 std::signbit(
mF32[2])? -1.0f : 1.0f);
1184template <
int X,
int Y,
int Z>
1187 static_assert(X == 1 || X == -1,
"X must be 1 or -1");
1188 static_assert(Y == 1 || Y == -1,
"Y must be 1 or -1");
1189 static_assert(Z == 1 || Z == -1,
"Z must be 1 or -1");
1190 return Vec3::sXor(*
this,
Vec3(X > 0? 0.0f : -0.0f, Y > 0? 0.0f : -0.0f, Z > 0? 0.0f : -0.0f));
1195 constexpr float cOneOverSqrt2 = 0.70710678f;
1196 constexpr uint cNumBits = 14;
1197 constexpr uint cMask = (1 << cNumBits) - 1;
1198 constexpr uint cMaxValue = cMask - 1;
1199 constexpr float cScale = float(cMaxValue) / (2.0f * cOneOverSqrt2);
1205 if (v[max_element] < 0.0f)
1207 value = 0x80000000u;
1212 value |= max_element << 29;
1216 switch (max_element)
1227 value |= compressed.
GetX();
1228 value |= compressed.
GetY() << cNumBits;
1234 constexpr float cOneOverSqrt2 = 0.70710678f;
1235 constexpr uint cNumBits = 14;
1236 constexpr uint cMask = (1u << cNumBits) - 1;
1237 constexpr uint cMaxValue = cMask - 1;
1238 constexpr int cHalfMaxValue = int(cMaxValue >> 1);
1239 constexpr float cScale = 2.0f * cOneOverSqrt2 / float(cMaxValue);
1242 Vec3 v =
Vec3(
float(
int(inValue & cMask) - cHalfMaxValue),
float(
int((inValue >> cNumBits) & cMask) - cHalfMaxValue), 0) * cScale;
1249 if ((inValue & 0x80000000u) != 0)
1253 switch ((inValue >> 29) & 3)
#define JPH_SUPPRESS_WARNINGS_STD_BEGIN
Definition Core.h:439
#define JPH_SUPPRESS_WARNINGS_STD_END
Definition Core.h:452
std::uint64_t uint64
Definition Core.h:515
unsigned int uint
Definition Core.h:510
#define JPH_NAMESPACE_END
Definition Core.h:434
std::uint32_t uint32
Definition Core.h:513
#define JPH_NAMESPACE_BEGIN
Definition Core.h:428
#define xy
Definition HLSLToCPP.h:511
#define JPH_MAKE_HASHABLE(type,...)
Definition HashCombine.h:223
#define JPH_ASSERT(...)
Definition IssueReporting.h:33
JPH_INLINE constexpr To BitCast(const From &inValue)
Simple implementation of C++20 std::bit_cast.
Definition Math.h:239
@ SWIZZLE_Z
Use the Z component.
Definition Swizzle.h:14
@ SWIZZLE_X
Use the X component.
Definition Swizzle.h:12
@ SWIZZLE_UNUSED
We always use the Z component when we don't specifically want to initialize a value,...
Definition Swizzle.h:16
@ SWIZZLE_Y
Use the Y component.
Definition Swizzle.h:13
Vec3 operator*(float inV1, Vec3Arg inV2)
Definition Vec3.inl:531
Class that holds 3 floats. Used as a storage class. Convert to Vec3 for calculations.
Definition Float3.h:13
float y
Definition Float3.h:39
float z
Definition Float3.h:40
float x
Definition Float3.h:38
JPH_INLINE UVec4 Swizzle() const
Swizzle the elements in inV.
JPH_INLINE uint32 GetY() const
Definition UVec4.h:103
static JPH_INLINE UVec4 sAnd(UVec4Arg inV1, UVec4Arg inV2)
Logical and (component wise)
Definition UVec4.inl:292
static JPH_INLINE UVec4 sOr(UVec4Arg inV1, UVec4Arg inV2)
Logical or (component wise)
Definition UVec4.inl:250
JPH_INLINE bool TestAllXYZTrue() const
Test if X, Y and Z components are true (true is when highest bit of component is set)
Definition UVec4.inl:663
Type mValue
Definition UVec4.h:223
JPH_INLINE uint32 GetX() const
Get individual components.
Definition UVec4.h:102
static JPH_INLINE UVec4 sXor(UVec4Arg inV1, UVec4Arg inV2)
Logical xor (component wise)
Definition UVec4.inl:271
JPH_INLINE Vec4 ReinterpretAsFloat() const
Reinterpret UVec4 as a Vec4 (doesn't change the bits)
Definition UVec4.inl:527
uint32 mU32[4]
Definition UVec4.h:224
JPH_INLINE bool IsClose(Vec3Arg inV2, float inMaxDistSq=1.0e-12f) const
Test if two vectors are close.
Definition Vec3.inl:486
static JPH_INLINE Vec3 sMax(Vec3Arg inV1, Vec3Arg inV2)
Return the maximum of each of the components.
Definition Vec3.inl:203
JPH_INLINE float Dot(Vec3Arg inV2) const
Dot product.
Definition Vec3.inl:927
JPH_INLINE Vec3 Normalized() const
Normalize vector.
Definition Vec3.inl:969
static JPH_INLINE Type sFixW(Type inValue)
Internal helper function that ensures that the Z component is replicated to the W component to preven...
Vec4::Type Type
Definition Vec3.h:27
JPH_INLINE bool operator==(Vec3Arg inV2) const
Comparison.
Definition Vec3.inl:481
JPH_INLINE Vec4 SplatX() const
Replicate the X component to all components.
Definition Vec3.inl:757
static JPH_INLINE Vec3 sMin(Vec3Arg inV1, Vec3Arg inV2)
Return the minimum value of each of the components.
Definition Vec3.inl:183
JPH_INLINE Vec3 Cross(Vec3Arg inV2) const
Cross product.
Definition Vec3.inl:851
JPH_INLINE Vec3 GetNormalizedPerpendicular() const
Get normalized vector that is perpendicular to this vector.
Definition Vec3.inl:1115
static Vec3 sRandom(Random &inRandom)
Get random unit vector.
Definition Vec3.inl:473
JPH_INLINE float GetX() const
Get individual components.
Definition Vec3.h:127
JPH_INLINE bool IsNormalized(float inTolerance=1.0e-6f) const
Test if vector is normalized.
Definition Vec3.inl:1026
static JPH_INLINE Vec3 sXor(Vec3Arg inV1, Vec3Arg inV2)
Logical xor (component wise)
Definition Vec3.inl:429
static JPH_INLINE Vec3 sDecompressUnitVector(uint32 inValue)
Decompress a unit vector from a 32 bit value.
Definition Vec3.inl:1232
JPH_INLINE float Length() const
Length of vector.
Definition Vec3.inl:947
static JPH_INLINE UVec4 sGreaterOrEqual(Vec3Arg inV1, Vec3Arg inV2)
Greater than or equal (component wise)
Definition Vec3.inl:328
JPH_INLINE float ReduceMin() const
Get the minimum of X, Y and Z.
Definition Vec3.inl:1101
JPH_INLINE Vec3 & operator-=(Vec3Arg inV2)
Subtract two float vectors (component wise)
Definition Vec3.inl:717
JPH_INLINE float ReduceMax() const
Get the maximum of X, Y and Z.
Definition Vec3.inl:1108
static JPH_INLINE Vec3 sDifferenceOfProducts(Vec3Arg inA, Vec3Arg inB, Vec3Arg inC, Vec3Arg inD)
Calculates inA * inB - inC * inD with more precision when FMA instructions are available....
Definition Vec3.inl:839
static JPH_INLINE UVec4 sLessOrEqual(Vec3Arg inV1, Vec3Arg inV2)
Less than or equal (component wise)
Definition Vec3.inl:278
JPH_INLINE Vec3 operator/(float inV2) const
Divide vector by float.
Definition Vec3.inl:548
friend JPH_INLINE Vec3 operator*(float inV1, Vec3Arg inV2)
Multiply vector with float.
Definition Vec3.inl:531
JPH_INLINE int GetLowestComponentIndex() const
Get index of component with lowest value.
Definition Vec3.inl:805
JPH_INLINE Vec3 & operator/=(float inV2)
Divide vector by float.
Definition Vec3.inl:606
JPH_INLINE Vec4 DotV4(Vec3Arg inV2) const
Dot product, returns the dot product in X, Y, Z and W components.
Definition Vec3.inl:937
JPH_INLINE Vec3 Abs() const
Return the absolute value of each of the components.
Definition Vec3.inl:815
static JPH_INLINE Vec3 sOne()
Vector with all ones.
Definition Vec3.inl:157
JPH_INLINE Vec3 Reciprocal() const
Reciprocal vector (1 / value) for each of the components.
Definition Vec3.inl:834
JPH_INLINE Vec3 NormalizedOr(Vec3Arg inZeroValue) const
Normalize vector or return inZeroValue if the length of the vector is zero.
Definition Vec3.inl:974
JPH_INLINE Vec3 FlipSign() const
Flips the signs of the components, e.g. FlipSign<-1, 1, -1>() will flip the signs of the X and Z comp...
Definition Vec3.inl:1185
JPH_INLINE Vec3 operator+(Vec3Arg inV2) const
Add two float vectors (component wise)
Definition Vec3.inl:626
JPH_INLINE float ReduceSum() const
Get the sum of X, Y and Z.
Definition Vec3.inl:894
JPH_INLINE uint32 CompressUnitVector() const
Compress a unit vector to a 32 bit value, precision is around 10^-4.
Definition Vec3.inl:1193
JPH_INLINE Vec4 SplatZ() const
Replicate the Z component to all components.
Definition Vec3.inl:789
JPH_INLINE Vec3 CrossPrecise(Vec3Arg inV2) const
Cross product (more precise version when FMA is available)
Definition Vec3.inl:889
static JPH_INLINE Vec3 sOr(Vec3Arg inV1, Vec3Arg inV2)
Logical or (component wise)
Definition Vec3.inl:411
static JPH_INLINE UVec4 sGreater(Vec3Arg inV1, Vec3Arg inV2)
Greater than (component wise)
Definition Vec3.inl:303
JPH_INLINE void SetZ(float inZ)
Definition Vec3.h:135
static JPH_INLINE Vec3 sAnd(Vec3Arg inV1, Vec3Arg inV2)
Logical and (component wise)
Definition Vec3.inl:447
JPH_INLINE void CheckW() const
Internal helper function that checks that W is equal to Z, so e.g. dividing by it should not generate...
static JPH_INLINE Vec3 sUnitSpherical(float inTheta, float inPhi)
Definition Vec3.inl:465
JPH_INLINE UVec4 ToInt() const
Convert each component from a float to an int.
Definition Vec3.inl:1073
Type mValue
Definition Vec3.h:308
JPH_INLINE float GetY() const
Definition Vec3.h:128
JPH_INLINE Vec4 SplatY() const
Replicate the Y component to all components.
Definition Vec3.inl:773
JPH_INLINE Vec3 operator-() const
Negate.
Definition Vec3.inl:665
JPH_INLINE void StoreFloat3(Float3 *outV) const
Store 3 floats to memory.
Definition Vec3.inl:1051
JPH_INLINE float LengthSq() const
Squared length of vector.
Definition Vec3.inl:942
float mF32[4]
Definition Vec3.h:309
static JPH_INLINE UVec4 sEquals(Vec3Arg inV1, Vec3Arg inV2)
Equals (component wise)
Definition Vec3.inl:228
JPH_INLINE bool IsNearZero(float inMaxDistSq=1.0e-12f) const
Test if vector is near zero.
Definition Vec3.inl:491
static JPH_INLINE Vec3 sZero()
Vector with all zeros.
Definition Vec3.inl:125
static JPH_INLINE UVec4 sLess(Vec3Arg inV1, Vec3Arg inV2)
Less than (component wise)
Definition Vec3.inl:253
static JPH_INLINE Vec3 sReplicate(float inV)
Replicate inV across all components.
Definition Vec3.inl:141
static JPH_INLINE Vec3 sClamp(Vec3Arg inV, Vec3Arg inMin, Vec3Arg inMax)
Clamp a vector between min and max (component wise)
Definition Vec3.inl:223
JPH_INLINE Vec3 & operator*=(float inV2)
Multiply vector with float.
Definition Vec3.inl:565
JPH_INLINE Vec3 & operator+=(Vec3Arg inV2)
Add two float vectors (component wise)
Definition Vec3.inl:644
static JPH_INLINE Vec3 sSelect(Vec3Arg inNotSet, Vec3Arg inSet, UVec4Arg inControl)
Component wise select, returns inNotSet when highest bit of inControl = 0 and inSet when highest bit ...
Definition Vec3.inl:376
JPH_INLINE bool IsNaN() const
Test if vector contains NaN elements.
Definition Vec3.inl:1031
JPH_INLINE Vec3 Sqrt() const
Component wise square root.
Definition Vec3.inl:952
JPH_INLINE UVec4 ReinterpretAsInt() const
Reinterpret Vec3 as a UVec4 (doesn't change the bits)
Definition Vec3.inl:1090
JPH_INLINE Vec3 DotV(Vec3Arg inV2) const
Dot product, returns the dot product in X, Y and Z components.
Definition Vec3.inl:932
static JPH_INLINE Vec3 sLoadFloat3Unsafe(const Float3 &inV)
Load 3 floats from memory (reads 32 bits extra which it doesn't use)
Definition Vec3.inl:167
JPH_INLINE float GetZ() const
Definition Vec3.h:129
JPH_INLINE Vec3 GetSign() const
Get vector that contains the sign of each element (returns 1.0f if positive, -1.0f if negative)
Definition Vec3.inl:1157
static JPH_INLINE Vec3 sNaN()
Vector with all NaN's.
Definition Vec3.inl:162
Vec3()=default
Constructor.
JPH_INLINE int GetHighestComponentIndex() const
Get index of component with highest value.
Definition Vec3.inl:810
static JPH_INLINE Vec3 sFusedMultiplyAdd(Vec3Arg inMul1, Vec3Arg inMul2, Vec3Arg inAdd)
Calculates inMul1 * inMul2 + inAdd.
Definition Vec3.inl:353
JPH_INLINE Vec3 Swizzle() const
Swizzle the elements in inV.
float mF32[4]
Definition Vec4.h:318
JPH_INLINE float GetX() const
Get individual components.
Definition Vec4.h:119
JPH_INLINE float GetY() const
Definition Vec4.h:120
static JPH_INLINE Vec4 sReplicate(float inV)
Replicate inV across all components.
Definition Vec4.inl:97
void SinCos(Vec4 &outSin, Vec4 &outCos) const
Calculate the sine and cosine for each element of this vector (input in radians)
Definition Vec4.inl:1171