Skip to content

Commit 9356f40

Browse files
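Fixed SIMD smoothstep [sic: the changes below are to the SIMD refract function glm_vec4_refract and its test, not smoothstep]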
1 parent 90f2b02 commit 9356f40

File tree

2 files changed

+22
-9
lines changed

2 files changed

+22
-9
lines changed

glm/simd/geometric.h

+15-9
Original file line number | Diff line number | Diff line change
@@ -102,17 +102,23 @@ GLM_FUNC_QUALIFIER glm_vec4 glm_vec4_reflect(glm_vec4 I, glm_vec4 N)
102102

103103
GLM_FUNC_QUALIFIER __m128 glm_vec4_refract(glm_vec4 I, glm_vec4 N, glm_vec4 eta)
104104
{
105-
glm_vec4 const dot0 = glm_vec4_dot(N, I);
106-
glm_vec4 const mul0 = _mm_mul_ps(eta, eta);
107-
glm_vec4 const mul1 = _mm_mul_ps(dot0, dot0);
108-
glm_vec4 const sub0 = _mm_sub_ps(_mm_set1_ps(1.0f), mul0);
109-
glm_vec4 const sub1 = _mm_sub_ps(_mm_set1_ps(1.0f), mul1);
110-
glm_vec4 const mul2 = _mm_mul_ps(sub0, sub1);
111-
112-
if(_mm_movemask_ps(_mm_cmplt_ss(mul2, _mm_set1_ps(0.0f))) == 0)
105+
// k = 1.0 - eta * eta * (1.0 - dot(N, I) * dot(N, I));
106+
// if (k < 0.0)
107+
// R = genType(0.0); // or genDType(0.0)
108+
// else
109+
// R = eta * I - (eta * dot(N, I) + sqrt(k)) * N;
110+
111+
glm_vec4 const dot0 = glm_vec4_dot(N, I); // dot(N, I)
112+
glm_vec4 const mul0 = _mm_mul_ps(eta, eta); // eta * eta
113+
glm_vec4 const mul1 = _mm_mul_ps(dot0, dot0); // dot(N, I) * dot(N, I)
114+
glm_vec4 const sub1 = _mm_sub_ps(_mm_set1_ps(1.0f), mul1); // (1.0 - dot(N, I) * dot(N, I))
115+
glm_vec4 const mul2 = _mm_mul_ps(mul0, sub1); // eta * eta * (1.0 - dot(N, I) * dot(N, I))
116+
glm_vec4 const sub0 = _mm_sub_ps(_mm_set1_ps(1.0f), mul2); // 1.0 - eta * eta * (1.0 - dot(N, I) * dot(N, I))
117+
118+
if(_mm_movemask_ps(_mm_cmplt_ss(sub0, _mm_set1_ps(0.0f))) == 0)
113119
return _mm_set1_ps(0.0f);
114120

115-
glm_vec4 const sqt0 = _mm_sqrt_ps(mul2);
121+
glm_vec4 const sqt0 = _mm_sqrt_ps(sub0);
116122
glm_vec4 const mad0 = glm_vec4_fma(eta, dot0, sqt0);
117123
glm_vec4 const mul4 = _mm_mul_ps(mad0, N);
118124
glm_vec4 const mul5 = _mm_mul_ps(eta, I);

test/core/core_func_geometric.cpp

+7
Original file line number | Diff line number | Diff line change
@@ -181,6 +181,13 @@ namespace refract
181181
Error += glm::all(glm::equal(C, glm::dvec2(0.0, -1.0), 0.0001)) ? 0 : 1;
182182
}
183183

184+
{
185+
glm::vec4 A(0.0f, -1.0f, 0.0f, 0.0f);
186+
glm::vec4 B(0.0f, 1.0f, 0.0f, 0.0f);
187+
glm::vec4 C = glm::refract(A, B, 0.5f);
188+
Error += glm::all(glm::equal(C, glm::vec4(0.0, -1.0, 0.0f, 0.0f), 0.0001f)) ? 0 : 1;
189+
}
190+
184191
return Error;
185192
}
186193
}//namespace refract

0 commit comments

Comments
 (0)