Fix all DXC warnings and refactor the CascadeAccumulator (ex 31 still needs to be fixed)

devshgraphicsprogramming · devshgraphicsprogramming · commit 0b6f2694c82c · 2026-04-09T17:41:53.000+02:00
diff --git a/examples_tests b/examples_tests
@@ -1 +1 @@
-Subproject commit 0a3ad464ecdd82b9d7b20b7911979ede7d1f8219
+Subproject commit 5f8dc886911e7672257eb1a6408359bf9f75473d
diff --git a/include/nbl/builtin/hlsl/bxdf/fresnel.hlsl b/include/nbl/builtin/hlsl/bxdf/fresnel.hlsl
@@ -665,9 +665,9 @@ struct iridescent_base
     using vector_type = T;
 
     template<bool SupportsTransmission, typename Colorspace>
-    T __call(const vector_type iork3, const vector_type etak23, const scalar_type clampedCosTheta) NBL_CONST_MEMBER_FUNC
+    T __call(const vector_type _iork3, const vector_type etak23, const scalar_type clampedCosTheta) NBL_CONST_MEMBER_FUNC
     {
-        return impl::iridescent_helper<T,false>::template __call<Colorspace>(D, ior1, ior2, ior3, iork3,
+        return impl::iridescent_helper<T,false>::template __call<Colorspace>(D, ior1, ior2, ior3, _iork3,
                                                             eta12, eta23, etak23, clampedCosTheta);
     }
 
@@ -684,9 +684,9 @@ struct iridescent_base
 
 // workaround due to DXC bug: github.com/microsoft/DirectXShaderCompiler/issues/5966
 template<typename T, bool SupportsTransmission, typename Colorspace>
-T __iridescent_base__call_const(NBL_CONST_REF_ARG(iridescent_base<T>) _this, const T iork3, const T etak23, const typename vector_traits<T>::scalar_type clampedCosTheta)
+T __iridescent_base__call_const(NBL_CONST_REF_ARG(iridescent_base<T>) _this, const T _iork3, const T etak23, const typename vector_traits<T>::scalar_type clampedCosTheta)
 {
-    return _this.template __call<SupportsTransmission, Colorspace>(iork3, etak23, clampedCosTheta);
+    return _this.template __call<SupportsTransmission, Colorspace>(_iork3, etak23, clampedCosTheta);
 }
 }
 
diff --git a/include/nbl/builtin/hlsl/ieee754.hlsl b/include/nbl/builtin/hlsl/ieee754.hlsl
@@ -16,8 +16,8 @@ template<typename Float>
 struct traits_base
 {
 	static_assert(is_same<Float, float16_t>::value || is_same<Float, float32_t>::value || is_same<Float, float64_t>::value);
-	NBL_CONSTEXPR_STATIC_INLINE int16_t exponentBitCnt = int16_t(0xbeef);
-	NBL_CONSTEXPR_STATIC_INLINE int16_t mantissaBitCnt = int16_t(0xbeef);
+	NBL_CONSTEXPR_STATIC_INLINE int16_t exponentBitCnt = (int16_t)0xbeef;
+	NBL_CONSTEXPR_STATIC_INLINE int16_t mantissaBitCnt = (int16_t)0xbeef;
 };
 
 template<>
@@ -73,7 +73,7 @@ template<>
 inline uint32_t extractBiasedExponent(uint64_t x)
 {
 	uint64_t output = (x >> traits<float64_t>::mantissaBitCnt) & (traits<float64_t>::exponentMask >> traits<float64_t>::mantissaBitCnt);
-	return uint32_t(output);
+	return _static_cast<uint32_t>(output);
 }
 
 template<>
@@ -100,7 +100,7 @@ NBL_CONSTEXPR_FUNC T replaceBiasedExponent(T x, typename unsigned_integer_of_siz
 template <typename T>
 NBL_CONSTEXPR_FUNC T fastMulExp2(T x, int n)
 {
-	return replaceBiasedExponent(x, extractBiasedExponent(x) + uint32_t(n));
+	return replaceBiasedExponent(x, extractBiasedExponent(x) + _static_cast<uint32_t>(n));
 }
 
 template <typename T>
diff --git a/include/nbl/builtin/hlsl/limits.hlsl b/include/nbl/builtin/hlsl/limits.hlsl
@@ -215,12 +215,12 @@ struct num_traits<float16_t> : num_base<float16_t>
     float16_t
 #endif
 ;
-    NBL_CONSTEXPR_STATIC_INLINE type      min           = 6.103515e-05F;
-    NBL_CONSTEXPR_STATIC_INLINE type      max           = 65504.0F;
-    NBL_CONSTEXPR_STATIC_INLINE type      denorm_min    = 5.96046448e-08F;
-    NBL_CONSTEXPR_STATIC_INLINE uint16_t  quiet_NaN     = 0x7FFF;
-    NBL_CONSTEXPR_STATIC_INLINE uint16_t  signaling_NaN = 0x7DFF;
-    NBL_CONSTEXPR_STATIC_INLINE uint16_t  infinity      = 0x7C00;
+    NBL_CONSTEXPR_STATIC_INLINE type      min           = (type)6.103515e-05F;
+    NBL_CONSTEXPR_STATIC_INLINE type      max           = (type)65504.0F;
+    NBL_CONSTEXPR_STATIC_INLINE type      denorm_min    = (type)5.96046448e-08F;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t  quiet_NaN     = (uint16_t)0x7FFF;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t  signaling_NaN = (uint16_t)0x7DFF;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t  infinity      = (uint16_t)0x7C00;
 };
 
 template<> 
diff --git a/include/nbl/builtin/hlsl/math/functions.hlsl b/include/nbl/builtin/hlsl/math/functions.hlsl
@@ -51,7 +51,7 @@ struct lp_norm<T,1,true NBL_PARTIAL_REQ_BOT(concepts::FloatingPointLikeVectorial
         array_get<T, scalar_type> getter;
 
         scalar_type retval = abs<scalar_type>(getter(v, 0));
-        for (int i = 1; i < vector_traits<T>::Dimension; i++)
+        for (uint32_t i = 1; i < vector_traits<T>::Dimension; i++)
             retval += abs<scalar_type>(getter(v, i));
         return retval;
     }
diff --git a/include/nbl/builtin/hlsl/math/linalg/basic.hlsl b/include/nbl/builtin/hlsl/math/linalg/basic.hlsl
@@ -4,6 +4,7 @@
 #ifndef __HLSL_VERSION
 #include <nbl/core/math/glslFunctions.h>
 #include "vectorSIMD.h"
+#include <nbl/builtin/hlsl/type_traits.hlsl>
 #endif
 #include <nbl/builtin/hlsl/cpp_compat/intrinsics.hlsl>
 #include <nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl>
@@ -140,7 +141,7 @@ namespace impl
 		{
 			To retval;
 
-			NBL_UNROLL for (int i = 0; i < N; ++i)
+			NBL_UNROLL for (uint16_t i = 0; i < N; ++i)
 			{
 				retval[i] = hlsl::_static_cast<ScalarTo>(vec[i]);
 			}
diff --git a/include/nbl/builtin/hlsl/numbers.hlsl b/include/nbl/builtin/hlsl/numbers.hlsl
@@ -11,33 +11,33 @@ namespace numbers
 {
 
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t e = float_t(2.718281828459045);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t e = (float_t)2.718281828459045;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t log2e = float_t(1.4426950408889634);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t log2e = (float_t)1.4426950408889634;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t log10e = float_t(0.4342944819032518);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t log10e = (float_t)0.4342944819032518;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t pi = float_t(3.141592653589793);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t pi = (float_t)3.141592653589793;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_pi = float_t(0.3183098861837907);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_pi = (float_t)0.3183098861837907;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_sqrtpi = float_t(0.5641895835477563);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_sqrtpi = (float_t)0.5641895835477563;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t ln2 = float_t(0.6931471805599453);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t ln2 = (float_t)0.6931471805599453;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_ln2 = float_t(1.44269504088896);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_ln2 = (float_t)1.44269504088896;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t ln10 = float_t(2.302585092994046);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t ln10 = (float_t)2.302585092994046;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t sqrt2 = float_t(1.4142135623730951);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t sqrt2 = (float_t)1.4142135623730951;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t sqrt3 = float_t(1.7320508075688772);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t sqrt3 = (float_t)1.7320508075688772;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_sqrt3 = float_t(0.5773502691896257);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t inv_sqrt3 = (float_t)0.5773502691896257;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t egamma = float_t(0.5772156649015329);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t egamma = (float_t)0.5772156649015329;
 template <typename float_t>
-NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t phi = float_t(1.618033988749895);
+NBL_CONSTEXPR_INLINE_NSPC_SCOPE_VAR float_t phi = (float_t)1.618033988749895;
 
 }
 }
diff --git a/include/nbl/builtin/hlsl/rwmc/CascadeAccumulator.hlsl b/include/nbl/builtin/hlsl/rwmc/CascadeAccumulator.hlsl
@@ -12,38 +12,45 @@ namespace hlsl
 namespace rwmc
 {
 
-template<typename CascadeLayerType, uint32_t CascadeCountValue, typename SampleCountType = uint16_t NBL_PRIMARY_REQUIRES(concepts::Vector<CascadeLayerType> && concepts::UnsignedIntegralScalar<SampleCountType>)
+template<typename CascadeLayerType, uint16_t CascadeCount, typename SampleCountType = uint16_t NBL_PRIMARY_REQUIRES(concepts::Vector<CascadeLayerType> && concepts::UnsignedIntegralScalar<SampleCountType>)
 struct DefaultCascades
 {
+    // required public interfaces (TODO: a concept for it)
     using layer_type = CascadeLayerType;
     using sample_count_type = SampleCountType;
-    NBL_CONSTEXPR_STATIC_INLINE uint32_t CascadeCount = CascadeCountValue;
+    using weight_t = typename SSplattingParameters::scalar_t;
 
-    sample_count_type cascadeSampleCounter[CascadeCount];
-    CascadeLayerType data[CascadeCount];
+    inline uint16_t getLastCascade() {return CascadeCount-uint16_t(1);}
 
-    void clear(uint32_t cascadeIx)
+    void clear()
     {
-        cascadeSampleCounter[cascadeIx] = sample_count_type(0u);
-        data[cascadeIx] = promote<CascadeLayerType, float32_t>(0.0f);
+        for (uint16_t i=0u; i<CascadeCount; ++i)
+        {
+            __cascadeSampleCounter[i] = sample_count_type(0u);
+            __data[i] = promote<CascadeLayerType,float32_t>(0.0f);
+        }
     }
 
-    void addSampleIntoCascadeEntry(layer_type _sample, uint16_t lowerCascadeIndex, SSplattingParameters::scalar_t lowerCascadeLevelWeight, SSplattingParameters::scalar_t higherCascadeLevelWeight, sample_count_type sampleCount)
+    void addSampleIntoCascadeEntry(const layer_type _sample, const uint16_t lowerCascadeIndex, const weight_t lowerCascadeLevelWeight, const weight_t higherCascadeLevelWeight, const sample_count_type sampleCount)
     {
-        const SSplattingParameters::scalar_t reciprocalSampleCount = SSplattingParameters::scalar_t(1.0f) / SSplattingParameters::scalar_t(sampleCount);
+        const weight_t reciprocalSampleCount = _static_cast<weight_t>(1)/_static_cast<weight_t>(sampleCount);
 
-        sample_count_type lowerCascadeSampleCount = cascadeSampleCounter[lowerCascadeIndex];
-        data[lowerCascadeIndex] += (_sample * lowerCascadeLevelWeight - (sampleCount - lowerCascadeSampleCount) * data[lowerCascadeIndex]) * reciprocalSampleCount;
-        cascadeSampleCounter[lowerCascadeIndex] = sampleCount;
+        sample_count_type lowerCascadeSampleCount = __cascadeSampleCounter[lowerCascadeIndex];
+        __data[lowerCascadeIndex] += (_sample * lowerCascadeLevelWeight - (sampleCount - lowerCascadeSampleCount) * __data[lowerCascadeIndex]) * reciprocalSampleCount;
+        __cascadeSampleCounter[lowerCascadeIndex] = sampleCount;
 
         uint16_t higherCascadeIndex = lowerCascadeIndex + uint16_t(1u);
         if (higherCascadeIndex < CascadeCount)
         {
-            sample_count_type higherCascadeSampleCount = cascadeSampleCounter[higherCascadeIndex];
-            data[higherCascadeIndex] += (_sample * higherCascadeLevelWeight - (sampleCount - higherCascadeSampleCount) * data[higherCascadeIndex]) * reciprocalSampleCount;
-            cascadeSampleCounter[higherCascadeIndex] = sampleCount;
+            sample_count_type higherCascadeSampleCount = __cascadeSampleCounter[higherCascadeIndex];
+            __data[higherCascadeIndex] += (_sample * higherCascadeLevelWeight - (sampleCount - higherCascadeSampleCount) * __data[higherCascadeIndex]) * reciprocalSampleCount;
+            __cascadeSampleCounter[higherCascadeIndex] = sampleCount;
         }
     }
+    
+    // private
+    sample_count_type __cascadeSampleCounter[CascadeCount];
+    CascadeLayerType __data[CascadeCount];
 };
 
 template<typename CascadesType>
@@ -52,19 +59,18 @@ struct CascadeAccumulator
     using scalar_t = typename SSplattingParameters::scalar_t;
     using input_sample_type = typename CascadesType::layer_type;
     using sample_count_type = typename CascadesType::sample_count_type;
+    using weight_t = typename CascadesType::weight_t;
     using this_t = CascadeAccumulator<CascadesType>;
     using cascades_type = CascadesType;
-    NBL_CONSTEXPR_STATIC_INLINE uint16_t CascadeCount = cascades_type::CascadeCount;
-    NBL_CONSTEXPR_STATIC_INLINE scalar_t LastCascade = scalar_t(CascadeCount - 1u);
+
     cascades_type accumulation;
-    
     SSplattingParameters splattingParameters;
 
-    static this_t create(NBL_CONST_REF_ARG(SPackedSplattingParameters) settings)
+    static this_t create(NBL_CONST_REF_ARG(SPackedSplattingParameters) settings, const bool clear=true)
     {
         this_t retval;
-        for (uint16_t i = 0u; i < CascadeCount; ++i)
-            retval.accumulation.clear(i);
+        if (clear)
+            retval.accumulation.clear();
         retval.splattingParameters = settings.unpack();
 
         return retval;
@@ -73,25 +79,27 @@ struct CascadeAccumulator
     // most of this code is stolen from https://cg.ivd.kit.edu/publications/2018/rwmc/tool/split.cpp
     void addSample(const sample_count_type sampleCount, input_sample_type _sample)
     {
-        const scalar_t luma = splattingParameters.calcLuma<input_sample_type>(_sample);
-        const scalar_t log2Luma = log2<scalar_t>(luma);
+        const uint16_t lastCascade = accumulation.getLastCascade();
+
+        const weight_t luma = splattingParameters.calcLuma<input_sample_type>(_sample);
+        const weight_t log2Luma = hlsl::log2<weight_t>(luma);
         const scalar_t cascade = log2Luma * splattingParameters.RcpLog2Base - splattingParameters.Log2BaseRootOfStart;
-        const scalar_t clampedCascade = clamp(cascade, scalar_t(0), LastCascade);
-        const scalar_t clampedCascadeFloor = floor<scalar_t>(clampedCascade);
+        const scalar_t clampedCascade = hlsl::clamp<scalar_t>(cascade, scalar_t(0), lastCascade);
+        const scalar_t clampedCascadeFloor = hlsl::floor(clampedCascade);
         // c<=0 -> 0, c>=Count-1 -> Count-1 
-        uint16_t lowerCascadeIndex = uint16_t(clampedCascadeFloor);
+        const uint16_t lowerCascadeIndex = _static_cast<uint16_t>(clampedCascadeFloor);
         // 0 whenever clamped or `cascade` is integer (when `clampedCascade` is integer)
-        scalar_t higherCascadeWeight = clampedCascade - clampedCascadeFloor;
+        const weight_t higherCascadeWeight = _static_cast<weight_t>(clampedCascade - clampedCascadeFloor);
         // never 0 thanks to magic of `1-fract(x)`
-        scalar_t lowerCascadeWeight = scalar_t(1) - higherCascadeWeight;
+        weight_t lowerCascadeWeight = weight_t(1) - higherCascadeWeight;
 
         // handle super bright sample case
-        if (cascade > LastCascade)
-            lowerCascadeWeight = exp2(splattingParameters.BrightSampleLumaBias - log2Luma);
+        if (cascade > lastCascade)
+            lowerCascadeWeight = hlsl::exp2(_static_cast<weight_t>(splattingParameters.BrightSampleLumaBias - log2Luma));
 
         accumulation.addSampleIntoCascadeEntry(_sample, lowerCascadeIndex, lowerCascadeWeight, higherCascadeWeight, sampleCount);
     }
-
+     
     
 };
 
diff --git a/include/nbl/builtin/hlsl/rwmc/SplattingParameters.hlsl b/include/nbl/builtin/hlsl/rwmc/SplattingParameters.hlsl
@@ -12,6 +12,7 @@ namespace hlsl
 namespace rwmc
 {
 
+// TODO: template both on the ScalarType
 struct SSplattingParameters
 {
     using scalar_t = float32_t;
@@ -20,9 +21,9 @@ struct SSplattingParameters
     scalar_t BrightSampleLumaBias;
 
     template<typename CascadeLayerType, typename Colorspace = colorspace::scRGB>
-    scalar_t calcLuma(NBL_CONST_REF_ARG(CascadeLayerType) col)
+    typename vector_traits<CascadeLayerType>::scalar_type calcLuma(NBL_CONST_REF_ARG(CascadeLayerType) col)
     {
-        return hlsl::dot<CascadeLayerType>(hlsl::transpose(Colorspace::ToXYZ())[1], col);
+        return hlsl::dot(_static_cast<CascadeLayerType>(hlsl::transpose(Colorspace::ToXYZ())[1]), col);
     }
 };
 
diff --git a/include/nbl/builtin/hlsl/tgmath/impl.hlsl b/include/nbl/builtin/hlsl/tgmath/impl.hlsl
@@ -393,10 +393,10 @@ struct erf_helper<float16_t>
 	static float16_t __call(float16_t _x)
 	{
 		// A&S approximation to 2.5x10-5
-		const float16_t a1 = float16_t(0.3480242f);
-		const float16_t a2 = float16_t(-0.0958798f);
-		const float16_t a3 = float16_t(0.7478556f);
-		const float16_t p = float16_t(0.47047f);
+		const float16_t a1 = _static_cast<float16_t>(0.3480242f);
+		const float16_t a2 = _static_cast<float16_t>(-0.0958798f);
+		const float16_t a3 = _static_cast<float16_t>(0.7478556f);
+		const float16_t p = _static_cast<float16_t>(0.47047f);
 
 		float16_t _sign = float16_t(sign<float16_t>(_x));
 		float16_t x = abs_helper<float16_t>::__call(_x);
diff --git a/include/nbl/builtin/hlsl/type_traits.hlsl b/include/nbl/builtin/hlsl/type_traits.hlsl
@@ -861,6 +861,25 @@ using float_of_size_t = typename float_of_size<bytesize>::type;
 // deal with typetraits, for now we rely on Clang/DXC internal __decltype(), if it breaks we revert to commit e4ab38ca227b15b2c79641c39161f1f922b779a3
 #ifdef __HLSL_VERSION
 
+// This partial specialization exists to silence a pile of DXC warnings about the precision of conversions between fundamental types (it casts explicitly)
+namespace nbl
+{
+namespace hlsl
+{
+namespace impl
+{
+template<typename To, typename From>
+struct static_cast_helper<To,From,enable_if_t<is_fundamental_v<To>&&is_fundamental_v<From>,void> >
+{
+    NBL_CONSTEXPR_STATIC_INLINE To cast(From u)
+    {
+        return (To)u;
+    }
+};
+}
+}
+}
+
 #define alignof(expr) ::nbl::hlsl::alignment_of_v<__decltype(expr)>
 
 // shoudl really return a std::type_info like struct or something, but no `constexpr` and unsure whether its possible to have a `const static SomeStruct` makes it hard to do...

Original file line number	Diff line number	Diff line change
`@@ -665,9 +665,9 @@ struct iridescent_base`
`665`	`665`	`using vector_type = T;`
`666`	`666`
`667`	`667`	`template<bool SupportsTransmission, typename Colorspace>`
`668`		`- T __call(const vector_type iork3, const vector_type etak23, const scalar_type clampedCosTheta) NBL_CONST_MEMBER_FUNC`
	`668`	`+ T __call(const vector_type _iork3, const vector_type etak23, const scalar_type clampedCosTheta) NBL_CONST_MEMBER_FUNC`
`669`	`669`	`{`
`670`		`- return impl::iridescent_helper<T,false>::template __call<Colorspace>(D, ior1, ior2, ior3, iork3,`
	`670`	`+ return impl::iridescent_helper<T,false>::template __call<Colorspace>(D, ior1, ior2, ior3, _iork3,`
`671`	`671`	`eta12, eta23, etak23, clampedCosTheta);`
`672`	`672`	`}`
`673`	`673`
`@@ -684,9 +684,9 @@ struct iridescent_base`
`684`	`684`
`685`	`685`	`// workaround due to DXC bug: github.com/microsoft/DirectXShaderCompiler/issues/5966`
`686`	`686`	`template<typename T, bool SupportsTransmission, typename Colorspace>`
`687`		`-T __iridescent_base__call_const(NBL_CONST_REF_ARG(iridescent_base<T>) _this, const T iork3, const T etak23, const typename vector_traits<T>::scalar_type clampedCosTheta)`
	`687`	`+T __iridescent_base__call_const(NBL_CONST_REF_ARG(iridescent_base<T>) _this, const T _iork3, const T etak23, const typename vector_traits<T>::scalar_type clampedCosTheta)`
`688`	`688`	`{`
`689`		`- return _this.template __call<SupportsTransmission, Colorspace>(iork3, etak23, clampedCosTheta);`
	`689`	`+ return _this.template __call<SupportsTransmission, Colorspace>(_iork3, etak23, clampedCosTheta);`
`690`	`690`	`}`
`691`	`691`	`}`
`692`	`692`
Original file line number	Diff line number	Diff line change
`@@ -16,8 +16,8 @@ template<typename Float>`
`16`	`16`	`struct traits_base`
`17`	`17`	`{`
`18`	`18`	`static_assert(is_same<Float, float16_t>::value \|\| is_same<Float, float32_t>::value \|\| is_same<Float, float64_t>::value);`
`19`		`- NBL_CONSTEXPR_STATIC_INLINE int16_t exponentBitCnt = int16_t(0xbeef);`
`20`		`- NBL_CONSTEXPR_STATIC_INLINE int16_t mantissaBitCnt = int16_t(0xbeef);`
	`19`	`+ NBL_CONSTEXPR_STATIC_INLINE int16_t exponentBitCnt = (int16_t)0xbeef;`
	`20`	`+ NBL_CONSTEXPR_STATIC_INLINE int16_t mantissaBitCnt = (int16_t)0xbeef;`
`21`	`21`	`};`
`22`	`22`
`23`	`23`	`template<>`
`@@ -73,7 +73,7 @@ template<>`
`73`	`73`	`inline uint32_t extractBiasedExponent(uint64_t x)`
`74`	`74`	`{`
`75`	`75`	`uint64_t output = (x >> traits<float64_t>::mantissaBitCnt) & (traits<float64_t>::exponentMask >> traits<float64_t>::mantissaBitCnt);`
`76`		`- return uint32_t(output);`
	`76`	`+ return _static_cast<uint32_t>(output);`
`77`	`77`	`}`
`78`	`78`
`79`	`79`	`template<>`
`@@ -100,7 +100,7 @@ NBL_CONSTEXPR_FUNC T replaceBiasedExponent(T x, typename unsigned_integer_of_siz`
`100`	`100`	`template <typename T>`
`101`	`101`	`NBL_CONSTEXPR_FUNC T fastMulExp2(T x, int n)`
`102`	`102`	`{`
`103`		`- return replaceBiasedExponent(x, extractBiasedExponent(x) + uint32_t(n));`
	`103`	`+ return replaceBiasedExponent(x, extractBiasedExponent(x) + _static_cast<uint32_t>(n));`
`104`	`104`	`}`
`105`	`105`
`106`	`106`	`template <typename T>`
Original file line number	Diff line number	Diff line change
`@@ -51,7 +51,7 @@ struct lp_norm<T,1,true NBL_PARTIAL_REQ_BOT(concepts::FloatingPointLikeVectorial`
`51`	`51`	`array_get<T, scalar_type> getter;`
`52`	`52`
`53`	`53`	`scalar_type retval = abs<scalar_type>(getter(v, 0));`
`54`		`- for (int i = 1; i < vector_traits<T>::Dimension; i++)`
	`54`	`+ for (uint32_t i = 1; i < vector_traits<T>::Dimension; i++)`
`55`	`55`	`retval += abs<scalar_type>(getter(v, i));`
`56`	`56`	`return retval;`
`57`	`57`	`}`
Original file line number	Diff line number	Diff line change
`@@ -4,6 +4,7 @@`
`4`	`4`	`#ifndef __HLSL_VERSION`
`5`	`5`	`#include <nbl/core/math/glslFunctions.h>`
`6`	`6`	`#include "vectorSIMD.h"`
	`7`	`+#include <nbl/builtin/hlsl/type_traits.hlsl>`
`7`	`8`	`#endif`
`8`	`9`	`#include <nbl/builtin/hlsl/cpp_compat/intrinsics.hlsl>`
`9`	`10`	`#include <nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl>`
`@@ -140,7 +141,7 @@ namespace impl`
`140`	`141`	`{`
`141`	`142`	`To retval;`
`142`	`143`
`143`		`- NBL_UNROLL for (int i = 0; i < N; ++i)`
	`144`	`+ NBL_UNROLL for (uint16_t i = 0; i < N; ++i)`
`144`	`145`	`{`
`145`	`146`	`retval[i] = hlsl::_static_cast<ScalarTo>(vec[i]);`
`146`	`147`	`}`
Original file line number	Diff line number	Diff line change
`@@ -12,6 +12,7 @@ namespace hlsl`
`12`	`12`	`namespace rwmc`
`13`	`13`	`{`
`14`	`14`
	`15`	`+// TODO: template both on the ScalarType`
`15`	`16`	`struct SSplattingParameters`
`16`	`17`	`{`
`17`	`18`	`using scalar_t = float32_t;`
`@@ -20,9 +21,9 @@ struct SSplattingParameters`
`20`	`21`	`scalar_t BrightSampleLumaBias;`
`21`	`22`
`22`	`23`	`template<typename CascadeLayerType, typename Colorspace = colorspace::scRGB>`
`23`		`- scalar_t calcLuma(NBL_CONST_REF_ARG(CascadeLayerType) col)`
	`24`	`+ typename vector_traits<CascadeLayerType>::scalar_type calcLuma(NBL_CONST_REF_ARG(CascadeLayerType) col)`
`24`	`25`	`{`
`25`		`- return hlsl::dot<CascadeLayerType>(hlsl::transpose(Colorspace::ToXYZ())[1], col);`
	`26`	`+ return hlsl::dot(_static_cast<CascadeLayerType>(hlsl::transpose(Colorspace::ToXYZ())[1]), col);`
`26`	`27`	`}`
`27`	`28`	`};`
`28`	`29`