Created transpose partial spec for emulated matrices

Przemog1 · Przemog1 · commit 03c90422fb87 · 2024-12-17T21:51:34.000+01:00
diff --git a/include/nbl/builtin/hlsl/cpp_compat/impl/intrinsics_impl.hlsl b/include/nbl/builtin/hlsl/cpp_compat/impl/intrinsics_impl.hlsl
@@ -2,6 +2,7 @@
 #define _NBL_BUILTIN_HLSL_CPP_COMPAT_IMPL_INTRINSICS_IMPL_INCLUDED_
 
 #include <nbl/builtin/hlsl/cpp_compat/basic.h>
+#include <nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl>
 #include <nbl/builtin/hlsl/concepts.hlsl>
 
 namespace nbl
@@ -362,6 +363,24 @@ struct lerp_helper<vector<T, N>, vector<bool, N> >
 	}
 };
 
+template<typename Matrix>
+struct transpose_helper;
+
+template<typename T, int N, int M>
+struct transpose_helper<matrix<T, N, M> >
+{
+	using transposed_t = typename matrix_traits<matrix<T, N, M> >::transposed_type;
+
+	static transposed_t transpose(NBL_CONST_REF_ARG(matrix<T, N, M>) m)
+	{
+#ifdef __HLSL_VERSION
+		return spirv::transpose(m);
+#else
+		return reinterpret_cast<transposed_t&>(glm::transpose(reinterpret_cast<typename matrix<T, N, M>::Base const&>(m)));
+#endif
+	}
+};
+
 }
 }
 }
diff --git a/include/nbl/builtin/hlsl/cpp_compat/intrinsics.hlsl b/include/nbl/builtin/hlsl/cpp_compat/intrinsics.hlsl
@@ -8,6 +8,7 @@
 #include <nbl/builtin/hlsl/spirv_intrinsics/core.hlsl>
 #include <nbl/builtin/hlsl/spirv_intrinsics/glsl.std.450.hlsl>
 #include <nbl/builtin/hlsl/cpp_compat/impl/intrinsics_impl.hlsl>
+#include <nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl>
 
 #ifndef __HLSL_VERSION
 #include <algorithm>
@@ -121,14 +122,10 @@ inline T lerp(NBL_CONST_REF_ARG(T) x, NBL_CONST_REF_ARG(T) y, NBL_CONST_REF_ARG(
 }
 
 // transpose not defined cause its implemented via hidden friend
-template<typename T, uint16_t N, uint16_t M>
-inline matrix<T, M, N> transpose(NBL_CONST_REF_ARG(matrix<T, N, M>) m)
+template<typename Matrix>
+inline typename matrix_traits<Matrix>::transposed_type transpose(NBL_CONST_REF_ARG(Matrix) m)
 {
-#ifdef __HLSL_VERSION
-	return spirv::transpose(m);
-#else
-	return reinterpret_cast<matrix<T, M, N>&>(glm::transpose(reinterpret_cast<typename matrix<T, N, M>::Base const&>(m)));
-#endif
+	return cpp_compat_intrinsics_impl::transpose_helper<Matrix>::transpose(m);
 }
 
 template<typename T>
diff --git a/include/nbl/builtin/hlsl/emulated/float64_t_impl.hlsl b/include/nbl/builtin/hlsl/emulated/float64_t_impl.hlsl
@@ -153,12 +153,12 @@ NBL_CONSTEXPR_INLINE_FUNC bool areBothInfinity(uint64_t lhs, uint64_t rhs)
 
 NBL_CONSTEXPR_INLINE_FUNC bool areBothZero(uint64_t lhs, uint64_t rhs)
 {
-    return ((lhs << 1) == 0ull) && ((rhs << 1) == 0ull);
+    return !bool((lhs | rhs) << 1);
 }
 
 NBL_CONSTEXPR_INLINE_FUNC bool areBothSameSignZero(uint64_t lhs, uint64_t rhs)
 {
-    return ((lhs << 1) == 0ull) && (lhs == rhs);
+    return !bool((lhs) << 1) && (lhs == rhs);
 }
 
 enum OperatorType
diff --git a/include/nbl/builtin/hlsl/emulated/matrix_t.hlsl b/include/nbl/builtin/hlsl/emulated/matrix_t.hlsl
@@ -2,6 +2,7 @@
 #define _NBL_BUILTIN_HLSL_EMULATED_MATRIX_T_HLSL_INCLUDED_
 
 #include <nbl/builtin/hlsl/portable/float64_t.hlsl>
+#include <nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl>
 
 namespace nbl
 {
@@ -20,7 +21,7 @@ struct emulated_matrix
 
     vec_t rows[RowCount];
 
-    transposed_t getTransposed()
+    transposed_t getTransposed() NBL_CONST_MEMBER_FUNC
     {
         static nbl::hlsl::array_get<typename this_t::vec_t, T> getter;
         static nbl::hlsl::array_set<typename transposed_t::vec_t, T> setter;
@@ -47,8 +48,29 @@ using emulated_matrix_t4x4 = emulated_matrix<EmulatedType, 4, 4>;
 template<typename EmulatedType>
 using emulated_matrix_t3x4 = emulated_matrix<EmulatedType, 3, 4>;
 
+// I chose to implement it this way because of this DXC bug: https://github.com/microsoft/DirectXShaderCompiler/issues/7007
+#define DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(ROW_COUNT, COLUMN_COUNT) \
+template<typename T> \
+struct matrix_traits<emulated_matrix<T, ROW_COUNT, COLUMN_COUNT> > \
+{ \
+    using scalar_type = T; \
+    using row_type = vector<T, COLUMN_COUNT>; \
+    using transposed_type = emulated_matrix<T, COLUMN_COUNT, ROW_COUNT>; \
+    NBL_CONSTEXPR_STATIC_INLINE uint32_t RowCount = ROW_COUNT; \
+    NBL_CONSTEXPR_STATIC_INLINE uint32_t ColumnCount = COLUMN_COUNT; \
+    NBL_CONSTEXPR_STATIC_INLINE bool Square = RowCount == ColumnCount; \
+};
+
+DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(2, 2)
+DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(3, 3)
+DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(4, 4)
+DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(3, 4)
+
+#undef DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION
+
 namespace emulated_matrix_impl
 {
+// TODO: move to cpp_compat/impl/intrinsics_impl.hlsl
 template<typename LhsT, typename RhsT>
 struct mul_helper
 {
@@ -77,8 +99,24 @@ struct mul_helper<emulated_matrix<ComponentT, RowCount, ColumnCount>, emulated_v
         return output;
     }
 };
+
+}
+
+namespace cpp_compat_intrinsics_impl
+{
+template<typename T, int N, int M>
+struct transpose_helper<emulated_matrix<T, N, M> >
+{
+    using transposed_t = typename matrix_traits<emulated_matrix<T, N, M> >::transposed_type;
+
+	static transposed_t transpose(NBL_CONST_REF_ARG(emulated_matrix<T, N, M>) m)
+	{
+        return m.getTransposed();
+	}
+};
 }
 
+// TODO: move to cpp_compat/intrinsics.hlsl
 // TODO: concepts, to ensure that LhsT is a matrix and RhsT is a vector type
 template<typename MatT, typename VecT>
 VecT mul(MatT mat, VecT vec)
diff --git a/include/nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl b/include/nbl/builtin/hlsl/matrix_utils/matrix_traits.hlsl
@@ -1,7 +1,8 @@
 #ifndef _NBL_BUILTIN_HLSL_MATRIX_UTILS_MATRIX_TRAITS_INCLUDED_
 #define _NBL_BUILTIN_HLSL_MATRIX_UTILS_MATRIX_TRAITS_INCLUDED_
 
-#include <nbl/builtin/hlsl/cpp_compat.hlsl>
+#include <nbl/builtin/hlsl/cpp_compat/basic.h>
+#include <nbl/builtin/hlsl/cpp_compat/matrix.hlsl>
 
 namespace nbl
 {
@@ -18,6 +19,7 @@ struct matrix_traits<matrix<T, ROW_COUNT, COLUMN_COUNT> > \
 { \
     using scalar_type = T; \
     using row_type = vector<T, COLUMN_COUNT>; \
+    using transposed_type = matrix<T, COLUMN_COUNT, ROW_COUNT>; \
     NBL_CONSTEXPR_STATIC_INLINE uint32_t RowCount = ROW_COUNT; \
     NBL_CONSTEXPR_STATIC_INLINE uint32_t ColumnCount = COLUMN_COUNT; \
     NBL_CONSTEXPR_STATIC_INLINE bool Square = RowCount == ColumnCount; \
@@ -28,6 +30,8 @@ DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(3, 3)
 DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(4, 4)
 DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION(3, 4)
 
+#undef DEFINE_MATRIX_TRAITS_TEMPLATE_SPECIALIZATION
+
 // TODO: when this bug: https://github.com/microsoft/DirectXShaderCompiler/issues/7007 is fixed, uncomment and delete template specializations
 /*template<typename T, uint32_t N, uint32_t M>
 struct matrix_traits<matrix<T,N,M> >

Original file line number	Diff line number	Diff line change
`@@ -153,12 +153,12 @@ NBL_CONSTEXPR_INLINE_FUNC bool areBothInfinity(uint64_t lhs, uint64_t rhs)`
`153`	`153`
`154`	`154`	`NBL_CONSTEXPR_INLINE_FUNC bool areBothZero(uint64_t lhs, uint64_t rhs)`
`155`	`155`	`{`
`156`		`- return ((lhs << 1) == 0ull) && ((rhs << 1) == 0ull);`
	`156`	`+ return !bool((lhs \| rhs) << 1);`
`157`	`157`	`}`
`158`	`158`
`159`	`159`	`NBL_CONSTEXPR_INLINE_FUNC bool areBothSameSignZero(uint64_t lhs, uint64_t rhs)`
`160`	`160`	`{`
`161`		`- return ((lhs << 1) == 0ull) && (lhs == rhs);`
	`161`	`+ return !bool((lhs) << 1) && (lhs == rhs);`
`162`	`162`	`}`
`163`	`163`
`164`	`164`	`enum OperatorType`