From 5886fd31719331647ef66e7d565eccedd719aa1a Mon Sep 17 00:00:00 2001 From: Mikhail Katliar Date: Sat, 7 Dec 2024 13:52:13 +0100 Subject: [PATCH] Fixed StaticVectorPointerTest on neon64 (#48) --- include/blast/math/dense/StaticVector.hpp | 176 ++++++++++++ include/blast/math/simd/arch/Neon64.hpp | 17 +- include/blast/math/views/Row.hpp | 267 ++++++++++++++++++ .../math/dense/StaticVectorPointerTest.cpp | 13 +- test/blast/math/views/RowTest.cpp | 2 +- 5 files changed, 456 insertions(+), 19 deletions(-) create mode 100644 include/blast/math/dense/StaticVector.hpp diff --git a/include/blast/math/dense/StaticVector.hpp b/include/blast/math/dense/StaticVector.hpp new file mode 100644 index 00000000..64c19b90 --- /dev/null +++ b/include/blast/math/dense/StaticVector.hpp @@ -0,0 +1,176 @@ +// Copyright (c) 2019-2024 Mikhail Katliar All rights reserved. +// Use of this source code is governed by a BSD-style +// license that can be found in the LICENSE file. + +#pragma once + +#include +#include +#include +#include +#include +#include +#include + +#include +#include + + +namespace blast +{ + /// @brief Vector with statically defined size. + /// + /// @tparam T element type of the vector + /// @tparam N number of elements + /// @tparam TF transpose flag + template + class StaticVector + { + public: + using ElementType = T; + static TransposeFlag constexpr transposeFlag = TF; + + + StaticVector() noexcept + { + // Initialize padding elements to 0 to prevent denorms in calculations. + // Denorms can significantly impair performance, see https://github.com/giaf/blasfeo/issues/103 + std::fill_n(v_, capacity_, T {}); + } + + + StaticVector(T const& v) noexcept + { + std::fill_n(v_, capacity_, v); + } + + + /** + * @brief Construct from an initializer list. + * + * \code + * StaticVector v {1., 2., 3.}; + * \endcode + * + * @param list list of vector elements. If @a list is shorter than @a N, + * the remaining vector elements will be 0. If @a list is longer than @a N, + * the extra elements of @a list will be ignored. + */ + constexpr StaticVector(std::initializer_list list) + { + fill(copy_n(list.begin(), std::min(list.size(), N), std::begin(v_)), std::end(v_), T {}); + } + + + StaticVector& operator=(T val) noexcept + { + std::fill_n(v_, capacity_, val); + + return *this; + } + + + constexpr T const& operator[](size_t i) const noexcept + { + assert(i < N); + return v_[i]; + } + + + constexpr T& operator[](size_t i) + { + assert(i < N); + return v_[i]; + } + + + static size_t constexpr size() noexcept + { + return N; + } + + + T * data() noexcept + { + return v_; + } + + + T const * data() const noexcept + { + return v_; + } + + + /** + * @brief Set all vector elements to 0 + */ + void reset() noexcept + { + std::fill_n(v_, capacity_, T {}); + } + + + private: + static size_t constexpr capacity_ = nextMultiple(N, SimdSize_v); + + // Alignment of the data elements. + static size_t constexpr alignment_ = CACHE_LINE_SIZE; + + // Aligned element storage. + alignas(alignment_) T v_[capacity_]; + + }; + + + template + inline size_t constexpr size(StaticVector const& m) noexcept + { + return N; + } + + + template + inline constexpr T * data(StaticVector& m) noexcept + { + return m.data(); + } + + + template + inline constexpr T const * data(StaticVector const& m) noexcept + { + return m.data(); + } + + + template + inline void reset(StaticVector& m) noexcept + { + m.reset(); + } + + + template + struct IsDenseVector> : std::true_type {}; + + + template + struct IsStatic> : std::true_type {}; + + + template + struct IsAligned> : std::integral_constant {}; + + + template + struct IsPadded> : std::integral_constant {}; + + + template + struct IsStaticallySpaced> : std::integral_constant {}; + + + template + struct Spacing> : std::integral_constant {}; +} diff --git a/include/blast/math/simd/arch/Neon64.hpp b/include/blast/math/simd/arch/Neon64.hpp index 83c23cbc..6c2238f9 100644 --- a/include/blast/math/simd/arch/Neon64.hpp +++ b/include/blast/math/simd/arch/Neon64.hpp @@ -1,16 +1,7 @@ -// Copyright 2024 Mikhail Katliar -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// https://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. +// Copyright (c) 2019-2024 Mikhail Katliar All rights reserved. +// Use of this source code is governed by a BSD-style +// license that can be found in the LICENSE file. + #pragma once #include diff --git a/include/blast/math/views/Row.hpp b/include/blast/math/views/Row.hpp index b9afee98..95da03c5 100644 --- a/include/blast/math/views/Row.hpp +++ b/include/blast/math/views/Row.hpp @@ -6,3 +6,270 @@ #include #include +#include + + +namespace blast +{ + /** + * @brief Row view of a matrix + * + * NOTE: this implementation is not optimized! + * It holds a refrerence to the matrix, as well as a raw pointer, + * the row index, and the column index of the first element. + * Instead it could be just a matrix pointer and the length. + * This would reduce the amount of data needed to represent the @a Row object, + * increasig the possibility of storing everything in registers and reducing + * the number of registers needed. + * + * @tparam MT viewed matrix type + */ + template + class Row + { + public: + static TransposeFlag constexpr transposeFlag = rowVector; + + using ViewedType = MT; + using ElementType = ElementType_t; + + //! Reference to a constant submatrix value. + using ConstReference = ElementType const&; + + //! Reference to a non-constant submatrix value. + using Reference = std::conditional_t, ConstReference, ElementType&>; + + //! Pointer to a constant submatrix value. + using ConstPointer = ElementType const *; + + //! Pointer to a non-constant submatrix value. + using Pointer = std::conditional_t, ConstPointer, ElementType *>; + + + /** + * @brief Constructor + * + * @param matrix the matrix + * @param i row index + * @param j start of the row + * @param n row length + */ + explicit inline constexpr Row(MT& matrix, size_t i, size_t j, size_t n) + : matrix_ {matrix} + , i_ {i} + , j_ {j} + , n_ {n} + , data_ {&matrix(i, j)} + { + BLAST_USER_ASSERT(i_ < rows(matrix_), "Invalid row index"); + BLAST_USER_ASSERT(j_ < columns(matrix_), "Invalid column index"); + BLAST_USER_ASSERT(j_ + n_ <= columns(matrix_), "Invalid row length"); + } + + + Row(Row const&) = default; + + + /** + * @brief Vector assignment + * + * Copies elements from the right-hand side expression + * + * @tparam VT type of right-hand side vector + * + * @param rhs + * + * @return reference to *this + */ + template + Row& operator=(VT const& rhs) + { + assign(*this, rhs); + return *this; + } + + + Reference operator[](size_t j) noexcept + { + BLAST_USER_ASSERT(j_ + j < columns(matrix_), "Invalid vector access index"); + + return matrix_(i_, j_ + j); + } + + + ConstReference operator[](size_t j) const + { + BLAST_USER_ASSERT(j_ + j < columns(matrix_), "Invalid vector access index"); + + return const_cast(matrix_)(i_, j_ + j); + } + + + friend Pointer data(Row& m) noexcept + { + return m.data_; + } + + + friend ConstPointer data(Row const& m) noexcept + { + return m.data_; + } + + + friend size_t constexpr size(Row const& row) noexcept + { + return row.n_; + } + + + /** + * @brief Subvector of a row + * + * @param row the original row + * @param j start index of the subvector within @a row + * @param n length of the subvector + */ + friend auto subvector(Row&& row, size_t j, size_t n) noexcept + { + return Row {row.matrix_, row.i_, row.j_ + j, n}; + } + + + /** + * @brief Subvector of a const row + * + * @param row the original row + * @param j start index of the subvector within @a row + * @param n length of the subvector + */ + friend auto subvector(Row const& row, size_t j, size_t n) noexcept + { + return Row {const_cast(row.matrix_), row.i_, row.j_ + j, n}; + } + + + private: + ViewedType& matrix_; //!< The matrix containing the submatrix. + size_t const i_; + size_t const j_; + size_t const n_; + Pointer const data_; + }; + + + /** + * @brief Specialization for @a Row class + */ + template + struct IsAligned> : std::integral_constant && IsPadded_v> {}; + + + /** + * @brief Specialization for @a Row class + */ + template + struct IsPadded> : std::integral_constant && StorageOrder_v == rowMajor> {}; + + + /** + * @brief Specialization for @a Row class + */ + template + struct IsStatic> : IsStatic {}; + + + /** + * @brief Specialization for @a Row class + */ + template + struct IsDenseVector> : IsDenseMatrix {}; + + + /** + * @brief Specialization for @a Row class + */ + template + struct IsView> : std::integral_constant {}; + + + /** + * @brief Specialization for rows of dense (non-panel) matrices + */ + template + requires IsDenseMatrix_v + struct IsStaticallySpaced> : std::integral_constant || StorageOrder_v == rowMajor> {}; + + + /** + * @brief Specialization for rows of panel matrices + */ + template + requires IsPanelMatrix_v + struct IsStaticallySpaced> : std::integral_constant == columnMajor> {}; + + + /** + * @brief Specialization for rows of dense (non-panel) matrices + */ + template + requires IsDenseMatrix_v && IsStatic_v + struct Spacing> : std::integral_constant == rowMajor ? 1 : Spacing_v> {}; + + + /** + * @brief Specialization for rows of panel matrices + */ + template + requires IsPanelMatrix_v && (StorageOrder_v == columnMajor) + struct Spacing> : std::integral_constant>> {}; + + + /** + * @brief Full row of a matrix + * + * @tparam MT type of the matrix containing the row + * + * @param matrix matrix containing the row + * @param row row index + * + * @return submatrix of @a matrix + */ + template + inline auto row(MT& matrix, size_t row) + { + return Row {matrix, row, 0, columns(matrix)}; + } + + + /** + * @brief Partial row of a matrix + * + * @tparam MT type of the matrix containing the row + * + * @param matrix matrix containing the row + * @param row row index + * @param column row start + * @param n row length + * + * @return submatrix of @a matrix + */ + template + inline auto row(MT& matrix, size_t row, size_t column, size_t n) + { + return Row {matrix, row, column, n}; + } + + + /** + * @brief Set all elements of a row to their default value (0). + * + * @param matrix submatrix to set to 0. + */ + template + inline void reset(Row& row) noexcept + { + for (size_t i = 0; i < size(row); ++i) + row[i] = 0; + } +} diff --git a/test/blast/math/dense/StaticVectorPointerTest.cpp b/test/blast/math/dense/StaticVectorPointerTest.cpp index a8050c8f..b737aa9b 100644 --- a/test/blast/math/dense/StaticVectorPointerTest.cpp +++ b/test/blast/math/dense/StaticVectorPointerTest.cpp @@ -3,7 +3,10 @@ // license that can be found in the LICENSE file. #include -#include +#include +#include +#include +#include #include @@ -18,7 +21,7 @@ namespace blast :: testing using Real = Scalar; - template + template void testSpacingImpl() { StaticVector v; @@ -27,7 +30,7 @@ namespace blast :: testing } - template + template void testGetImpl() { StaticVector v; @@ -37,7 +40,7 @@ namespace blast :: testing } - template + template void testOffsetImpl() { StaticVector v; @@ -56,7 +59,7 @@ namespace blast :: testing StaticMatrix A; size_t constexpr i = 1, j = 2; - auto p = ptr(blaze::subvector(blaze::row(A)), 0); + auto p = ptr(subvector(row(A, i), j, columns(A) - j), 0); ASSERT_EQ(p.get(), &A(i, j)); ASSERT_EQ(p.spacing(), SO == columnMajor ? A.spacing() : 1); } diff --git a/test/blast/math/views/RowTest.cpp b/test/blast/math/views/RowTest.cpp index 17cfced6..61c7eeb8 100644 --- a/test/blast/math/views/RowTest.cpp +++ b/test/blast/math/views/RowTest.cpp @@ -19,7 +19,7 @@ namespace blast :: testing for (size_t i = 0; i < rows(A); ++i) { auto r = row(A, i); - ASSERT_EQ(r.size(), A.columns()); + ASSERT_EQ(size(r), A.columns()); } }