Mercurial > hg > orthanc-stone
annotate OrthancStone/Sources/Toolbox/AlignedMatrix.h @ 2069:5956d7357098 deep-learning
macro ORTHANC_HAS_WASM_SIMD has to be manually defined
author | Sebastien Jodogne <s.jodogne@gmail.com> |
---|---|
date | Fri, 19 May 2023 17:00:17 +0200 |
parents | 22a83fb9dd23 |
children |
rev | line source |
---|---|
2068
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
1 /** |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
2 * Stone of Orthanc |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
3 * Copyright (C) 2012-2016 Sebastien Jodogne, Medical Physics |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
4 * Department, University Hospital of Liege, Belgium |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
5 * Copyright (C) 2017-2022 Osimis S.A., Belgium |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
6 * Copyright (C) 2021-2022 Sebastien Jodogne, ICTEAM UCLouvain, Belgium |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
7 * |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
8 * This program is free software: you can redistribute it and/or |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
9 * modify it under the terms of the GNU Lesser General Public License |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
10 * as published by the Free Software Foundation, either version 3 of |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
11 * the License, or (at your option) any later version. |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
12 * |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
13 * This program is distributed in the hope that it will be useful, but |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
14 * WITHOUT ANY WARRANTY; without even the implied warranty of |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
16 * Lesser General Public License for more details. |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
17 * |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
18 * You should have received a copy of the GNU Lesser General Public |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
19 * License along with this program. If not, see |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
20 * <http://www.gnu.org/licenses/>. |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
21 **/ |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
22 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
23 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
24 #pragma once |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
25 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
26 #include "SimdIncludes.h" |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
27 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
28 #if (ORTHANC_HAS_AVX2 == 1 || ORTHANC_HAS_SSE2 == 1 || ORTHANC_HAS_WASM_SIMD == 1) |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
29 # define ORTHANC_HAS_MATRIX_PRODUCT_TRANSPOSED_VECTORIZED 1 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
30 #else |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
31 # define ORTHANC_HAS_MATRIX_PRODUCT_TRANSPOSED_VECTORIZED 0 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
32 #endif |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
33 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
34 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
35 #include <boost/noncopyable.hpp> |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
36 #include <cassert> |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
37 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
38 namespace OrthancStone |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
39 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
40 /** |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
41 * 2D matrix whose rows are aligned for the largest SIMD |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
42 * instructions that are available. |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
43 **/ |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
44 class AlignedMatrix : public boost::noncopyable |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
45 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
46 private: |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
47 class ProductTransposedVectorizedContext; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
48 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
49 unsigned int rows_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
50 unsigned int cols_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
51 size_t pitch_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
52 size_t pitchFloatPointer_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
53 float* content_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
54 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
55 void Setup(unsigned int rows, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
56 unsigned int cols); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
57 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
58 public: |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
59 AlignedMatrix(unsigned int rows, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
60 unsigned int cols) |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
61 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
62 Setup(rows, cols); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
63 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
64 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
65 ~AlignedMatrix(); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
66 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
67 unsigned int GetRows() const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
68 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
69 return rows_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
70 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
71 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
72 unsigned int GetColumns() const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
73 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
74 return cols_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
75 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
76 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
77 unsigned int GetPitch() const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
78 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
79 return pitch_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
80 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
81 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
82 float* GetRowPointer(unsigned int row) |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
83 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
84 assert(row < rows_); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
85 return content_ + row * pitchFloatPointer_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
86 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
87 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
88 const float* GetRowPointer(unsigned int row) const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
89 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
90 assert(row < rows_); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
91 return content_ + row * pitchFloatPointer_; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
92 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
93 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
94 size_t GetIndex(unsigned int row, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
95 unsigned int col) const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
96 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
97 assert(row < rows_ && col < cols_); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
98 return row * pitchFloatPointer_ + col; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
99 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
100 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
101 float GetValue(unsigned int row, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
102 unsigned int col) const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
103 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
104 return content_[GetIndex(row, col)]; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
105 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
106 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
107 void SetValue(unsigned int row, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
108 unsigned int col, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
109 float value) const |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
110 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
111 content_[GetIndex(row, col)] = value; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
112 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
113 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
114 void AddValue(unsigned int row, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
115 unsigned int col, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
116 float value) |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
117 { |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
118 content_[GetIndex(row, col)] += value; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
119 } |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
120 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
121 void FillZeros(); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
122 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
123 // Computes "C = A * B" without SIMD operations |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
124 static void ProductPlain(AlignedMatrix& c, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
125 const AlignedMatrix& a, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
126 const AlignedMatrix& b); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
127 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
128 #if ORTHANC_HAS_MATRIX_PRODUCT_TRANSPOSED_VECTORIZED == 1 |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
129 // Computes "C = A * B^T" using SIMD operations |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
130 static void ProductTransposedVectorized(AlignedMatrix& c, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
131 const AlignedMatrix& a, |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
132 const AlignedMatrix& bt); |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
133 #endif |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
134 }; |
22a83fb9dd23
added AlignedMatrix and TimerLogger
Sebastien Jodogne <s.jodogne@gmail.com>
parents:
diff
changeset
|
135 } |