49 const scalar_t* B_3x3,
51 matmul3x3_3x1(A_3x3[0], A_3x3[1], A_3x3[2], A_3x3[3], A_3x3[4], A_3x3[5],
52 A_3x3[6], A_3x3[7], A_3x3[8], B_3x3[0], B_3x3[3], B_3x3[6],
53 C_3x3[0], C_3x3[3], C_3x3[6]);
54 matmul3x3_3x1(A_3x3[0], A_3x3[1], A_3x3[2], A_3x3[3], A_3x3[4], A_3x3[5],
55 A_3x3[6], A_3x3[7], A_3x3[8], B_3x3[1], B_3x3[4], B_3x3[7],
56 C_3x3[1], C_3x3[4], C_3x3[7]);
57 matmul3x3_3x1(A_3x3[0], A_3x3[1], A_3x3[2], A_3x3[3], A_3x3[4], A_3x3[5],
58 A_3x3[6], A_3x3[7], A_3x3[8], B_3x3[2], B_3x3[5], B_3x3[8],
59 C_3x3[2], C_3x3[5], C_3x3[8]);
114 scalar_t* output_3x3) {
115 scalar_t det =
det3x3(A_3x3);
119 scalar_t invdet = 1.0 / det;
120 output_3x3[0] = (A_3x3[4] * A_3x3[8] - A_3x3[7] * A_3x3[5]) * invdet;
121 output_3x3[1] = (A_3x3[2] * A_3x3[7] - A_3x3[1] * A_3x3[8]) * invdet;
122 output_3x3[2] = (A_3x3[1] * A_3x3[5] - A_3x3[2] * A_3x3[4]) * invdet;
123 output_3x3[3] = (A_3x3[5] * A_3x3[6] - A_3x3[3] * A_3x3[8]) * invdet;
124 output_3x3[4] = (A_3x3[0] * A_3x3[8] - A_3x3[2] * A_3x3[6]) * invdet;
125 output_3x3[5] = (A_3x3[3] * A_3x3[2] - A_3x3[0] * A_3x3[5]) * invdet;
126 output_3x3[6] = (A_3x3[3] * A_3x3[7] - A_3x3[6] * A_3x3[4]) * invdet;
127 output_3x3[7] = (A_3x3[6] * A_3x3[1] - A_3x3[0] * A_3x3[7]) * invdet;
128 output_3x3[8] = (A_3x3[0] * A_3x3[4] - A_3x3[3] * A_3x3[1]) * invdet;
165 scalar_t* output_3x3) {
166 output_3x3[0] = A_3x3[0];
167 output_3x3[1] = A_3x3[3];
168 output_3x3[2] = A_3x3[6];
170 output_3x3[3] = A_3x3[1];
171 output_3x3[4] = A_3x3[4];
172 output_3x3[5] = A_3x3[7];
174 output_3x3[6] = A_3x3[2];
175 output_3x3[7] = A_3x3[5];
176 output_3x3[8] = A_3x3[8];
181 scalar_t temp_01 = A_4x4[1];
182 scalar_t temp_02 = A_4x4[2];
183 scalar_t temp_03 = A_4x4[3];
184 scalar_t temp_12 = A_4x4[6];
185 scalar_t temp_13 = A_4x4[7];
186 scalar_t temp_23 = A_4x4[11];
189 A_4x4[3] = A_4x4[12];
191 A_4x4[7] = A_4x4[13];
192 A_4x4[11] = A_4x4[14];
203 scalar_t* output_4x4) {
204 output_4x4[0] = A_4x4[0];
205 output_4x4[1] = A_4x4[4];
206 output_4x4[2] = A_4x4[8];
207 output_4x4[3] = A_4x4[12];
209 output_4x4[4] = A_4x4[1];
210 output_4x4[5] = A_4x4[5];
211 output_4x4[6] = A_4x4[9];
212 output_4x4[7] = A_4x4[13];
214 output_4x4[8] = A_4x4[2];
215 output_4x4[9] = A_4x4[6];
216 output_4x4[10] = A_4x4[10];
217 output_4x4[11] = A_4x4[14];
219 output_4x4[12] = A_4x4[3];
220 output_4x4[13] = A_4x4[7];
221 output_4x4[14] = A_4x4[11];
222 output_4x4[15] = A_4x4[15];