32 #include "NE10_types.h" 37 ne10_result_t ne10_mulmat_2x2f_c (ne10_mat2x2f_t * dst, ne10_mat2x2f_t * src1, ne10_mat2x2f_t * src2, ne10_uint32_t count)
39 #define A1 src1[ itr ].c1.r1 40 #define A2 src2[ itr ].c1.r1 41 #define B1 src1[ itr ].c1.r2 42 #define B2 src2[ itr ].c1.r2 43 #define C1 src1[ itr ].c2.r1 44 #define C2 src2[ itr ].c2.r1 45 #define D1 src1[ itr ].c2.r2 46 #define D2 src2[ itr ].c2.r2 48 NE10_X_OPERATION_FLOAT_C
50 dst[ itr ].c1.r1 = (A1 * A2) + (C1 * B2);
51 dst[ itr ].c1.r2 = (B1 * A2) + (D1 * B2);
53 dst[ itr ].c2.r1 = (A1 * C2) + (C1 * D2);
54 dst[ itr ].c2.r2 = (B1 * C2) + (D1 * D2);
67 ne10_result_t ne10_mulmat_3x3f_c (ne10_mat3x3f_t * dst, ne10_mat3x3f_t * src1, ne10_mat3x3f_t * src2, ne10_uint32_t count)
69 #define A1 src1[ itr ].c1.r1 70 #define A2 src2[ itr ].c1.r1 71 #define B1 src1[ itr ].c1.r2 72 #define B2 src2[ itr ].c1.r2 73 #define C1 src1[ itr ].c1.r3 74 #define C2 src2[ itr ].c1.r3 75 #define D1 src1[ itr ].c2.r1 76 #define D2 src2[ itr ].c2.r1 77 #define E1 src1[ itr ].c2.r2 78 #define E2 src2[ itr ].c2.r2 79 #define F1 src1[ itr ].c2.r3 80 #define F2 src2[ itr ].c2.r3 81 #define G1 src1[ itr ].c3.r1 82 #define G2 src2[ itr ].c3.r1 83 #define H1 src1[ itr ].c3.r2 84 #define H2 src2[ itr ].c3.r2 85 #define I1 src1[ itr ].c3.r3 86 #define I2 src2[ itr ].c3.r3 88 NE10_X_OPERATION_FLOAT_C
90 dst[ itr ].c1.r1 = (A1 * A2) + (D1 * B2) + (G1 * C2);
91 dst[ itr ].c1.r2 = (B1 * A2) + (E1 * B2) + (H1 * C2);
92 dst[ itr ].c1.r3 = (C1 * A2) + (F1 * B2) + (I1 * C2);
94 dst[ itr ].c2.r1 = (A1 * D2) + (D1 * E2) + (G1 * F2);
95 dst[ itr ].c2.r2 = (B1 * D2) + (E1 * E2) + (H1 * F2);
96 dst[ itr ].c2.r3 = (C1 * D2) + (F1 * E2) + (I1 * F2);
98 dst[ itr ].c3.r1 = (A1 * G2) + (D1 * H2) + (G1 * I2);
99 dst[ itr ].c3.r2 = (B1 * G2) + (E1 * H2) + (H1 * I2);
100 dst[ itr ].c3.r3 = (C1 * G2) + (F1 * H2) + (I1 * I2);
123 ne10_result_t ne10_mulmat_4x4f_c (ne10_mat4x4f_t * dst, ne10_mat4x4f_t * src1, ne10_mat4x4f_t * src2, ne10_uint32_t count)
125 #define A1 src1[ itr ].c1.r1 126 #define A2 src2[ itr ].c1.r1 127 #define B1 src1[ itr ].c1.r2 128 #define B2 src2[ itr ].c1.r2 129 #define C1 src1[ itr ].c1.r3 130 #define C2 src2[ itr ].c1.r3 131 #define D1 src1[ itr ].c1.r4 132 #define D2 src2[ itr ].c1.r4 134 #define E1 src1[ itr ].c2.r1 135 #define E2 src2[ itr ].c2.r1 136 #define F1 src1[ itr ].c2.r2 137 #define F2 src2[ itr ].c2.r2 138 #define G1 src1[ itr ].c2.r3 139 #define G2 src2[ itr ].c2.r3 140 #define H1 src1[ itr ].c2.r4 141 #define H2 src2[ itr ].c2.r4 143 #define I1 src1[ itr ].c3.r1 144 #define I2 src2[ itr ].c3.r1 145 #define J1 src1[ itr ].c3.r2 146 #define J2 src2[ itr ].c3.r2 147 #define K1 src1[ itr ].c3.r3 148 #define K2 src2[ itr ].c3.r3 149 #define L1 src1[ itr ].c3.r4 150 #define L2 src2[ itr ].c3.r4 152 #define M1 src1[ itr ].c4.r1 153 #define M2 src2[ itr ].c4.r1 154 #define N1 src1[ itr ].c4.r2 155 #define N2 src2[ itr ].c4.r2 156 #define O1 src1[ itr ].c4.r3 157 #define O2 src2[ itr ].c4.r3 158 #define P1 src1[ itr ].c4.r4 159 #define P2 src2[ itr ].c4.r4 161 NE10_X_OPERATION_FLOAT_C
163 dst[ itr ].c1.r1 = (A1 * A2) + (E1 * B2) + (I1 * C2) + (M1 * D2);
164 dst[ itr ].c1.r2 = (B1 * A2) + (F1 * B2) + (J1 * C2) + (N1 * D2);
165 dst[ itr ].c1.r3 = (C1 * A2) + (G1 * B2) + (K1 * C2) + (O1 * D2);
166 dst[ itr ].c1.r4 = (D1 * A2) + (H1 * B2) + (L1 * C2) + (P1 * D2);
168 dst[ itr ].c2.r1 = (A1 * E2) + (E1 * F2) + (I1 * G2) + (M1 * H2);
169 dst[ itr ].c2.r2 = (B1 * E2) + (F1 * F2) + (J1 * G2) + (N1 * H2);
170 dst[ itr ].c2.r3 = (C1 * E2) + (G1 * F2) + (K1 * G2) + (O1 * H2);
171 dst[ itr ].c2.r4 = (D1 * E2) + (H1 * F2) + (L1 * G2) + (P1 * H2);
173 dst[ itr ].c3.r1 = (A1 * I2) + (E1 * J2) + (I1 * K2) + (M1 * L2);
174 dst[ itr ].c3.r2 = (B1 * I2) + (F1 * J2) + (J1 * K2) + (N1 * L2);
175 dst[ itr ].c3.r3 = (C1 * I2) + (G1 * J2) + (K1 * K2) + (O1 * L2);
176 dst[ itr ].c3.r4 = (D1 * I2) + (H1 * J2) + (L1 * K2) + (P1 * L2);
178 dst[ itr ].c4.r1 = (A1 * M2) + (E1 * N2) + (I1 * O2) + (M1 * P2);
179 dst[ itr ].c4.r2 = (B1 * M2) + (F1 * N2) + (J1 * O2) + (N1 * P2);
180 dst[ itr ].c4.r3 = (C1 * M2) + (G1 * N2) + (K1 * O2) + (O1 * P2);
181 dst[ itr ].c4.r4 = (D1 * M2) + (H1 * N2) + (L1 * O2) + (P1 * P2);