[igt-dev] [PATCH i-g-t 1/4] lib/igt_matrix: Unroll and inline igt_matrix_transform()
Ville Syrjala
ville.syrjala at linux.intel.com
Wed Jun 6 20:16:39 UTC 2018
From: Ville Syrjälä <ville.syrjala at linux.intel.com>
Using igt_matrix for the NV12 conversion is currently about 4x slower
than the existing non-igt_matrix based code. Unrolling and inlining
igt_matrix_transform() reduces that slowdown to ~1.5x.
Cc: Maarten Lankhorst <maarten.lankhorst at linux.intel.com>
Signed-off-by: Ville Syrjälä <ville.syrjala at linux.intel.com>
---
lib/igt_matrix.c | 25 -------------------------
lib/igt_matrix.h | 43 +++++++++++++++++++++++++++++++++++++++++--
2 files changed, 41 insertions(+), 27 deletions(-)
diff --git a/lib/igt_matrix.c b/lib/igt_matrix.c
index 3fa6c96cae8a..35a9c321defd 100644
--- a/lib/igt_matrix.c
+++ b/lib/igt_matrix.c
@@ -24,8 +24,6 @@
#include "igt_core.h"
#include "igt_matrix.h"
-#define m(row, col) ((col) * 4 + (row))
-
/**
* SECTION:igt_matrix
* @short_description: Matrix math library
@@ -110,29 +108,6 @@ struct igt_mat4 igt_matrix_translate(float x, float y, float z)
return ret;
}
-/**
- * igt_matrix_transform:
- *
- * Transform the vector @v by the matrix @m. @m is on the left,
- * @v on the right.
- *
- * Returns:
- * The transformed vector.
- */
-struct igt_vec4 igt_matrix_transform(const struct igt_mat4 *m,
- const struct igt_vec4 *v)
-{
- struct igt_vec4 ret = {};
-
- for (int row = 0; row < 4; row++) {
- for (int i = 0; i < 4; i++) {
- ret.d[row] += m->d[m(row, i)] * v->d[i];
- }
- }
-
- return ret;
-}
-
/**
* igt_matrix_multiply:
*
diff --git a/lib/igt_matrix.h b/lib/igt_matrix.h
index 33acb815197b..7a2b9ad8b573 100644
--- a/lib/igt_matrix.h
+++ b/lib/igt_matrix.h
@@ -44,13 +44,52 @@ struct igt_mat4 {
float d[16];
};
+#define m(row, col) ((col) * 4 + (row))
+
void igt_matrix_print(const struct igt_mat4 *m);
struct igt_mat4 igt_matrix_identity(void);
struct igt_mat4 igt_matrix_scale(float x, float y, float z);
struct igt_mat4 igt_matrix_translate(float x, float y, float z);
-struct igt_vec4 igt_matrix_transform(const struct igt_mat4 *m,
- const struct igt_vec4 *v);
struct igt_mat4 igt_matrix_multiply(const struct igt_mat4 *a,
const struct igt_mat4 *b);
+/**
+ * igt_matrix_transform:
+ *
+ * Transform the vector @v by the matrix @m. @m is on the left,
+ * @v on the right.
+ *
+ * Returns:
+ * The transformed vector.
+ */
+static inline struct igt_vec4
+igt_matrix_transform(const struct igt_mat4 *m,
+ const struct igt_vec4 *v)
+{
+ struct igt_vec4 ret = {
+ .d = { m->d[m(0, 0)] * v->d[0] +
+ m->d[m(0, 1)] * v->d[1] +
+ m->d[m(0, 2)] * v->d[2] +
+ m->d[m(0, 3)] * v->d[3],
+
+ m->d[m(1, 0)] * v->d[0] +
+ m->d[m(1, 1)] * v->d[1] +
+ m->d[m(1, 2)] * v->d[2] +
+ m->d[m(1, 3)] * v->d[3],
+
+ m->d[m(2, 0)] * v->d[0] +
+ m->d[m(2, 1)] * v->d[1] +
+ m->d[m(2, 2)] * v->d[2] +
+ m->d[m(2, 3)] * v->d[3],
+
+ m->d[m(3, 0)] * v->d[0] +
+ m->d[m(3, 1)] * v->d[1] +
+ m->d[m(3, 2)] * v->d[2] +
+ m->d[m(3, 3)] * v->d[3],
+ },
+ };
+
+ return ret;
+}
+
#endif /* __IGT_MATRIX_H__ */
--
2.16.4
More information about the igt-dev mailing list