[math] Generic dense matrix implementation using BLAS calls for matrix-matrix multiplication if available

2016-08-06 00:40:01 -04:00
parent d4a792f33c
commit 46cd725c13
19 changed files with 469 additions and 425 deletions
--- a/src/matrix.h
+++ b/src/matrix.h
@@ -6,60 +6,374 @@
 #include <stdint.h>
 #include <stdbool.h>

+#include <config.h>
+
 #include "collections.h"
+#include "file_utils.h"
+#include "vector.h"
+#include "vector_math.h"

-typedef struct matrix {
-    size_t m;
-    size_t n;
-    double *values;
-} matrix_t;
+#ifdef HAVE_BLAS
+#include <cblas.h>
+#else
+#warning "No CLBAS"
+#endif

-matrix_t *matrix_new(size_t m, size_t n);
-matrix_t *matrix_new_value(size_t m, size_t n, double value);
-matrix_t *matrix_new_values(size_t m, size_t n, double *values);
-matrix_t *matrix_new_zeros(size_t m, size_t n);
-matrix_t *matrix_new_ones(size_t m, size_t n);
+#define MATRIX_INIT(name, type, type_name, array_type)                                                      \
+    typedef struct {                                                                                        \
+        size_t m, n;                                                                                        \
+        type *values;                                                                                       \
+    } name##_t;                                                                                             \
+                                                                                                            \
+    static name##_t *name##_new(size_t m, size_t n) {                                                       \
+        name##_t *matrix = malloc(sizeof(name##_t));                                                        \
+                                                                                                            \
+        if (matrix == NULL) {                                                                               \
+            return NULL;                                                                                    \
+        }                                                                                                   \
+                                                                                                            \
+        matrix->m = m;                                                                                      \
+        matrix->n = n;                                                                                      \
+                                                                                                            \
+        matrix->values = malloc(sizeof(type) * m * n);                                                      \
+        if (matrix->values == NULL) {                                                                       \
+            free(matrix);                                                                                   \
+            return NULL;                                                                                    \
+        }                                                                                                   \
+                                                                                                            \
+        return matrix;                                                                                      \
+                                                                                                            \
+    }                                                                                                       \
+                                                                                                            \
+    static void name##_destroy(name##_t *self) {                                                            \
+        if (self == NULL) return;                                                                           \
+                                                                                                            \
+        if (self->values != NULL) {                                                                         \
+            free(self->values);                                                                             \
+        }                                                                                                   \
+                                                                                                            \
+        free(self);                                                                                         \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_zero(name##_t *self) {                                                        \
+        memset(self->values, 0, self->m * self->n * sizeof(type));                                          \
+    }                                                                                                       \
+                                                                                                            \
+                                                                                                            \
+    static inline bool name##_resize(name##_t *self, size_t m, size_t n) {                                  \
+        if (self == NULL) return false;                                                                     \
+                                                                                                            \
+        if (m * n > (self->m * self->n)) {                                                                  \
+            self->values = realloc(self->values, sizeof(type) * m * n);                                     \
+            if (self->values == NULL) {                                                                     \
+                return false;                                                                               \
+            }                                                                                               \
+        }                                                                                                   \
+                                                                                                            \
+        self->m = m;                                                                                        \
+        self->n = n;                                                                                        \
+                                                                                                            \
+        name##_zero(self);                                                                                  \
+                                                                                                            \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline name##_t *name##_new_copy(name##_t *self) {                                               \
+        name##_t *cpy = name##_new(self->m, self->n);                                                       \
+        size_t num_values = self->m * self->n;                                                              \
+        memcpy(cpy->values, self->values, num_values);                                                      \
+                                                                                                            \
+        return cpy;                                                                                         \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_copy(name##_t *self, name##_t *other) {                                       \
+        if (self->m != other->m || self->n != other->n) {                                                   \
+            return false;                                                                                   \
+        }                                                                                                   \
+        size_t num_values = self->n * self->n;                                                              \
+                                                                                                            \
+        memcpy(other->values, self->values, num_values * sizeof(type));                                     \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_init_values(name##_t *self, type *values) {                                   \
+        size_t num_values = self->m * self->n;                                                              \
+        memcpy(self->values, values, num_values * sizeof(type));                                            \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_set(name##_t *self, type value) {                                             \
+        array_type##_set(self->values, value, self->m * self->n);                                           \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_set_row(name##_t *self, size_t index, type *row) {                            \
+        size_t offset = index * self->n;                                                                    \
+        type *values = self->values;                                                                        \
+        size_t n = self->n;                                                                                 \
+        memcpy(values + offset, row, n * sizeof(type));                                                     \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_set_scalar(name##_t *self, size_t row_index, size_t col_index, type value) {  \
+        size_t offset = row_index * self->n + col_index;                                                    \
+        self->values[offset] = value;                                                                       \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_add_scalar(name##_t *self, size_t row_index, size_t col_index, type value) {  \
+        size_t offset = row_index * self->n + col_index;                                                    \
+        self->values[offset] += value;                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_sub_scalar(name##_t *self, size_t row_index, size_t col_index, type value) {  \
+        size_t offset = row_index * self->n + col_index;                                                    \
+        self->values[offset] -= value;                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_mul_scalar(name##_t *self, size_t row_index, size_t col_index, type value) {  \
+        size_t offset = row_index * self->n + col_index;                                                    \
+        self->values[offset] *= value;                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_div_scalar(name##_t *self, size_t row_index, size_t col_index, type value) {  \
+        size_t offset = row_index * self->n + col_index;                                                    \
+        self->values[offset] /= value;                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline type name##_get(name##_t *self, size_t row_index, size_t col_index) {                     \
+        size_t index = row_index * self->n + col_index;                                                     \
+        return self->values[index];                                                                         \
+    }                                                                                                       \
+                                                                                                            \
+    static inline type *name##_get_row(name##_t *self, size_t row_index) {                                  \
+        size_t index = row_index * self->n;                                                                 \
+        return self->values + index;                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline name##_t *name##_new_value(size_t m, size_t n, type value) {                              \
+        name##_t *matrix = name##_new(m, n);                                                                \
+        name##_set(matrix, value);                                                                          \
+        return matrix;                                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline name##_t *name##_new_zeros(size_t m, size_t n) {                                          \
+        name##_t *matrix = name##_new(m, n);                                                                \
+        name##_zero(matrix);                                                                                \
+        return matrix;                                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline name##_t *name##_new_ones(size_t m, size_t n) {                                           \
+        return name##_new_value(m, n, (type)1);                                                             \
+    }                                                                                                       \
+                                                                                                            \
+    static inline name##_t *name##_new_values(size_t m, size_t n, type *values) {                           \
+        name##_t *matrix = name##_new(m, n);                                                                \
+        memcpy(matrix->values, values, m * n * sizeof(type));                                               \
+        return matrix;                                                                                      \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_div(name##_t *self, type value) {                                             \
+        array_type##_div(self->values, value, self->m * self->n);                                           \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_div_matrix(name##_t *self, name##_t *other) {                                 \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_div_array(self->values, other->values, self->m * self->n);                             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_div_matrix_times_scalar(name##_t *self, name##_t *other, type v) {            \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_div_array_times_scalar(self->values, other->values, v, self->m * self->n);             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_mul(name##_t *self, type value) {                                             \
+        array_type##_mul(self->values, value, self->m * self->n);                                           \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_mul_matrix(name##_t *self, name##_t *other) {                                 \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_mul_array(self->values, other->values, self->m * self->n);                             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_mul_matrix_times_scalar(name##_t *self, name##_t *other, type v) {            \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_mul_array_times_scalar(self->values, other->values, v, self->m * self->n);             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_add(name##_t *self, type value) {                                             \
+        array_type##_add(self->values, self->m * self->n, value);                                           \
+    }                                                                                                       \
+                                                                                                            \
+                                                                                                            \
+    static inline bool name##_add_matrix(name##_t *self, name##_t *other) {                                 \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_add_array(self->values, other->values, self->m * self->n);                             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_add_matrix_times_scalar(name##_t *self, name##_t *other, type v) {            \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_add_array_times_scalar(self->values, other->values, v, self->m * self->n);             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline void name##_sub(name##_t *self, type value) {                                             \
+        array_type##_sub(self->values, value, self->m * self->n);                                           \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_sub_matrix(name##_t *self, name##_t *other) {                                 \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_sub_array(self->values, other->values, self->m * self->n);                             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static inline bool name##_sub_matrix_times_scalar(name##_t *self, name##_t *other, type v) {            \
+        if (self->m != other->m || self->n != other->n) return false;                                       \
+        array_type##_sub_array_times_scalar(self->values, other->values, v, self->m * self->n);             \
+        return true;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static name##_t *name##_read(FILE *f) {                                                                 \
+        name##_t *mat = malloc(sizeof(name##_t));                                                           \
+        if (mat == NULL) return NULL;                                                                       \
+                                                                                                            \
+        mat->values = NULL;                                                                                 \
+                                                                                                            \
+        uint64_t m = 0;                                                                                     \
+        uint64_t n = 0;                                                                                     \
+                                                                                                            \
+        if (!file_read_uint64(f, &m) ||                                                                     \
+            !file_read_uint64(f, &n)) {                                                                     \
+            goto exit_##name##_allocated;                                                                   \
+        }                                                                                                   \
+                                                                                                            \
+        mat->m = (size_t)m;                                                                                 \
+        mat->n = (size_t)n;                                                                                 \
+                                                                                                            \
+        size_t len_data = mat->m * mat->n;                                                                  \
+                                                                                                            \
+        type *data = malloc(len_data * sizeof(type));                                                       \
+        if (data == NULL) {                                                                                 \
+            log_error("error in data malloc\n");                                                            \
+            goto exit_##name##_allocated;                                                                   \
+        }                                                                                                   \
+                                                                                                            \
+        if (!file_read_##array_type(f, data, len_data)) {                                                   \
+            free(data);                                                                                     \
+            goto exit_##name##_allocated;                                                                   \
+        }                                                                                                   \
+                                                                                                            \
+        mat->values = data;                                                                                 \
+                                                                                                            \
+        return mat;                                                                                         \
+                                                                                                            \
+    exit_##name##_allocated:                                                                                \
+        name##_destroy(mat);                                                                                \
+        return NULL;                                                                                        \
+    }                                                                                                       \
+                                                                                                            \
+    static bool name##_write(name##_t *self, FILE *f) {                                                     \
+        if (self == NULL || self->values == NULL) {                                                         \
+            return false;                                                                                   \
+        }                                                                                                   \
+                                                                                                            \
+        if (!file_write_uint64(f, (uint64_t)self->m) ||                                                     \
+            !file_write_uint64(f, (uint64_t)self->n)) {                                                     \
+            return false;                                                                                   \
+        }                                                                                                   \
+                                                                                                            \
+        uint64_t len_data = (uint64_t)self->m * (uint64_t)self->n;                                          \
+                                                                                                            \
+        for (uint64_t i = 0; i < len_data; i++) {                                                           \
+            if (!file_write_##type_name(f, self->values[i])) {                                              \
+                return false;                                                                               \
+            }                                                                                               \
+        }                                                                                                   \
+                                                                                                            \
+        return true;                                                                                        \
+    }

-bool matrix_resize(matrix_t *self, size_t m, size_t n);

-matrix_t *matrix_new_copy(matrix_t *self);
-bool matrix_copy(matrix_t *self, matrix_t *other);
+#define MATRIX_INIT_FLOAT_BASE(name, type, type_name, array_type)                       \
+    MATRIX_INIT(name, type, type_name, array_type)                                      \
+                                                                                        \
+    static inline void name##_log(name##_t *self) {                                     \
+        array_type##_log(self->values, self->m * self->n);                              \
+    }                                                                                   \
+                                                                                        \
+    static inline void name##_exp(name##_t *self) {                                     \
+        array_type##_exp(self->values, self->m * self->n);                              \
+    }                                                                                   \
+                                                                                        \
+    static inline void name##_dot_vector(name##_t *self, type *vec, type *result) {     \
+        type *values = self->values;                                                    \
+        size_t m = self->m;                                                             \
+        size_t n = self->n;                                                             \
+        for (size_t i = 0; i < m; i++) {                                                \
+            for (size_t j = 0; j < n; j++) {                                            \
+                result[i] += values[n * i + j] * vec[j];                                \
+            }                                                                           \
+        }                                                                               \
+    }

-void matrix_init_values(matrix_t *self, double *values);
-void matrix_set(matrix_t *self, double value);
-void matrix_zero(matrix_t *self);
-void matrix_set_row(matrix_t *self, size_t index, double *row);
-void matrix_set_scalar(matrix_t *self, size_t row_index, size_t col_index, double value);
-void matrix_add_scalar(matrix_t *self, size_t row_index, size_t col_index, double value);
-void matrix_sub_scalar(matrix_t *self, size_t row_index, size_t col_index, double value);
-void matrix_mul_scalar(matrix_t *self, size_t row_index, size_t col_index, double value);
-void matrix_div_scalar(matrix_t *self, size_t row_index, size_t col_index, double value);

-double matrix_get(matrix_t *self, size_t row_index, size_t col_index);
-double *matrix_get_row(matrix_t *self, size_t row_index);
+#ifdef HAVE_BLAS
+#define MATRIX_INIT_FLOAT(name, type, type_name, array_type, blas_prefix)                                   \
+    MATRIX_INIT_FLOAT_BASE(name, type, type_name, array_type)                                               \
+                                                                                                            \
+    static inline bool name##_dot_matrix(name##_t *m1, name##_t *m2, name##_t *result) {                    \
+        if (m1->n != m2->m || m1->m != result->m || m2->n != result->n) {                                   \
+            return false;                                                                                   \
+        }                                                                                                   \
+                                                                                                            \
+        log_debug("doing CBLAS\n");                                                                         \
+        cblas_##blas_prefix##gemm(CblasRowMajor, CblasNoTrans, CblasNoTrans,                                \
+                    m1->m, m2->n, m1->n, 1.0,                                                               \
+                    m1->values, m1->n,                                                                      \
+                    m2->values, m2->n, 0.0,                                                                 \
+                    result->values, result->n                                                               \
+                    );                                                                                      \
+                                                                                                            \
+        return true;                                                                                        \
+    }

-void matrix_add(matrix_t *self, double value);
-bool matrix_add_matrix(matrix_t *self, matrix_t *other);
-bool matrix_add_matrix_times_scalar(matrix_t *self, matrix_t *other, double v);
-void matrix_sub(matrix_t *self, double value);
-bool matrix_sub_matrix(matrix_t *self, matrix_t *other);
-bool matrix_sub_matrix_times_scalar(matrix_t *self, matrix_t *other, double v);
-void matrix_mul(matrix_t *self, double value);
-bool matrix_mul_matrix(matrix_t *self, matrix_t *other);
-bool matrix_mul_matrix_times_scalar(matrix_t *self, matrix_t *other, double v);
-void matrix_div(matrix_t *self, double value);
-bool matrix_div_matrix(matrix_t *self, matrix_t *other);
-bool matrix_div_matrix_times_scalar(matrix_t *self, matrix_t *other, double v);
+#else
+#define MATRIX_INIT_FLOAT(name, type, type_name, array_type, blas_prefix)                                       \
+    MATRIX_INIT_FLOAT_BASE(name, type, type_name, array_type)                                                   \
+                                                                                                                \
+    static inline bool name##_dot_matrix(name##_t *m1, name##_t *m2, name##_t *result) {                        \
+        if (m1->n != m2->m || m1->m != result->m || m2->n != result->n) {                                       \
+            return false;                                                                                       \
+        }                                                                                                       \
+                                                                                                                \
+        size_t m1_rows = m1->m;                                                                                 \
+        size_t m1_cols = m1->n;                                                                                 \
+        size_t m2_rows = m2->m;                                                                                 \
+        size_t m2_cols = m2->n;                                                                                 \
+                                                                                                                \
+        type *m1_values = m1->values;                                                                           \
+        type *m2_values = m2->values;                                                                           \
+        type *result_values = result->values;                                                                   \
+                                                                                                                \
+        for (size_t i = 0; i < m1_rows; i++) {                                                                  \
+            for (size_t j = 0; j < m2_cols; j++) {                                                              \
+                size_t result_index = m2_cols * i + j;                                                          \
+                result_values[result_index] = 0.0;                                                              \
+                for (size_t k = 0; k < m2_rows; k++) {                                                          \
+                    result_values[result_index] += m1_values[m1_cols * i + k] * m2_values[m2_cols * k + j];     \
+                }                                                                                               \
+            }                                                                                                   \
+        }                                                                                                       \
+                                                                                                                \
+        return true;                                                                                            \
+    }
+#endif

-void matrix_log(matrix_t *self);
-void matrix_exp(matrix_t *self);
+MATRIX_INIT(uint32_matrix, uint32_t, uint32, uint32_array)

-void matrix_dot_vector(matrix_t *self, double *vec, double *result);
-bool matrix_dot_matrix(matrix_t *m1, matrix_t *m2, matrix_t *result);
+MATRIX_INIT_FLOAT(float_matrix, float, float, float_array,s)
+MATRIX_INIT_FLOAT(double_matrix, double, double, double_array,d)

-matrix_t *matrix_read(FILE *f);
-bool matrix_write(matrix_t *self, FILE *f);
-
-void matrix_destroy(matrix_t *self);

 #endif