aboutsummaryrefslogtreecommitdiffstats
path: root/test/monniaux/float_mat/float_mat_run.c
diff options
context:
space:
mode:
Diffstat (limited to 'test/monniaux/float_mat/float_mat_run.c')
-rw-r--r--test/monniaux/float_mat/float_mat_run.c133
1 files changed, 133 insertions, 0 deletions
diff --git a/test/monniaux/float_mat/float_mat_run.c b/test/monniaux/float_mat/float_mat_run.c
new file mode 100644
index 00000000..2f590f98
--- /dev/null
+++ b/test/monniaux/float_mat/float_mat_run.c
@@ -0,0 +1,133 @@
+#include <stdbool.h>
+#include <stdlib.h>
+#include <stdio.h>
+#include <inttypes.h>
+#include "float_mat.h"
+#include "../cycles.h"
+
+/* FIXME DMonniaux should be in the other but branches and float_of_int not implemented */
+/* Compare two m-by-n matrices with !=, where element (i,j) of a is
+   a[i*stride_a + j] and likewise for b with stride_b. On the first difference,
+   print its position and both values and return false; otherwise return true. */
+bool REAL_mat_equal(unsigned m, unsigned n, const REAL *a, unsigned stride_a,
+                    const REAL *b, unsigned stride_b) {
+  for(unsigned row=0; row<m; row++) {
+    for(unsigned col=0; col<n; col++) {
+      const REAL lhs = a[row*stride_a + col], rhs = b[row*stride_b + col];
+      if (lhs == rhs) continue;
+      printf("at %u,%u: %g vs %g\n", row, col, lhs, rhs);
+      return false;
+    }
+  }
+  return true;
+}
+
+REAL REAL_random(void) { /* next pseudo-random value, an integer in 0..999 */
+  static uint64_t lcg_state = 1325997111; /* generator state, kept across calls */
+  lcg_state = 1103515249 * lcg_state + 12345; /* uint64_t arithmetic, wraps mod 2^64 */
+  return lcg_state % 1000; /* converted to REAL by the return */
+}
+
+/* Fill the m-by-n matrix a, whose element (i,j) is a[i*stride_a + j], with
+   successive REAL_random() values, going through the rows in order and
+   through each row from column 0 upward. */
+void REAL_mat_random(unsigned m, unsigned n, REAL *a, unsigned stride_a) {
+  for(unsigned row=0; row<m; row++) {
+    const unsigned base = row*stride_a;
+    for(unsigned col=0; col<n; col++) { a[base + col] = REAL_random(); }
+  }
+}
+
+/* Allocate an uninitialized rows-by-cols matrix of REAL; on malloc failure,
+   report it on stderr and exit with EXIT_FAILURE instead of returning NULL. */
+static REAL *alloc_mat_or_exit(unsigned rows, unsigned cols) {
+  REAL *mat = malloc(sizeof(REAL) * rows * cols);
+  if (mat == NULL) {
+    fputs("float_mat_run: out of memory\n", stderr);
+    exit(EXIT_FAILURE);
+  }
+  return mat;
+}
+
+/* Multiply a random m-by-n matrix by a random n-by-p one with each of
+   REAL_mat_mul1..8, timing every call with get_cycle(); then print whether
+   results 2..8 equal result 1, followed by the eight cycle counts. */
+int main(void) {
+  const unsigned m = 60, n = 31, p = 50;
+  cycle_count_config();
+  REAL *a = alloc_mat_or_exit(m, n);
+  REAL_mat_random(m, n, a, n);
+  REAL *b = alloc_mat_or_exit(n, p);
+  REAL_mat_random(n, p, b, p);
+
+  REAL *c1 = alloc_mat_or_exit(m, p);
+  cycle_t c1_time = get_cycle();
+  REAL_mat_mul1(m, n, p, c1, p, a, n, b, p);
+  c1_time = get_cycle()-c1_time;
+
+  REAL *c2 = alloc_mat_or_exit(m, p);
+  cycle_t c2_time = get_cycle();
+  REAL_mat_mul2(m, n, p, c2, p, a, n, b, p);
+  c2_time = get_cycle()-c2_time;
+
+  REAL *c3 = alloc_mat_or_exit(m, p);
+  cycle_t c3_time = get_cycle();
+  REAL_mat_mul3(m, n, p, c3, p, a, n, b, p);
+  c3_time = get_cycle()-c3_time;
+
+  REAL *c4 = alloc_mat_or_exit(m, p);
+  cycle_t c4_time = get_cycle();
+  REAL_mat_mul4(m, n, p, c4, p, a, n, b, p);
+  c4_time = get_cycle()-c4_time;
+
+  REAL *c5 = alloc_mat_or_exit(m, p);
+  cycle_t c5_time = get_cycle();
+  REAL_mat_mul5(m, n, p, c5, p, a, n, b, p);
+  c5_time = get_cycle()-c5_time;
+
+  REAL *c6 = alloc_mat_or_exit(m, p);
+  cycle_t c6_time = get_cycle();
+  REAL_mat_mul6(m, n, p, c6, p, a, n, b, p);
+  c6_time = get_cycle()-c6_time;
+
+  REAL *c7 = alloc_mat_or_exit(m, p);
+  cycle_t c7_time = get_cycle();
+  REAL_mat_mul7(m, n, p, c7, p, a, n, b, p);
+  c7_time = get_cycle()-c7_time;
+
+  REAL *c8 = alloc_mat_or_exit(m, p);
+  cycle_t c8_time = get_cycle();
+  REAL_mat_mul8(m, n, p, c8, p, a, n, b, p);
+  c8_time = get_cycle()-c8_time;
+
+  /* The products are m-by-p, so all p columns are compared. Separate statements
+     give mismatch diagnostics a fixed order; printf arguments would not. */
+  const bool eq2 = REAL_mat_equal(m, p, c1, p, c2, p);
+  const bool eq3 = REAL_mat_equal(m, p, c1, p, c3, p);
+  const bool eq4 = REAL_mat_equal(m, p, c1, p, c4, p);
+  const bool eq5 = REAL_mat_equal(m, p, c1, p, c5, p);
+  const bool eq6 = REAL_mat_equal(m, p, c1, p, c6, p);
+  const bool eq7 = REAL_mat_equal(m, p, c1, p, c7, p);
+  const bool eq8 = REAL_mat_equal(m, p, c1, p, c8, p);
+
+  printf("c1==c2: %s\n", eq2?"true":"false");
+  printf("c1==c3: %s\n", eq3?"true":"false");
+  printf("c1==c4: %s\n", eq4?"true":"false");
+  printf("c1==c5: %s\n", eq5?"true":"false");
+  printf("c1==c6: %s\n", eq6?"true":"false");
+  printf("c1==c7: %s\n", eq7?"true":"false");
+  printf("c1==c8: %s\n", eq8?"true":"false");
+  printf("c1 cycles: %" PRIu64 "\n", c1_time);
+  printf("c2 cycles: %" PRIu64 "\n", c2_time);
+  printf("c3 cycles: %" PRIu64 "\n", c3_time);
+  printf("c4 cycles: %" PRIu64 "\n", c4_time);
+  printf("c5 cycles: %" PRIu64 "\n", c5_time);
+  printf("c6 cycles: %" PRIu64 "\n", c6_time);
+  printf("c7 cycles: %" PRIu64 "\n", c7_time);
+  printf("c8 cycles: %" PRIu64 "\n", c8_time);
+
+  free(a); free(b);
+  free(c1); free(c2); free(c3); free(c4);
+  free(c5); free(c6); free(c7); free(c8);
+  return 0;
+}