diff options
Diffstat (limited to 'test/monniaux/float_mat/float_mat_run.c')
-rw-r--r-- | test/monniaux/float_mat/float_mat_run.c | 133 |
1 files changed, 133 insertions, 0 deletions
diff --git a/test/monniaux/float_mat/float_mat_run.c b/test/monniaux/float_mat/float_mat_run.c new file mode 100644 index 00000000..2f590f98 --- /dev/null +++ b/test/monniaux/float_mat/float_mat_run.c @@ -0,0 +1,133 @@ +#include <stdbool.h> +#include <stdlib.h> +#include <stdio.h> +#include <inttypes.h> +#include "float_mat.h" +#include "../cycles.h" + +/* FIXME DMonniaux should be in the other but branches and float_of_int not implemented */ +bool REAL_mat_equal(unsigned m, + unsigned n, + const REAL *a, unsigned stride_a, + const REAL *b, unsigned stride_b) { + for(unsigned i=0; i<m; i++) { + for(unsigned j=0; j<n; j++) { + if (a[i*stride_a + j] != b[i*stride_b + j]) { + printf("at %u,%u: %g vs %g\n", i, j, + a[i*stride_a + j], b[i*stride_b + j]); + return false; + } + } + } + return true; +} + +REAL REAL_random(void) { + static uint64_t next = 1325997111; + next = next * 1103515249 + 12345; + return next % 1000; +} + +void REAL_mat_random(unsigned m, + unsigned n, + REAL *a, unsigned stride_a) { + for(unsigned i=0; i<m; i++) { + for(unsigned j=0; j<n; j++) { + a[i*stride_a + j] = REAL_random(); + } + } +} + +int main() { + const unsigned m = 60, n = 31, p = 50; + cycle_count_config(); + REAL *a = malloc(sizeof(REAL) * m * n); + REAL_mat_random(m, n, a, n); + REAL *b = malloc(sizeof(REAL) * n * p); + REAL_mat_random(n, p, b, p); + + REAL *c1 = malloc(sizeof(REAL) * m * p); + cycle_t c1_time = get_cycle(); + REAL_mat_mul1(m, n, p, c1, p, a, n, b, p); + c1_time = get_cycle()-c1_time; + + REAL *c2 = malloc(sizeof(REAL) * m * p); + cycle_t c2_time = get_cycle(); + REAL_mat_mul2(m, n, p, c2, p, a, n, b, p); + c2_time = get_cycle()-c2_time; + + REAL *c3 = malloc(sizeof(REAL) * m * p); + cycle_t c3_time = get_cycle(); + REAL_mat_mul3(m, n, p, c3, p, a, n, b, p); + c3_time = get_cycle()-c3_time; + + REAL *c4 = malloc(sizeof(REAL) * m * p); + cycle_t c4_time = get_cycle(); + REAL_mat_mul4(m, n, p, c4, p, a, n, b, p); + c4_time = get_cycle()-c4_time; + + REAL *c5 = malloc(sizeof(REAL) * m * p); + cycle_t c5_time = get_cycle(); + REAL_mat_mul5(m, n, p, c5, p, a, n, b, p); + c5_time = get_cycle()-c5_time; + + REAL *c6 = malloc(sizeof(REAL) * m * p); + cycle_t c6_time = get_cycle(); + REAL_mat_mul6(m, n, p, c6, p, a, n, b, p); + c6_time = get_cycle()-c6_time; + + REAL *c7 = malloc(sizeof(REAL) * m * p); + cycle_t c7_time = get_cycle(); + REAL_mat_mul7(m, n, p, c7, p, a, n, b, p); + c7_time = get_cycle()-c7_time; + + REAL *c8 = malloc(sizeof(REAL) * m * p); + cycle_t c8_time = get_cycle(); + REAL_mat_mul8(m, n, p, c8, p, a, n, b, p); + c8_time = get_cycle()-c8_time; + + printf("c1==c2: %s\n" + "c1==c3: %s\n" + "c1==c4: %s\n" + "c1==c5: %s\n" + "c1==c6: %s\n" + "c1==c7: %s\n" + "c1==c8: %s\n" + "c1 cycles: %" PRIu64 "\n" + "c2 cycles: %" PRIu64 "\n" + "c3 cycles: %" PRIu64 "\n" + "c4 cycles: %" PRIu64 "\n" + "c5 cycles: %" PRIu64 "\n" + "c6 cycles: %" PRIu64 "\n" + "c7 cycles: %" PRIu64 "\n" + "c8 cycles: %" PRIu64 "\n", + + REAL_mat_equal(m, n, c1, p, c2, p)?"true":"false", + REAL_mat_equal(m, n, c1, p, c3, p)?"true":"false", + REAL_mat_equal(m, n, c1, p, c4, p)?"true":"false", + REAL_mat_equal(m, n, c1, p, c5, p)?"true":"false", + REAL_mat_equal(m, n, c1, p, c6, p)?"true":"false", + REAL_mat_equal(m, n, c1, p, c7, p)?"true":"false", + REAL_mat_equal(m, n, c1, p, c8, p)?"true":"false", + + c1_time, + c2_time, + c3_time, + c4_time, + c5_time, + c6_time, + c7_time, + c8_time); + + free(a); + free(b); + free(c1); + free(c2); + free(c3); + free(c4); + free(c5); + free(c6); + free(c7); + free(c8); + return 0; +} |