/*
Copyright (C) 2010 Fredrik Johansson
Copyright (C) 2021 William Hart
This file is part of FLINT.
FLINT is free software: you can redistribute it and/or modify it under
the terms of the GNU Lesser General Public License (LGPL) as published
by the Free Software Foundation; either version 2.1 of the License, or
(at your option) any later version. See <https://www.gnu.org/licenses/>.
*/
#include
#include
#include
#include
#include "flint.h"
#include "nmod_mat.h"
#include "ulong_extras.h"
/*
    Reference product used to cross-check nmod_mat_mul.

    Writes A * B into C with a plain triple loop. Each dot product is
    accumulated as a three-limb integer (no reduction inside the inner loop)
    and reduced with C->mod only once per output entry.

    The loop bounds are taken from A->r, B->c and A->c; C is only written to,
    at positions [0, A->r) x [0, B->c), and no dimension checks are made here.
*/
void
nmod_mat_mul_check(nmod_mat_t C, const nmod_mat_t A, const nmod_mat_t B)
{
    const slong out_rows = A->r;
    const slong out_cols = B->c;
    const slong inner = A->c;
    slong row, col, idx;

    for (row = 0; row < out_rows; row++)
    {
        const mp_limb_t * a_row = A->rows[row];

        for (col = 0; col < out_cols; col++)
        {
            /* three-limb accumulator, least significant limb first */
            mp_limb_t acc_lo = UWORD(0);
            mp_limb_t acc_mid = UWORD(0);
            mp_limb_t acc_hi = UWORD(0);

            for (idx = 0; idx < inner; idx++)
            {
                mp_limb_t prod_hi, prod_lo;

                /* full two-limb product, added into the accumulator */
                umul_ppmm(prod_hi, prod_lo, a_row[idx], B->rows[idx][col]);
                add_sssaaaaaa(acc_hi, acc_mid, acc_lo,
                              acc_hi, acc_mid, acc_lo, 0, prod_hi, prod_lo);
            }

            /* Reduce the top limb first, then the whole three-limb value
               (presumably NMOD_RED3 wants its high limb already reduced;
               confirm against nmod.h). */
            NMOD_RED(acc_hi, acc_hi, C->mod);
            NMOD_RED3(acc_lo, acc_hi, acc_mid, acc_lo, C->mod);

            C->rows[row][col] = acc_lo;
        }
    }
}
/*
    Test driver for nmod_mat_mul.

    1. Randomised test: multiplies random matrices with nmod_mat_mul and
       compares against nmod_mat_mul_check; when shapes allow, also checks
       that writing the product over the first operand gives the same result.
    2. Fixed 2x2 test: checks multiplication where the output and one operand
       are the same window into a matrix.

    Every failure path prints a message and calls flint_abort().
*/
int
main(void)
{
    slong i;

    FLINT_TEST_INIT(state);

    flint_printf("mul....");
    fflush(stdout);

    for (i = 0; i < 1000 * flint_test_multiplier(); i++)
    {
        nmod_mat_t A, B, C, D;
        mp_limb_t mod;
        slong m, k, n;

        /* Shapes: A is m x n, B is n x k, so n is the inner dimension and
           the products C and D are m x k. Any of them may be 0. */
        m = n_randint(state, 75);
        k = n_randint(state, 75);
        n = n_randint(state, 75);

        /* We want to generate matrices with many entries close to half
           or full limbs with high probability, to stress overflow handling */
        switch (n_randint(state, 3))
        {
            case 0:
                mod = n_randtest_not_zero(state);
                break;
            case 1:
                /* modulus just below or at half the limb range */
                mod = UWORD_MAX/2 + 1 - n_randbits(state, 4);
                break;
            case 2:
            default:
                /* modulus just below or at the full limb range */
                mod = UWORD_MAX - n_randbits(state, 4);
                break;
        }

        nmod_mat_init(A, m, n, mod);
        nmod_mat_init(B, n, k, mod);
        nmod_mat_init(C, m, k, mod);
        nmod_mat_init(D, m, k, mod);

        if (n_randint(state, 2))
            nmod_mat_randtest(A, state);
        else
            nmod_mat_randfull(A, state);

        if (n_randint(state, 2))
            nmod_mat_randtest(B, state);
        else
            nmod_mat_randfull(B, state);

        nmod_mat_randtest(C, state);  /* make sure noise in the output is ok */

        nmod_mat_mul(C, A, B);
        nmod_mat_mul_check(D, A, B);

        if (!nmod_mat_equal(C, D))
        {
            flint_printf("FAIL: results not equal\n");
            nmod_mat_print_pretty(A);
            nmod_mat_print_pretty(B);
            nmod_mat_print_pretty(C);
            nmod_mat_print_pretty(D);
            /* same abort routine as the other failure paths in this file */
            flint_abort();
        }

        /* Aliasing: the m x k product can only be stored back into the
           m x n matrix A when n == k. */
        if (n == k)
        {
            nmod_mat_mul(A, A, B);

            if (!nmod_mat_equal(A, C))
            {
                flint_printf("FAIL: aliasing failed\n");
                flint_abort();
            }
        }

        nmod_mat_clear(A);
        nmod_mat_clear(B);
        nmod_mat_clear(C);
        nmod_mat_clear(D);
    }

    /* Test aliasing with windows */
    {
        nmod_mat_t A, B, A_window;

        nmod_mat_init(A, 2, 2, 3);
        nmod_mat_init(B, 2, 2, 3);

        /* window covering all of A (rows 0..2, columns 0..2) */
        nmod_mat_window_init(A_window, A, 0, 0, 2, 2);

        nmod_mat_one(A);
        nmod_mat_one(B);
        nmod_mat_entry(B, 0, 1) = 1;
        nmod_mat_entry(B, 1, 0) = 1;

        /* output and right operand are the same window; the test expects
           the result, seen through A, to equal B */
        nmod_mat_mul(A_window, B, A_window);

        if (!nmod_mat_equal(A, B))
        {
            flint_printf("FAIL: window aliasing failed\n");
            nmod_mat_print_pretty(A); flint_printf("\n\n");
            nmod_mat_print_pretty(B); flint_printf("\n\n");
            flint_abort();
        }

        nmod_mat_window_clear(A_window);
        nmod_mat_clear(A);
        nmod_mat_clear(B);
    }

    FLINT_TEST_CLEANUP(state);

    flint_printf("PASS\n");
    return 0;
}