ALL: Add flint
This commit is contained in:
258
external/flint-2.4.3/nmod_poly/compose_divconquer.c
vendored
Normal file
258
external/flint-2.4.3/nmod_poly/compose_divconquer.c
vendored
Normal file
@@ -0,0 +1,258 @@
|
||||
/*=============================================================================
|
||||
|
||||
This file is part of FLINT.
|
||||
|
||||
FLINT is free software; you can redistribute it and/or modify
|
||||
it under the terms of the GNU General Public License as published by
|
||||
the Free Software Foundation; either version 2 of the License, or
|
||||
(at your option) any later version.
|
||||
|
||||
FLINT is distributed in the hope that it will be useful,
|
||||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||
GNU General Public License for more details.
|
||||
|
||||
You should have received a copy of the GNU General Public License
|
||||
along with FLINT; if not, write to the Free Software
|
||||
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
||||
|
||||
=============================================================================*/
|
||||
/******************************************************************************
|
||||
|
||||
Copyright (C) 2010 Sebastian Pancratz
|
||||
Copyright (C) 2010 William Hart
|
||||
|
||||
******************************************************************************/
|
||||
|
||||
#include <stdlib.h>
|
||||
#include <gmp.h>
|
||||
#include "flint.h"
|
||||
#include "nmod_vec.h"
|
||||
#include "nmod_poly.h"
|
||||
|
||||
/*
|
||||
Assumptions.
|
||||
|
||||
Suppose that $len1 \geq 3$ and $len2 \geq 2$.
|
||||
|
||||
|
||||
Definitions.
|
||||
|
||||
Define a sequence $(n_i)$ by $n_1 = \ceil{len1 / 2}$,
|
||||
$n_2 = \ceil{n_1 / 2}$, etc. all the way to
|
||||
$n_K = \ceil{n_{K-1} / 2} = 2$. Thus, $K = \ceil{\log_2 len1} - 1$.
|
||||
Note that we can write $n_i = \ceil{len1 / 2^i}$.
|
||||
|
||||
|
||||
Rough description (of the allocation process, or the algorithm).
|
||||
|
||||
Step 1.
|
||||
For $0 \leq i < n_1$, set h[i] to something of length at most len2.
|
||||
Set pow to $poly2^2$.
|
||||
|
||||
Step n.
|
||||
For $0 \leq i < n_n$, set h[i] to something of length at most the length
|
||||
of $poly2^{2^n - 1}$.
|
||||
Set pow to $poly^{2^n}$.
|
||||
|
||||
Step K.
|
||||
For $0 \leq i < n_K$, set h[i] to something of length at most the length
|
||||
of $poly2^{2^K - 1}$.
|
||||
Set pow to $poly^{2^K}$.
|
||||
|
||||
|
||||
Analysis of the space requirements.
|
||||
|
||||
Let $S$ be the over all space we need, measured in number of coefficients.
|
||||
Then
|
||||
\begin{align*}
|
||||
S & = 2 \times \bigl[ (2^K - 1) (len2 - 1) + 1 \bigr]
|
||||
+ \sum_{i=1}^{K-1} (n_i - n_{i+1}) \bigl[(2^i - 1) (len2 - 1) + 1\bigr] \\
|
||||
& = 2 \times \bigl[ (2^K - 1) (len2 - 1) + 1 \bigr]
|
||||
+ (len2 - 1) \sum_{i=1}^{K-1} (n_i - n_{i+1}) (2^i - 1) + n_1 - n_K.
|
||||
\end{align*}
|
||||
|
||||
If $K = 1$, or equivalently $len1$ is 3 or 4, then $S = 2 \times len2$.
|
||||
Otherwise, we can bound $n_i - n_{i+1}$ from above as follows. For any
|
||||
non-negative integer $x$,
|
||||
\begin{equation*}
|
||||
\ceil{x / 2^i} - \ceil{x / 2^{i+1}} \leq x/2^i - x/2^{i+1} = x / 2^{i+1}.
|
||||
\end{equation*}
|
||||
|
||||
Thus,
|
||||
\begin{align*}
|
||||
S & \leq 2 \times \bigl[ (2^K - 1) (len2 - 1) + 1 \bigr]
|
||||
+ (len2 - 1) \times len1 \times \sum_{i=1}^{K-1} (1/2 - 1/2^{i+1}) \\
|
||||
& \leq 2 \times \bigl[ (2^K - 1) (len2 - 1) + 1 \bigr]
|
||||
+ (len2 - 1) \times len1 \times (K/2 + 1).
|
||||
\end{align*}
|
||||
*/
|
||||
|
||||
void
|
||||
_nmod_poly_compose_divconquer(mp_ptr res, mp_srcptr poly1, slong len1,
|
||||
mp_srcptr poly2, slong len2, nmod_t mod)
|
||||
{
|
||||
slong i, j, k, n;
|
||||
slong * hlen, alloc, powlen;
|
||||
mp_ptr v, * h, pow, temp;
|
||||
|
||||
if (len1 == 1)
|
||||
{
|
||||
res[0] = poly1[0];
|
||||
return;
|
||||
}
|
||||
if (len2 == 1)
|
||||
{
|
||||
res[0] = _nmod_poly_evaluate_nmod(poly1, len1, poly2[0], mod);
|
||||
return;
|
||||
}
|
||||
if (len1 == 2)
|
||||
{
|
||||
_nmod_poly_compose_horner(res, poly1, len1, poly2, len2, mod);
|
||||
return;
|
||||
}
|
||||
|
||||
/* Initialisation */
|
||||
|
||||
hlen = (slong *) flint_malloc(((len1 + 1) / 2) * sizeof(slong));
|
||||
|
||||
for (k = 1; (2 << k) < len1; k++) ;
|
||||
|
||||
hlen[0] = hlen[1] = ((1 << k) - 1) * (len2 - 1) + 1;
|
||||
for (i = k - 1; i > 0; i--)
|
||||
{
|
||||
slong hi = (len1 + (1 << i) - 1) / (1 << i);
|
||||
for (n = (hi + 1) / 2; n < hi; n++)
|
||||
hlen[n] = ((1 << i) - 1) * (len2 - 1) + 1;
|
||||
}
|
||||
powlen = (1 << k) * (len2 - 1) + 1;
|
||||
|
||||
alloc = 0;
|
||||
for (i = 0; i < (len1 + 1) / 2; i++)
|
||||
alloc += hlen[i];
|
||||
|
||||
v = _nmod_vec_init(alloc + 2 * powlen);
|
||||
h = (mp_ptr *) flint_malloc(((len1 + 1) / 2) * sizeof(mp_ptr));
|
||||
h[0] = v;
|
||||
for (i = 0; i < (len1 - 1) / 2; i++)
|
||||
{
|
||||
h[i + 1] = h[i] + hlen[i];
|
||||
hlen[i] = 0;
|
||||
}
|
||||
hlen[(len1 - 1) / 2] = 0;
|
||||
pow = v + alloc;
|
||||
temp = pow + powlen;
|
||||
|
||||
/* Let's start the actual work */
|
||||
|
||||
for (i = 0, j = 0; i < len1 / 2; i++, j += 2)
|
||||
{
|
||||
if (poly1[j + 1] != WORD(0))
|
||||
{
|
||||
_nmod_vec_scalar_mul_nmod(h[i], poly2, len2, poly1[j + 1], mod);
|
||||
h[i][0] = n_addmod(h[i][0], poly1[j], mod.n);
|
||||
hlen[i] = len2;
|
||||
}
|
||||
else if (poly1[j] != WORD(0))
|
||||
{
|
||||
h[i][0] = poly1[j];
|
||||
hlen[i] = 1;
|
||||
}
|
||||
}
|
||||
if ((len1 & WORD(1)))
|
||||
{
|
||||
if (poly1[j] != WORD(0))
|
||||
{
|
||||
h[i][0] = poly1[j];
|
||||
hlen[i] = 1;
|
||||
}
|
||||
}
|
||||
|
||||
_nmod_poly_mul(pow, poly2, len2, poly2, len2, mod);
|
||||
powlen = 2 * len2 - 1;
|
||||
|
||||
for (n = (len1 + 1) / 2; n > 2; n = (n + 1) / 2)
|
||||
{
|
||||
if (hlen[1] > 0)
|
||||
{
|
||||
slong templen = powlen + hlen[1] - 1;
|
||||
_nmod_poly_mul(temp, pow, powlen, h[1], hlen[1], mod);
|
||||
_nmod_poly_add(h[0], temp, templen, h[0], hlen[0], mod);
|
||||
hlen[0] = FLINT_MAX(hlen[0], templen);
|
||||
}
|
||||
|
||||
for (i = 1; i < n / 2; i++)
|
||||
{
|
||||
if (hlen[2*i + 1] > 0)
|
||||
{
|
||||
_nmod_poly_mul(h[i], pow, powlen, h[2*i + 1], hlen[2*i + 1], mod);
|
||||
hlen[i] = hlen[2*i + 1] + powlen - 1;
|
||||
} else
|
||||
hlen[i] = 0;
|
||||
_nmod_poly_add(h[i], h[i], hlen[i], h[2*i], hlen[2*i], mod);
|
||||
hlen[i] = FLINT_MAX(hlen[i], hlen[2*i]);
|
||||
}
|
||||
if ((n & WORD(1)))
|
||||
{
|
||||
flint_mpn_copyi(h[i], h[2*i], hlen[2*i]);
|
||||
hlen[i] = hlen[2*i];
|
||||
}
|
||||
|
||||
_nmod_poly_mul(temp, pow, powlen, pow, powlen, mod);
|
||||
powlen += powlen - 1;
|
||||
{
|
||||
mp_ptr t = pow;
|
||||
pow = temp;
|
||||
temp = t;
|
||||
}
|
||||
}
|
||||
|
||||
_nmod_poly_mul(res, pow, powlen, h[1], hlen[1], mod);
|
||||
_nmod_vec_add(res, res, h[0], hlen[0], mod);
|
||||
|
||||
_nmod_vec_clear(v);
|
||||
flint_free(h);
|
||||
flint_free(hlen);
|
||||
}
|
||||
|
||||
void
|
||||
nmod_poly_compose_divconquer(nmod_poly_t res,
|
||||
const nmod_poly_t poly1, const nmod_poly_t poly2)
|
||||
{
|
||||
const slong len1 = poly1->length;
|
||||
const slong len2 = poly2->length;
|
||||
|
||||
if (len1 == 0)
|
||||
{
|
||||
nmod_poly_zero(res);
|
||||
}
|
||||
else if (len1 == 1 || len2 == 0)
|
||||
{
|
||||
nmod_poly_fit_length(res, 1);
|
||||
res->coeffs[0] = poly1->coeffs[0];
|
||||
res->length = (res->coeffs[0] != 0);
|
||||
}
|
||||
else
|
||||
{
|
||||
const slong lenr = (len1 - 1) * (len2 - 1) + 1;
|
||||
|
||||
if (res != poly1 && res != poly2)
|
||||
{
|
||||
nmod_poly_fit_length(res, lenr);
|
||||
_nmod_poly_compose_horner(res->coeffs, poly1->coeffs, len1,
|
||||
poly2->coeffs, len2, poly1->mod);
|
||||
}
|
||||
else
|
||||
{
|
||||
nmod_poly_t t;
|
||||
nmod_poly_init2(t, poly1->mod.n, lenr);
|
||||
_nmod_poly_compose_horner(t->coeffs, poly1->coeffs, len1,
|
||||
poly2->coeffs, len2, poly1->mod);
|
||||
nmod_poly_swap(res, t);
|
||||
nmod_poly_clear(t);
|
||||
}
|
||||
|
||||
res->length = lenr;
|
||||
_nmod_poly_normalise(res);
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user