~ubuntu-branches/ubuntu/wily/libzn-poly/wily

« back to all changes in this revision

Viewing changes to midmul.c

Committer: Bazaar Package Importer
Author(s): Tim Abbott
Date: 2008-05-27 20:23:43 UTC
Revision ID: james.westby@ubuntu.com-20080527202343-ufcb3fwj2as0edoz

Tags: upstream-0.8

Import upstream version 0.8

files added:

CHANGES

COPYING

README

REFERENCES

array-profile-main.c

array-profile.c

array.c

bernoulli.c

configure

gpl-2.0.txt

gpl-3.0.txt

invert-profile-main.c

invert-profile.c

invert-test.c

invert.c

makemakefile.py

midmul-profile-main.c

midmul-profile.c

midmul-tune.c

midmul.c

midmul_fft-test.c

midmul_fft.c

misc.c

mul-profile-main.c

mul-profile.c

mul-tune.c

mul.c

mul_fft-profile.c

mul_fft-test.c

mul_fft.c

mul_fft_dft.c

mul_ks-profile.c

mul_ks-test.c

mul_ks-tune.c

mul_ks.c

negamul-profile-main.c

negamul-profile.c

ntl-profile-dummy.c

ntl-profile.c

nussbaumer-test.c

nussbaumer-tune.c

nussbaumer.c

pack-test.c

pack.c

pmf.c

prof_main.c

profiler.c

profiler.h

ref_mul.c

support.c

support.h

test.c

tune.c

tuning.c

wide_arith.h

zn_mod.c

zn_poly.h

zn_poly_internal.h

Show diffs side-by-side

added added

removed removed

midmul.c

/*
   midmul.c:  middle products

   This file is part of the zn_poly library (version 0.8).

   This program is free software: you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation, either version 2 of the License, or
   (at your option) version 3 of the License.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>.
*/

#include "zn_poly_internal.h"

/*
   Fudge factor for the fallback middle product.

   The fallback routine is built on _zn_array_mul(), so the value returned
   here is exactly _zn_array_mul_get_fudge(len1, len2, 0, mod).
   zn_array_midmul_precomp1_init() uses it to pre-scale op1 when the modulus
   is odd.
*/
ulong zn_array_midmul_fallback_get_fudge(size_t len1, size_t len2,
                                         const zn_mod_t mod)
{
   ulong fudge = _zn_array_mul_get_fudge(len1, len2, 0, mod);
   return fudge;
}

/*
   Middle product computed by way of a full multiplication.

   Multiplies op1[0, len1) by op2[0, len2) with _zn_array_mul() into a
   temporary buffer of length len1 + len2 - 1, then copies the
   len1 - len2 + 1 entries starting at index len2 - 1 of that buffer into res.

   Requires len1 >= len2 >= 1 (asserted). fastred and mod are handed to
   _zn_array_mul() unchanged.
*/
void zn_array_midmul_fallback(ulong* res, const ulong* op1, size_t len1,
                              const ulong* op2, size_t len2, int fastred,
                              const zn_mod_t mod)
{
   ZNP_ASSERT(len2 >= 1);
   ZNP_ASSERT(len1 >= len2);

   size_t full_len = len1 + len2 - 1;   // length of the full product
   size_t mid_len = len1 - len2 + 1;    // length of the extracted segment

   // NOTE(review): 6624 is the "reserve" argument of ZNP_FASTALLOC;
   // presumably the threshold below which the buffer avoids the heap --
   // confirm against the macro definition.
   ZNP_FASTALLOC(product, ulong, 6624, full_len);

   // full product first, then keep only the middle segment
   _zn_array_mul(product, op1, len1, op2, len2, fastred, mod);
   zn_array_copy(res, product + (len2 - 1), mid_len);

   ZNP_FASTFREE(product);
}

/*
   Middle product of op1[0, len1) and op2[0, len2), dispatching between the
   fallback and FFT implementations.

   The fallback is used when len2 is below the tuned midmul_fft_crossover for
   this modulus size (tuning_info[mod->bits]), or when the modulus is even
   (the FFT algorithm cannot be used with an even modulus). Otherwise the FFT
   routine is called with the scale factor reported by
   zn_array_midmul_fft_get_fudge().

   Requires len1 >= len2 >= 1 (asserted).

   Note that fastred is only forwarded on the fallback path; the FFT path
   does not receive it.
*/
void _zn_array_midmul(ulong* res, const ulong* op1, size_t len1,
                      const ulong* op2, size_t len2, int fastred,
                      const zn_mod_t mod)
{
   ZNP_ASSERT(len2 >= 1);
   ZNP_ASSERT(len1 >= len2);

   tuning_info_t* tuning = &tuning_info[mod->bits];

   if (len2 < tuning->midmul_fft_crossover || !(mod->n & 1))
   {
      // (can't use FFT algorithm if the modulus is even)
      zn_array_midmul_fallback(res, op1, len1, op2, len2, fastred, mod);
   }
   else
   {
      ulong scale = zn_array_midmul_fft_get_fudge(len1, len2, mod);
      zn_array_midmul_fft(res, op1, len1, op2, len2, scale, mod);
   }
}

/*
   Public middle product entry point.

   Equivalent to calling _zn_array_midmul() with fastred = 0; all other
   arguments are forwarded unchanged.
*/
void zn_array_midmul(ulong* res, const ulong* op1, size_t len1,
                     const ulong* op2, size_t len2, const zn_mod_t mod)
{
   const int fastred = 0;

   _zn_array_midmul(res, op1, len1, op2, len2, fastred, mod);
}

/*
   Initialises res for repeated middle products against a fixed first operand
   op1[0, len1), with second operands of length len2, modulo mod.

   Records len1, len2 and mod in res, selects an algorithm, and performs the
   algorithm-specific setup:

   - ZNP_MIDMUL_ALGO_FALLBACK (even modulus, or len2 below the tuned
     midmul_fft_crossover): res->op1 receives a malloc'd copy of op1, which is
     pre-multiplied by zn_array_midmul_fallback_get_fudge() when the modulus
     is odd.

   - ZNP_MIDMUL_ALGO_FFT: res->precomp_fft is malloc'd and initialised via
     zn_array_midmul_fft_precomp1_init(), with the scale factor from
     zn_array_midmul_fft_precomp1_get_fudge().

   The memory allocated here is released by zn_array_midmul_precomp1_clear().

   NOTE(review): neither malloc() result is checked before use.
*/
void zn_array_midmul_precomp1_init(zn_array_midmul_precomp1_t res,
                                   const ulong* op1, size_t len1,
                                   size_t len2, const zn_mod_t mod)
{
   res->len1 = len1;
   res->len2 = len2;
   res->mod = mod;

   int odd = (mod->n & 1);

   // figure out which algorithm to use
   if (!odd)
   {
      // can't use FFT algorithm when modulus is even
      res->algo = ZNP_MIDMUL_ALGO_FALLBACK;
   }
   else
   {
      tuning_info_t* i = &tuning_info[mod->bits];

      if (len2 < i->midmul_fft_crossover)
         res->algo = ZNP_MIDMUL_ALGO_FALLBACK;
      else
         res->algo = ZNP_MIDMUL_ALGO_FFT;
   }

   // now perform initialisation for chosen algorithm
   switch (res->algo)
   {
      case ZNP_MIDMUL_ALGO_FALLBACK:
      {
         // Make a copy of op1[0, len1).
         // If modulus is odd, multiply it by the appropriate fudge factor
         // so that we can use faster REDC reduction in the execute() routine.
         res->op1 = (ulong*) malloc(len1 * sizeof(ulong));

         if (odd)
         {
            ulong scale = zn_array_midmul_fallback_get_fudge(len1, len2, mod);
            zn_array_scalar_mul(res->op1, op1, len1, scale, mod);
         }
         else
            zn_array_copy(res->op1, op1, len1);
      }
      break;

      case ZNP_MIDMUL_ALGO_FFT:
      {
         res->precomp_fft = (struct zn_array_midmul_fft_precomp1_struct*)
                        malloc(sizeof(zn_array_midmul_fft_precomp1_t));

         // we do scaling in this init() routine, to avoid doing it during
         // each call to execute()
         ulong scale = zn_array_midmul_fft_precomp1_get_fudge(len1, len2, mod);
         zn_array_midmul_fft_precomp1_init(res->precomp_fft,
                                           op1, len1, len2, scale, mod);
      }
      break;

      default: ZNP_ASSERT(0);
   }
}

/*
   Releases the resources held by op, which must have been set up by
   zn_array_midmul_precomp1_init().

   - ZNP_MIDMUL_ALGO_FALLBACK: frees the stored copy of the first operand
     (op->op1).
   - ZNP_MIDMUL_ALGO_FFT: clears the FFT precomputation with
     zn_array_midmul_fft_precomp1_clear() and then frees the structure itself.

   Any other value of op->algo trips ZNP_ASSERT(0).
*/
void zn_array_midmul_precomp1_clear(zn_array_midmul_precomp1_t op)
{
   // dispatch to appropriate cleanup code
   switch (op->algo)
   {
      case ZNP_MIDMUL_ALGO_FALLBACK:
         free(op->op1);
         break;

      case ZNP_MIDMUL_ALGO_FFT:
         zn_array_midmul_fft_precomp1_clear(op->precomp_fft);
         free(op->precomp_fft);
         break;

      default: ZNP_ASSERT(0);
   }
}

void zn_array_midmul_precomp1_execute(

163

ulong* res, const ulong* op2,

164

const zn_array_midmul_precomp1_t precomp)

165

{

166

// dispatch to appropriate middle product code

167

switch (precomp->algo)

168

{

169

case ZNP_MIDMUL_ALGO_FALLBACK:

170

zn_array_midmul_fallback(res, precomp->op1, precomp->len1,

171

op2, precomp->len2, precomp->mod->n & 1,

172

precomp->mod);

173

break;

174

175

case ZNP_MIDMUL_ALGO_FFT:

176

zn_array_midmul_fft_precomp1_execute(res, op2, 1,

177

precomp->precomp_fft);

178

break;

179

180

default: ZNP_ASSERT(0);

181

}

182

}

183

184

185

// end of file ****************************************************************

Older »