~ubuntu-branches/ubuntu/lucid/openssl/lucid-proposed

« back to all changes in this revision

Viewing changes to crypto/bn/asm/x86-mont.pl

Committer: Bazaar Package Importer
Author(s): Kurt Roeckx
Date: 2009-06-13 18:15:46 UTC
mto: (11.1.5 squeeze)
mto: This revision was merged to the branch mainline in revision 34.
Revision ID: james.westby@ubuntu.com-20090613181546-vbfntai3b009dl1u

Tags: upstream-0.9.8k

Import upstream version 0.9.8k

files added:
apps/cms.c

apps/genpkey.c

apps/pkey.c

apps/pkeyparam.c

apps/pkeyutl.c

apps/ts.c

apps/tsget

certs/README.RootCerts

crypto/aes/aes_wrap.c

crypto/aes/aes_x86core.c

crypto/aes/asm/aes-armv4.pl

crypto/aes/asm/aes-ppc.pl

crypto/aes/asm/aes-s390x.pl

crypto/aes/asm/aes-sparcv9.pl

crypto/aes/asm/aes-x86_64.pl

crypto/asn1/ameth_lib.c

crypto/asn1/asn1_locl.h

crypto/asn1/asn_mime.c

crypto/asn1/bio_asn1.c

crypto/asn1/bio_ndef.c

crypto/asn1/x_nx509.c

crypto/bn/asm/alpha-mont.pl

crypto/bn/asm/armv4-mont.pl

crypto/bn/asm/mips3-mont.pl

crypto/bn/asm/mo-586.pl

crypto/bn/asm/ppc-mont.pl

crypto/bn/asm/ppc64-mont.pl

crypto/bn/asm/s390x-mont.pl

crypto/bn/asm/s390x.S

crypto/bn/asm/sparcv9-mont.pl

crypto/bn/asm/sparcv9a-mont.pl

crypto/bn/asm/via-mont.pl

crypto/bn/asm/x86-mont.pl

crypto/bn/asm/x86_64-mont.pl

crypto/bn/bn_opt.c

crypto/bn/bn_x931p.c

crypto/buffer/buf_str.c

crypto/camellia/asm

crypto/camellia/asm/cmll-x86.pl

crypto/camellia/asm/cmll-x86_64.pl

crypto/cms

crypto/cms/Makefile

crypto/cms/cms.h

crypto/cms/cms_asn1.c

crypto/cms/cms_att.c

crypto/cms/cms_cd.c

crypto/cms/cms_dd.c

crypto/cms/cms_enc.c

crypto/cms/cms_env.c

crypto/cms/cms_err.c

crypto/cms/cms_ess.c

crypto/cms/cms_io.c

crypto/cms/cms_lcl.h

crypto/cms/cms_lib.c

crypto/cms/cms_sd.c

crypto/cms/cms_smime.c

crypto/des/des_lib.c

crypto/dsa/dsa_utl.c

crypto/dyn_lck.c

crypto/err/err_bio.c

crypto/err/err_def.c

crypto/err/err_str.c

crypto/evp/dig_eng.c

crypto/evp/enc_min.c

crypto/evp/evp_cnf.c

crypto/fips_err.c

crypto/fips_err.h

crypto/jpake

crypto/jpake/Makefile

crypto/jpake/jpake.c

crypto/jpake/jpake.h

crypto/jpake/jpake_err.c

crypto/jpake/jpaketest.c

crypto/o_init.c

crypto/ppccpuid.pl

crypto/rand/rand_eng.c

crypto/rc4/rc4_fblk.c

crypto/rsa/rsa_eng.c

crypto/rsa/rsa_x931g.c

crypto/s390xcpuid.S

crypto/sha/asm/sha1-x86_64.pl

crypto/sha/asm/sha512-x86_64.pl

crypto/sparcv9cap.c

demos/jpake

demos/jpake/Makefile

demos/jpake/jpakedemo.c

engines/e_capi.c

engines/e_capi.ec

engines/e_capi_err.c

engines/e_capi_err.h

fips

fips/Makefile

fips/aes

fips/aes/Makefile

fips/aes/fips_aes_selftest.c

fips/aes/fips_aesavs.c

fips/des

fips/des/Makefile

fips/des/fips_des_selftest.c

fips/des/fips_desmovs.c

fips/dh

fips/dh/Makefile

fips/dh/dh_gen.c

fips/dh/fips_dh_check.c

fips/dh/fips_dh_gen.c

fips/dh/fips_dh_key.c

fips/dh/fips_dh_lib.c

fips/dsa

fips/dsa/Makefile

fips/dsa/fips_dsa_gen.c

fips/dsa/fips_dsa_key.c

fips/dsa/fips_dsa_lib.c

fips/dsa/fips_dsa_ossl.c

fips/dsa/fips_dsa_selftest.c

fips/dsa/fips_dsa_sign.c

fips/dsa/fips_dsatest.c

fips/dsa/fips_dssvs.c

fips/fips-lib.com

fips/fips-nodiff.txt

fips/fips.c

fips/fips.h

fips/fips_canister.c

fips/fips_locl.h

fips/fips_premain.c

fips/fips_premain.c.sha1

fips/fips_test_suite.c

fips/fips_utl.h

fips/fipsalgtest.pl

fips/fipsld

fips/fipstests.bat

fips/fipstests.sh

fips/hmac

fips/hmac/Makefile

fips/hmac/fips_hmac.c

fips/hmac/fips_hmac_selftest.c

fips/hmac/fips_hmactest.c

fips/install.com

fips/mkfipsscr.pl

fips/openssl_fips_fingerprint

fips/rand

fips/rand/Makefile

fips/rand/fips_rand.c

fips/rand/fips_rand.h

fips/rand/fips_rand_selftest.c

fips/rand/fips_randtest.c

fips/rand/fips_rngvs.c

fips/rsa

fips/rsa/Makefile

fips/rsa/fips_rsa_eay.c

fips/rsa/fips_rsa_gen.c

fips/rsa/fips_rsa_lib.c

fips/rsa/fips_rsa_selftest.c

fips/rsa/fips_rsa_sign.c

fips/rsa/fips_rsa_x931g.c

fips/rsa/fips_rsagtest.c

fips/rsa/fips_rsastest.c

fips/rsa/fips_rsavtest.c

fips/sha

fips/sha/Makefile

fips/sha/fips_sha1_selftest.c

fips/sha/fips_shatest.c

fips/sha/fips_standalone_sha1.c

include/openssl/fips.h

include/openssl/fips_rand.h

ms/do_fips.bat

ms/segrenam.pl

test/SHAmix.r

test/SHAmix.x

test/cms-examples.pl

test/cms-test.pl

test/fips_aesavs.c

test/fips_desmovs.c

test/fips_dsatest.c

test/fips_dssvs.c

test/fips_hmactest.c

test/fips_randtest.c

test/fips_rngvs.c

test/fips_rsagtest.c

test/fips_rsastest.c

test/fips_rsavtest.c

test/fips_shatest.c

test/fips_test_suite.c

test/jpaketest.c

test/smcont.txt

test/smime-certs

test/smime-certs/smdsa1.pem

test/smime-certs/smdsa2.pem

test/smime-certs/smdsa3.pem

test/smime-certs/smdsap.pem

test/smime-certs/smroot.pem

test/smime-certs/smrsa1.pem

test/smime-certs/smrsa2.pem

test/smime-certs/smrsa3.pem

test/testfipsssl

util/arx.pl

util/fipslink.pl

util/mksdef.pl

files removed:
ChangeLog.0_9_7-stable_not-in-head

ChangeLog.0_9_7-stable_not-in-head_FIPS

certs/RegTP-5R.pem

certs/RegTP-6R.pem

certs/aol1.pem

certs/aol2.pem

certs/aoltw1.pem

certs/aoltw2.pem

certs/argena.pem

certs/argeng.pem

certs/demo/nortelCA.pem

certs/demo/timCA.pem

certs/demo/tjhCA.pem

certs/demo/vsigntca.pem

certs/eng1.pem

certs/eng2.pem

certs/eng3.pem

certs/eng4.pem

certs/eng5.pem

certs/expired/ICE-CA.pem

certs/expired/ICE-root.pem

certs/expired/ICE-user.pem

certs/expired/RegTP-4R.pem

certs/expired/factory.pem

certs/expired/rsa-cca.pem

certs/expired/rsa-ssca.pem

certs/expired/vsign2.pem

certs/expired/vsign3.pem

certs/thawteCb.pem

certs/thawteCp.pem

certs/vsign1.pem

certs/vsign3.pem

certs/vsignss.pem

certs/wellsfgo.pem

crypto/md5/asm/md5-sparcv9.S

files modified:
CHANGES

Configure

INSTALL

INSTALL.NW

LICENSE

MacOS/GetHTTPS.src/ErrorHandling.hpp

Makefile

Makefile.org

Makefile.shared

NEWS

Netware/build.bat

Netware/cpy_tests.bat

Netware/do_tests.pl

Netware/set_env.bat

README

apps/Makefile

apps/apps.c

apps/apps.h

apps/asn1pars.c

apps/ca.c

apps/crl.c

apps/dgst.c

apps/dsa.c

apps/ec.c

apps/enc.c

apps/engine.c

apps/genrsa.c

apps/nseq.c

apps/ocsp.c

apps/openssl.c

apps/pkcs12.c

apps/pkcs8.c

apps/progs.h

apps/progs.pl

apps/rand.c

apps/req.c

apps/rsautl.c

apps/s_client.c

apps/s_server.c

apps/smime.c

apps/speed.c

apps/spkac.c

apps/verify.c

apps/version.c

apps/x509.c

config

crypto/Makefile

crypto/aes/Makefile

crypto/aes/aes.h

crypto/aes/aes_cbc.c

crypto/aes/aes_core.c

crypto/aes/asm/aes-586.pl

crypto/asn1/Makefile

crypto/asn1/a_bytes.c

crypto/asn1/a_mbstr.c

crypto/asn1/a_object.c

crypto/asn1/a_sign.c

crypto/asn1/a_strex.c

crypto/asn1/a_strnid.c

crypto/asn1/a_type.c

crypto/asn1/a_verify.c

crypto/asn1/asn1.h

crypto/asn1/asn1_err.c

crypto/asn1/asn1_gen.c

crypto/asn1/asn1_lib.c

crypto/asn1/asn1_par.c

crypto/asn1/asn1t.h

crypto/asn1/asn_moid.c

crypto/asn1/asn_pack.c

crypto/asn1/nsseq.c

crypto/asn1/p5_pbe.c

crypto/asn1/p5_pbev2.c

crypto/asn1/p8_pkey.c

crypto/asn1/t_bitst.c

crypto/asn1/t_crl.c

crypto/asn1/t_spki.c

crypto/asn1/t_x509.c

crypto/asn1/t_x509a.c

crypto/asn1/tasn_dec.c

crypto/asn1/tasn_enc.c

crypto/asn1/tasn_fre.c

crypto/asn1/tasn_new.c

crypto/asn1/tasn_prn.c

crypto/asn1/tasn_typ.c

crypto/asn1/tasn_utl.c

crypto/asn1/x_algor.c

crypto/asn1/x_bignum.c

crypto/asn1/x_exten.c

crypto/asn1/x_long.c

crypto/asn1/x_x509a.c

crypto/bf/Makefile

crypto/bf/bf_skey.c

crypto/bf/blowfish.h

crypto/bio/Makefile

crypto/bio/b_sock.c

crypto/bio/bio.h

crypto/bio/bss_bio.c

crypto/bio/bss_dgram.c

crypto/bio/bss_file.c

crypto/bio/bss_mem.c

crypto/bio/bss_sock.c

crypto/bn/Makefile

crypto/bn/bn.h

crypto/bn/bn_div.c

crypto/bn/bn_gf2m.c

crypto/bn/bn_lcl.h

crypto/bn/bn_lib.c

crypto/bn/bn_mont.c

crypto/bn/bn_mul.c

crypto/bn/bn_nist.c

crypto/bn/bn_rand.c

crypto/bn/bn_shift.c

crypto/bn/bntest.c

crypto/buffer/Makefile

crypto/buffer/buffer.c

crypto/camellia/Makefile

crypto/camellia/camellia.h

crypto/camellia/cmll_misc.c

crypto/cast/Makefile

crypto/cast/c_skey.c

crypto/cast/cast.h

crypto/comp/Makefile

crypto/comp/c_zlib.c

crypto/comp/comp.h

crypto/comp/comp_err.c

crypto/conf/Makefile

crypto/conf/conf_mall.c

crypto/conf/conf_mod.c

crypto/conf/conf_sap.c

crypto/cryptlib.c

crypto/cryptlib.h

crypto/crypto-lib.com

crypto/crypto.h

crypto/des/Makefile

crypto/des/asm/des_enc.m4

crypto/des/des.h

crypto/des/des_enc.c

crypto/des/des_old.c

crypto/des/des_old.h

crypto/des/ecb_enc.c

crypto/des/enc_read.c

crypto/des/enc_writ.c

crypto/des/set_key.c

crypto/des/times/usparc.cc

crypto/des/xcbc_enc.c

crypto/dh/Makefile

crypto/dh/dh.h

crypto/dh/dh_asn1.c

crypto/dh/dh_check.c

crypto/dh/dh_err.c

crypto/dh/dh_gen.c

crypto/dh/dh_key.c

crypto/dsa/Makefile

crypto/dsa/dsa.h

crypto/dsa/dsa_asn1.c

crypto/dsa/dsa_err.c

crypto/dsa/dsa_gen.c

crypto/dsa/dsa_key.c

crypto/dsa/dsa_lib.c

crypto/dsa/dsa_ossl.c

crypto/dsa/dsa_sign.c

crypto/dsa/dsa_vrf.c

crypto/dso/Makefile

crypto/ec/Makefile

crypto/ec/ec_key.c

crypto/ecdh/Makefile

crypto/ecdsa/Makefile

crypto/ecdsa/ecs_ossl.c

crypto/engine/Makefile

crypto/engine/eng_all.c

crypto/engine/eng_cnf.c

crypto/engine/eng_err.c

crypto/engine/eng_int.h

crypto/engine/eng_padlock.c

crypto/engine/eng_pkey.c

crypto/engine/eng_table.c

crypto/engine/engine.h

crypto/engine/enginetest.c

crypto/err/Makefile

crypto/err/err.c

crypto/err/err.h

crypto/err/err_all.c

crypto/err/err_prn.c

crypto/err/openssl.ec

crypto/evp/Makefile

crypto/evp/bio_md.c

crypto/evp/digest.c

crypto/evp/e_aes.c

crypto/evp/e_camellia.c

crypto/evp/e_des.c

crypto/evp/e_des3.c

crypto/evp/e_null.c

crypto/evp/e_rc4.c

crypto/evp/evp.h

crypto/evp/evp_acnf.c

crypto/evp/evp_enc.c

crypto/evp/evp_err.c

crypto/evp/evp_lib.c

crypto/evp/evp_locl.h

crypto/evp/evp_pbe.c

crypto/evp/evp_pkey.c

crypto/evp/evp_test.c

crypto/evp/m_dss.c

crypto/evp/m_dss1.c

crypto/evp/m_md2.c

crypto/evp/m_md4.c

crypto/evp/m_md5.c

crypto/evp/m_mdc2.c

crypto/evp/m_sha.c

crypto/evp/m_sha1.c

crypto/evp/names.c

crypto/evp/p5_crpt.c

crypto/evp/p5_crpt2.c

crypto/evp/p_sign.c

crypto/evp/p_verify.c

crypto/hmac/Makefile

crypto/hmac/hmac.c

crypto/hmac/hmac.h

crypto/idea/Makefile

crypto/idea/i_skey.c

crypto/idea/idea.h

crypto/install.com

crypto/krb5/Makefile

crypto/lhash/Makefile

crypto/md2/Makefile

crypto/md2/md2.h

crypto/md2/md2_dgst.c

crypto/md32_common.h

crypto/md4/Makefile

crypto/md4/md4.h

crypto/md4/md4_dgst.c

crypto/md4/md4_locl.h

crypto/md5/Makefile

crypto/md5/asm/md5-586.pl

crypto/md5/asm/md5-x86_64.pl

crypto/md5/md5.h

crypto/md5/md5_dgst.c

crypto/md5/md5_locl.h

crypto/mdc2/Makefile

crypto/mdc2/mdc2.h

crypto/mdc2/mdc2dgst.c

crypto/mem.c

crypto/mem_dbg.c

crypto/o_str.c

crypto/objects/Makefile

crypto/objects/obj_dat.c

crypto/objects/obj_dat.h

crypto/objects/obj_dat.pl

crypto/objects/obj_mac.h

crypto/objects/obj_mac.num

crypto/objects/objects.txt

crypto/ocsp/Makefile

crypto/ocsp/ocsp.h

crypto/ocsp/ocsp_asn.c

crypto/ocsp/ocsp_err.c

crypto/ocsp/ocsp_ht.c

crypto/ocsp/ocsp_srv.c

crypto/ocsp/ocsp_vfy.c

crypto/opensslconf.h

crypto/opensslconf.h.in

crypto/opensslv.h

crypto/ossl_typ.h

crypto/pem/Makefile

crypto/pem/pem.h

crypto/pem/pem_all.c

crypto/pem/pem_info.c

crypto/pem/pem_lib.c

crypto/pem/pem_x509.c

crypto/pem/pem_xaux.c

crypto/perlasm/x86_64-xlate.pl

crypto/perlasm/x86ms.pl

crypto/perlasm/x86nasm.pl

crypto/perlasm/x86unix.pl

crypto/pkcs12/Makefile

crypto/pkcs12/p12_add.c

crypto/pkcs12/p12_asn.c

crypto/pkcs12/p12_attr.c

crypto/pkcs12/p12_crpt.c

crypto/pkcs12/p12_crt.c

crypto/pkcs12/p12_decr.c

crypto/pkcs12/p12_init.c

crypto/pkcs12/p12_key.c

crypto/pkcs12/p12_kiss.c

crypto/pkcs12/p12_mutl.c

crypto/pkcs12/p12_npas.c

crypto/pkcs12/p12_p8d.c

crypto/pkcs12/p12_p8e.c

crypto/pkcs12/p12_utl.c

crypto/pkcs12/pkcs12.h

crypto/pkcs7/Makefile

crypto/pkcs7/pk7_asn1.c

crypto/pkcs7/pk7_attr.c

crypto/pkcs7/pk7_mime.c

crypto/pkcs7/pk7_smime.c

crypto/pqueue/Makefile

crypto/pqueue/pq_compat.h

crypto/rand/Makefile

crypto/rand/md_rand.c

crypto/rand/rand.h

crypto/rand/rand_err.c

crypto/rand/rand_lcl.h

crypto/rand/rand_lib.c

crypto/rand/rand_nw.c

crypto/rand/rand_unix.c

crypto/rand/randfile.c

crypto/rc2/Makefile

crypto/rc2/rc2.h

crypto/rc2/rc2_skey.c

crypto/rc4/Makefile

crypto/rc4/asm/rc4-586.pl

crypto/rc4/asm/rc4-x86_64.pl

crypto/rc4/rc4.h

crypto/rc4/rc4_skey.c

crypto/rc5/Makefile

crypto/rc5/rc5.h

crypto/rc5/rc5_skey.c

crypto/ripemd/Makefile

crypto/ripemd/README

crypto/ripemd/asm/rmd-586.pl

crypto/ripemd/ripemd.h

crypto/ripemd/rmd_dgst.c

crypto/ripemd/rmd_locl.h

crypto/rsa/Makefile

crypto/rsa/rsa.h

crypto/rsa/rsa_asn1.c

crypto/rsa/rsa_eay.c

crypto/rsa/rsa_err.c

crypto/rsa/rsa_gen.c

crypto/rsa/rsa_lib.c

crypto/rsa/rsa_null.c

crypto/rsa/rsa_oaep.c

crypto/rsa/rsa_pss.c

crypto/rsa/rsa_sign.c

crypto/rsa/rsa_ssl.c

crypto/rsa/rsa_x931.c

crypto/seed/Makefile

crypto/sha/Makefile

crypto/sha/asm/sha1-586.pl

crypto/sha/asm/sha1-ia64.pl

crypto/sha/asm/sha512-ia64.pl

crypto/sha/sha.h

crypto/sha/sha1_one.c

crypto/sha/sha1dgst.c

crypto/sha/sha256.c

crypto/sha/sha512.c

crypto/sha/sha_dgst.c

crypto/sha/sha_locl.h

crypto/sha/shatest.c

crypto/stack/Makefile

crypto/stack/safestack.h

crypto/store/Makefile

crypto/symhacks.h

crypto/txt_db/Makefile

crypto/ui/Makefile

crypto/ui/ui_lib.c

crypto/ui/ui_openssl.c

crypto/x509/Makefile

crypto/x509/by_dir.c

crypto/x509/x509.h

crypto/x509/x509_att.c

crypto/x509/x509_cmp.c

crypto/x509/x509_trs.c

crypto/x509/x509_vfy.c

crypto/x509/x509_vpm.c

crypto/x509/x509cset.c

crypto/x509/x509spki.c

crypto/x509v3/Makefile

crypto/x509v3/ext_dat.h

crypto/x509v3/pcy_cache.c

crypto/x509v3/pcy_data.c

crypto/x509v3/pcy_int.h

crypto/x509v3/pcy_lib.c

crypto/x509v3/pcy_map.c

crypto/x509v3/pcy_node.c

crypto/x509v3/pcy_tree.c

crypto/x509v3/tabtest.c

crypto/x509v3/v3_addr.c

crypto/x509v3/v3_akey.c

crypto/x509v3/v3_akeya.c

crypto/x509v3/v3_alt.c

crypto/x509v3/v3_asid.c

crypto/x509v3/v3_bcons.c

crypto/x509v3/v3_bitst.c

crypto/x509v3/v3_conf.c

crypto/x509v3/v3_cpols.c

crypto/x509v3/v3_crld.c

crypto/x509v3/v3_enum.c

crypto/x509v3/v3_extku.c

crypto/x509v3/v3_genn.c

crypto/x509v3/v3_ia5.c

crypto/x509v3/v3_info.c

crypto/x509v3/v3_int.c

crypto/x509v3/v3_lib.c

crypto/x509v3/v3_ncons.c

crypto/x509v3/v3_ocsp.c

crypto/x509v3/v3_pcons.c

crypto/x509v3/v3_pku.c

crypto/x509v3/v3_pmaps.c

crypto/x509v3/v3_prn.c

crypto/x509v3/v3_purp.c

crypto/x509v3/v3_skey.c

crypto/x509v3/v3_sxnet.c

crypto/x509v3/v3_utl.c

crypto/x509v3/v3conf.c

crypto/x509v3/v3prin.c

crypto/x509v3/x509v3.h

crypto/x86_64cpuid.pl

crypto/x86cpuid.pl

demos/asn1/ocsp.c

demos/engines/cluster_labs/hw_cluster_labs_err.h

demos/engines/ibmca/hw_ibmca_err.h

demos/engines/zencod/hw_zencod_err.h

doc/apps/dgst.pod

doc/apps/ocsp.pod

doc/apps/rand.pod

doc/apps/s_server.pod

doc/apps/verify.pod

doc/apps/x509.pod

doc/c-indentation.el

doc/crypto/ASN1_generate_nconf.pod

doc/crypto/DH_set_method.pod

doc/crypto/DSA_set_method.pod

doc/crypto/OPENSSL_ia32cap.pod

doc/crypto/RAND_egd.pod

doc/crypto/RAND_set_rand_method.pod

doc/crypto/RSA_set_method.pod

doc/crypto/engine.pod

doc/ssl/SSL_CIPHER_get_name.pod

doc/ssl/SSL_CTX_set_verify.pod

doc/ssl/SSL_SESSION_free.pod

doc/ssl/SSL_free.pod

doc/ssl/SSL_read.pod

doc/ssleay.txt

e_os.h

engines/Makefile

engines/e_4758cca_err.h

engines/e_aep.c

engines/e_aep_err.h

engines/e_atalla_err.h

engines/e_chil.c

engines/e_chil_err.c

engines/e_chil_err.h

engines/e_cswift_err.h

engines/e_gmp.c

engines/e_gmp_err.h

engines/e_nuron_err.h

engines/e_sureware_err.h

engines/e_ubsec_err.h

engines/makeengines.com

makevms.com

ms/do_masm.bat

ms/do_nasm.bat

ms/test.bat

openssl.spec

ssl/Makefile

ssl/d1_clnt.c

ssl/d1_enc.c

ssl/d1_lib.c

ssl/d1_pkt.c

ssl/d1_srvr.c

ssl/dtls1.h

ssl/kssl.c

ssl/s23_clnt.c

ssl/s23_srvr.c

ssl/s2_clnt.c

ssl/s2_srvr.c

ssl/s3_clnt.c

ssl/s3_enc.c

ssl/s3_lib.c

ssl/s3_pkt.c

ssl/s3_srvr.c

ssl/ssl.h

ssl/ssl3.h

ssl/ssl_asn1.c

ssl/ssl_ciph.c

ssl/ssl_err.c

ssl/ssl_lib.c

ssl/ssl_locl.h

ssl/ssl_rsa.c

ssl/ssl_sess.c

ssl/ssl_stat.c

ssl/ssltest.c

ssl/t1_enc.c

ssl/t1_lib.c

ssl/tls1.h

test/CAss.cnf

test/Makefile

test/Uss.cnf

test/igetest.c

test/tests.com

test/times

util/copy.pl

util/domd

util/libeay.num

util/mk1mf.pl

util/mkdef.pl

util/mkerr.pl

util/mkfiles.pl

util/mklink.pl

util/opensslwrap.sh

util/pl/VC-32.pl

util/pl/netware.pl

util/ssleay.num

Show diffs side-by-side

added added

removed removed

crypto/bn/asm/x86-mont.pl

#!/usr/bin/env perl

# ====================================================================

# Written by Andy Polyakov <appro@fy.chalmers.se> for the OpenSSL

# project. The module is, however, dual licensed under OpenSSL and

# CRYPTOGAMS licenses depending on where you obtain it. For further

# details see http://www.openssl.org/~appro/cryptogams/.

# ====================================================================

# October 2005

# This is a "teaser" code, as it can be improved in several ways...

# First of all non-SSE2 path should be implemented (yes, for now it

# performs Montgomery multiplication/convolution only on SSE2-capable

# CPUs such as P4, others fall down to original code). Then inner loop

# can be unrolled and modulo-scheduled to improve ILP and possibly

# moved to 128-bit XMM register bank (though it would require input

# rearrangement and/or increase bus bandwidth utilization). Dedicated

# squaring procedure should give further performance improvement...

# Yet, for being draft, the code improves rsa512 *sign* benchmark by

# 110%(!), rsa1024 one - by 70% and rsa4096 - by 20%:-)

# December 2006

# Modulo-scheduling SSE2 loops results in further 15-20% improvement.

# Integer-only code [being equipped with dedicated squaring procedure]

# gives ~40% on rsa512 sign benchmark...

# Work out the directory this script was invoked from, so that the
# perlasm helper module can be found either next to the script or in
# ../../perlasm relative to it.
$0 =~ m/(.*[\/\\])[^\/\\]+$/;
$dir=$1;
push(@INC,"${dir}","${dir}../../perlasm");
require "x86asm.pl";

# First command-line argument and the script name go to the perlasm
# initialiser.
&asm_init($ARGV[0],$0);

# The SSE2 code path is generated only if -DOPENSSL_IA32_SSE2 appears
# among the command-line arguments.
$sse2=0;
foreach my $arg (@ARGV) {
    $sse2=1 if ($arg =~ /-DOPENSSL_IA32_SSE2/);
}

# The capability vector is referenced only by the SSE2 path.
&external_label("OPENSSL_ia32cap_P") if ($sse2);

# Open the bn_mul_mont routine and give names to the registers and the
# stack-frame slots that the generated code below refers to.
&function_begin("bn_mul_mont");

# Loop counters (the code below comments them as i and j).
$i="edx";

$j="ecx";

# Pointer registers. $ap/$tp share esi and $rp/$bp share edi, so only one
# of each pair is live at any time.
$ap="esi"; $tp="esi"; # overlapping variables!!!

$rp="edi"; $bp="edi"; # overlapping variables!!!

$np="ebp";

$num="ebx";

# Eight 32-bit slots at the top of the stack frame, addressed off esp.
$_num=&DWP(4*0,"esp"); # stack top layout

$_rp=&DWP(4*1,"esp");

$_ap=&DWP(4*2,"esp");

$_bp=&DWP(4*3,"esp");

$_np=&DWP(4*4,"esp");

# $_n0q addresses the same offset as $_n0, but as a quad word.
$_n0=&DWP(4*5,"esp"); $_n0q=&QWP(4*5,"esp");

$_sp=&DWP(4*6,"esp");

$_bpend=&DWP(4*7,"esp");

# 8 slots * 4 bytes; the temporary vector tp[] starts at $frame(esp).
$frame=32; # size of above frame rounded up to 16n

# ---- bn_mul_mont prologue ---------------------------------------------
# Leaves immediately with eax=0 when num<4. Otherwise allocates
# $frame+4*(num+2) bytes below esp for the frame slots and the temporary
# vector tp[], positions that area relative to the argument address held
# in edx, and copies the argument block into the frame slots.
# (Stray diff-viewer line numbers that had been interleaved with these
# statements were removed; the instruction sequence itself is unchanged.)
    &xor    ("eax","eax");
    &mov    ("edi",&wparam(5));     # int num
    &cmp    ("edi",4);
    &jl     (&label("just_leave"));

    &lea    ("esi",&wparam(0));     # put aside pointer to argument block
    &lea    ("edx",&wparam(1));     # load ap
                                    # NOTE(review): this is an lea of the
                                    # second argument slot, i.e. its address,
                                    # not the ap pointer value - confirm intent
    &mov    ("ebp","esp");          # saved stack pointer!
    &add    ("edi",2);              # extra two words on top of tp
    &neg    ("edi");
    &lea    ("esp",&DWP(-$frame,"esp","edi",4));    # alloca($frame+4*(num+2))
    &neg    ("edi");                # edi is num+2 again

    # minimize cache contention by arranging 2K window between stack
    # pointer and ap argument [np is also position sensitive vector,
    # but it's assumed to be near ap, as it's allocated at ~same
    # time].
    &mov    ("eax","esp");
    &sub    ("eax","edx");
    &and    ("eax",2047);
    &sub    ("esp","eax");          # this aligns sp and ap modulo 2048

    &xor    ("edx","esp");
    &and    ("edx",2048);
    &xor    ("edx",2048);
    &sub    ("esp","edx");          # this splits them apart modulo 4096

    &and    ("esp",-64);            # align to cache line

    ################################# load argument block...
    &mov    ("eax",&DWP(0*4,"esi"));# BN_ULONG *rp
    &mov    ("ebx",&DWP(1*4,"esi"));# const BN_ULONG *ap
    &mov    ("ecx",&DWP(2*4,"esi"));# const BN_ULONG *bp
    &mov    ("edx",&DWP(3*4,"esi"));# const BN_ULONG *np
    &mov    ("esi",&DWP(4*4,"esi"));# const BN_ULONG *n0
    #&mov   ("edi",&DWP(5*4,"esi"));# int num

    &mov    ("esi",&DWP(0,"esi"));  # pull n0[0]
    &mov    ($_rp,"eax");           # ... save a copy of argument block
    &mov    ($_ap,"ebx");
    &mov    ($_bp,"ecx");
    &mov    ($_np,"edx");
    &mov    ($_n0,"esi");
    # edi still holds num+2 here, hence the -3 to obtain num-1.
    &lea    ($num,&DWP(-3,"edi"));  # num=num-1 to assist modulo-scheduling
    #&mov   ($_num,$num);           # redundant as $num is not reused
    &mov    ($_sp,"ebp");           # saved stack pointer!

# ---- SSE2 path ----------------------------------------------------------
# Generated only when $sse2 is set. At run time it tests bit 26 of the
# first word of OPENSSL_ia32cap_P and branches to "non_sse2" when that bit
# is clear. Otherwise it runs the multiplication with pmuludq on the MMX
# register bank: a first pass for bp[0] ("1st"), then one pass per
# remaining word of bp ("outer"/"inner"), and finally jumps to
# "common_tail".
# (Stray diff-viewer line numbers that had been interleaved with these
# statements were removed; the instruction sequence itself is unchanged.)
if($sse2) {
$acc0="mm0";    # mmx register bank layout
$acc1="mm1";
$car0="mm2";
$car1="mm3";
$mul0="mm4";
$mul1="mm5";
$temp="mm6";
$mask="mm7";

    &picmeup("eax","OPENSSL_ia32cap_P");
    &bt     (&DWP(0,"eax"),26);
    &jnc    (&label("non_sse2"));           # bit 26 clear: integer path

    &mov    ("eax",-1);
    &movd   ($mask,"eax");                  # mask 32 lower bits

    &mov    ($ap,$_ap);                     # load input pointers
    &mov    ($bp,$_bp);
    &mov    ($np,$_np);

    &xor    ($i,$i);                        # i=0
    &xor    ($j,$j);                        # j=0

    &movd   ($mul0,&DWP(0,$bp));            # bp[0]
    &movd   ($mul1,&DWP(0,$ap));            # ap[0]
    &movd   ($car1,&DWP(0,$np));            # np[0]

    &pmuludq($mul1,$mul0);                  # ap[0]*bp[0]
    &movq   ($car0,$mul1);
    &movq   ($acc0,$mul1);                  # I wish movd worked for
    &pand   ($acc0,$mask);                  # inter-register transfers

    &pmuludq($mul1,$_n0q);                  # *=n0

    &pmuludq($car1,$mul1);                  # "t[0]"*np[0]*n0
    &paddq  ($car1,$acc0);

    &movd   ($acc1,&DWP(4,$np));            # np[1]
    &movd   ($acc0,&DWP(4,$ap));            # ap[1]

    &psrlq  ($car0,32);
    &psrlq  ($car1,32);

    &inc    ($j);                           # j++
&set_label("1st",16);
    &pmuludq($acc0,$mul0);                  # ap[j]*bp[0]
    &pmuludq($acc1,$mul1);                  # np[j]*m1
    &paddq  ($car0,$acc0);                  # +=c0
    &paddq  ($car1,$acc1);                  # +=c1

    &movq   ($acc0,$car0);
    &pand   ($acc0,$mask);
    &movd   ($acc1,&DWP(4,$np,$j,4));       # np[j+1]
    &paddq  ($car1,$acc0);                  # +=ap[j]*bp[0];
    &movd   ($acc0,&DWP(4,$ap,$j,4));       # ap[j+1]
    &psrlq  ($car0,32);
    &movd   (&DWP($frame-4,"esp",$j,4),$car1);      # tp[j-1]=
    &psrlq  ($car1,32);

    &lea    ($j,&DWP(1,$j));
    &cmp    ($j,$num);
    &jl     (&label("1st"));

    &pmuludq($acc0,$mul0);                  # ap[num-1]*bp[0]
    &pmuludq($acc1,$mul1);                  # np[num-1]*m1
    &paddq  ($car0,$acc0);                  # +=c0
    &paddq  ($car1,$acc1);                  # +=c1

    &movq   ($acc0,$car0);
    &pand   ($acc0,$mask);
    &paddq  ($car1,$acc0);                  # +=ap[num-1]*bp[0];
    &movd   (&DWP($frame-4,"esp",$j,4),$car1);      # tp[num-2]=

    &psrlq  ($car0,32);
    &psrlq  ($car1,32);

    &paddq  ($car1,$car0);
    &movq   (&QWP($frame,"esp",$num,4),$car1);      # tp[num].tp[num-1]

    &inc    ($i);                           # i++
&set_label("outer");
    &xor    ($j,$j);                        # j=0

    &movd   ($mul0,&DWP(0,$bp,$i,4));       # bp[i]
    &movd   ($mul1,&DWP(0,$ap));            # ap[0]
    &movd   ($temp,&DWP($frame,"esp"));     # tp[0]
    &movd   ($car1,&DWP(0,$np));            # np[0]
    &pmuludq($mul1,$mul0);                  # ap[0]*bp[i]

    &paddq  ($mul1,$temp);                  # +=tp[0]
    &movq   ($acc0,$mul1);
    &movq   ($car0,$mul1);
    &pand   ($acc0,$mask);

    &pmuludq($mul1,$_n0q);                  # *=n0

    &pmuludq($car1,$mul1);
    &paddq  ($car1,$acc0);

    &movd   ($temp,&DWP($frame+4,"esp"));   # tp[1]
    &movd   ($acc1,&DWP(4,$np));            # np[1]
    &movd   ($acc0,&DWP(4,$ap));            # ap[1]

    &psrlq  ($car0,32);
    &psrlq  ($car1,32);
    &paddq  ($car0,$temp);                  # +=tp[1]

    &inc    ($j);                           # j++
    # $num doubles as the inner-loop down-counter; it is restored from $j
    # right after the loop.
    &dec    ($num);
&set_label("inner");
    &pmuludq($acc0,$mul0);                  # ap[j]*bp[i]
    &pmuludq($acc1,$mul1);                  # np[j]*m1
    &paddq  ($car0,$acc0);                  # +=c0
    &paddq  ($car1,$acc1);                  # +=c1

    &movq   ($acc0,$car0);
    &movd   ($temp,&DWP($frame+4,"esp",$j,4));# tp[j+1]
    &pand   ($acc0,$mask);
    &movd   ($acc1,&DWP(4,$np,$j,4));       # np[j+1]
    &paddq  ($car1,$acc0);                  # +=ap[j]*bp[i]+tp[j]
    &movd   ($acc0,&DWP(4,$ap,$j,4));       # ap[j+1]
    &psrlq  ($car0,32);
    &movd   (&DWP($frame-4,"esp",$j,4),$car1);# tp[j-1]=
    &psrlq  ($car1,32);
    &paddq  ($car0,$temp);                  # +=tp[j+1]

    &dec    ($num);
    &lea    ($j,&DWP(1,$j));                # j++ (lea keeps the flags set by dec)
    &jnz    (&label("inner"));

    &mov    ($num,$j);
    &pmuludq($acc0,$mul0);                  # ap[num-1]*bp[i]
    &pmuludq($acc1,$mul1);                  # np[num-1]*m1
    &paddq  ($car0,$acc0);                  # +=c0
    &paddq  ($car1,$acc1);                  # +=c1

    &movq   ($acc0,$car0);
    &pand   ($acc0,$mask);
    &paddq  ($car1,$acc0);                  # +=ap[num-1]*bp[i]+tp[num-1]
    &movd   (&DWP($frame-4,"esp",$j,4),$car1);      # tp[num-2]=
    &psrlq  ($car0,32);
    &psrlq  ($car1,32);

    &movd   ($temp,&DWP($frame+4,"esp",$num,4));    # += tp[num]
    &paddq  ($car1,$car0);
    &paddq  ($car1,$temp);
    &movq   (&QWP($frame,"esp",$num,4),$car1);      # tp[num].tp[num-1]

    &lea    ($i,&DWP(1,$i));                # i++
    &cmp    ($i,$num);
    &jle    (&label("outer"));

    &emms   ();                             # done with mmx bank
    &jmp    (&label("common_tail"));

&set_label("non_sse2",16);
}

# ---- integer-only path --------------------------------------------------
# The "if (0)" branch is never generated; it would restore esp and leave
# with eax=0. The "else" branch emits the integer code in two variants:
#   * general multiplication ("mull", "1stmadd", "2ndmadd"), which walks
#     bp[] until the pointer kept in $_bp reaches $_bpend;
#   * a dedicated squaring procedure ("bn_sqr_mont", "sqr", "3rdmadd",
#     "sqradd", "sqrlast"), entered when ap==bp and num is even.
# Both variants finish by jumping to "common_tail".
# (Stray diff-viewer line numbers that had been interleaved with these
# statements were removed; the instruction sequence itself is unchanged.)
if (0) {
    &mov    ("esp",$_sp);
    &xor    ("eax","eax");  # signal "not fast enough [yet]"
    &jmp    (&label("just_leave"));
    # While the below code provides competitive performance for
    # all key lengths on modern Intel cores, it's still more
    # than 10% slower for 4096-bit key elsewhere:-( "Competitive"
    # means compared to the original integer-only assembler.
    # 512-bit RSA sign is better by ~40%, but that's about all
    # one can say about all CPUs...
} else {
$inp="esi";     # integer path uses these registers differently
$word="edi";
$carry="ebp";

    &mov    ($inp,$_ap);
    &lea    ($carry,&DWP(1,$num));          # $num register holds num-1 here
    &mov    ($word,$_bp);
    &xor    ($j,$j);                                # j=0
    &mov    ("edx",$inp);
    &and    ($carry,1);                             # see if num is even
    &sub    ("edx",$word);                          # see if ap==bp
    &lea    ("eax",&DWP(4,$word,$num,4));           # &bp[num]
    &or     ($carry,"edx");
    &mov    ($word,&DWP(0,$word));                  # bp[0]
    # ZF comes from the "or" above (mov does not alter flags): it is set
    # only when num is even and ap==bp.
    &jz     (&label("bn_sqr_mont"));
    &mov    ($_bpend,"eax");
    &mov    ("eax",&DWP(0,$inp));
    &xor    ("edx","edx");

&set_label("mull",16);
    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[j]*bp[0]
    &add    ($carry,"eax");
    &lea    ($j,&DWP(1,$j));
    &adc    ("edx",0);
    &mov    ("eax",&DWP(0,$inp,$j,4));              # ap[j+1]
    &cmp    ($j,$num);
    &mov    (&DWP($frame-4,"esp",$j,4),$carry);     # tp[j]=
    &jl     (&label("mull"));

    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[num-1]*bp[0]
    &mov    ($word,$_n0);
    &add    ("eax",$carry);
    &mov    ($inp,$_np);
    &adc    ("edx",0);
    &imul   ($word,&DWP($frame,"esp"));             # n0*tp[0]

    &mov    (&DWP($frame,"esp",$num,4),"eax");      # tp[num-1]=
    &xor    ($j,$j);
    &mov    (&DWP($frame+4,"esp",$num,4),"edx");    # tp[num]=
    &mov    (&DWP($frame+8,"esp",$num,4),$j);       # tp[num+1]=

    &mov    ("eax",&DWP(0,$inp));                   # np[0]
    &mul    ($word);                                # np[0]*m
    &add    ("eax",&DWP($frame,"esp"));             # +=tp[0]
    &mov    ("eax",&DWP(4,$inp));                   # np[1]
    &adc    ("edx",0);
    &inc    ($j);

    &jmp    (&label("2ndmadd"));

&set_label("1stmadd",16);
    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[j]*bp[i]
    &add    ($carry,&DWP($frame,"esp",$j,4));       # +=tp[j]
    &lea    ($j,&DWP(1,$j));
    &adc    ("edx",0);
    &add    ($carry,"eax");
    &mov    ("eax",&DWP(0,$inp,$j,4));              # ap[j+1]
    &adc    ("edx",0);
    &cmp    ($j,$num);
    &mov    (&DWP($frame-4,"esp",$j,4),$carry);     # tp[j]=
    &jl     (&label("1stmadd"));

    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[num-1]*bp[i]
    &add    ("eax",&DWP($frame,"esp",$num,4));      # +=tp[num-1]
    &mov    ($word,$_n0);
    &adc    ("edx",0);
    &mov    ($inp,$_np);
    &add    ($carry,"eax");
    &adc    ("edx",0);
    &imul   ($word,&DWP($frame,"esp"));             # n0*tp[0]

    &xor    ($j,$j);
    &add    ("edx",&DWP($frame+4,"esp",$num,4));    # carry+=tp[num]
    &mov    (&DWP($frame,"esp",$num,4),$carry);     # tp[num-1]=
    &adc    ($j,0);
    &mov    ("eax",&DWP(0,$inp));                   # np[0]
    &mov    (&DWP($frame+4,"esp",$num,4),"edx");    # tp[num]=
    &mov    (&DWP($frame+8,"esp",$num,4),$j);       # tp[num+1]=

    &mul    ($word);                                # np[0]*m
    &add    ("eax",&DWP($frame,"esp"));             # +=tp[0]
    &mov    ("eax",&DWP(4,$inp));                   # np[1]
    &adc    ("edx",0);
    &mov    ($j,1);

&set_label("2ndmadd",16);
    &mov    ($carry,"edx");
    &mul    ($word);                                # np[j]*m
    &add    ($carry,&DWP($frame,"esp",$j,4));       # +=tp[j]
    &lea    ($j,&DWP(1,$j));
    &adc    ("edx",0);
    &add    ($carry,"eax");
    &mov    ("eax",&DWP(0,$inp,$j,4));              # np[j+1]
    &adc    ("edx",0);
    &cmp    ($j,$num);
    &mov    (&DWP($frame-8,"esp",$j,4),$carry);     # tp[j-1]=
    &jl     (&label("2ndmadd"));

    &mov    ($carry,"edx");
    &mul    ($word);                                # np[j]*m
    &add    ($carry,&DWP($frame,"esp",$num,4));     # +=tp[num-1]
    &adc    ("edx",0);
    &add    ($carry,"eax");
    &adc    ("edx",0);
    &mov    (&DWP($frame-4,"esp",$num,4),$carry);   # tp[num-2]=

    &xor    ("eax","eax");
    &mov    ($j,$_bp);                              # &bp[i]
    &add    ("edx",&DWP($frame+4,"esp",$num,4));    # carry+=tp[num]
    &adc    ("eax",&DWP($frame+8,"esp",$num,4));    # +=tp[num+1]
    &lea    ($j,&DWP(4,$j));
    &mov    (&DWP($frame,"esp",$num,4),"edx");      # tp[num-1]=
    &cmp    ($j,$_bpend);
    &mov    (&DWP($frame+4,"esp",$num,4),"eax");    # tp[num]=
    &je     (&label("common_tail"));

    &mov    ($word,&DWP(0,$j));                     # bp[i+1]
    &mov    ($inp,$_ap);
    &mov    ($_bp,$j);                              # &bp[++i]
    &xor    ($j,$j);
    &xor    ("edx","edx");
    &mov    ("eax",&DWP(0,$inp));
    &jmp    (&label("1stmadd"));

&set_label("bn_sqr_mont",16);
# From here on the $num register is reused as $sbit; num itself is kept
# in the $_num slot, and $_bp is reused to hold the index i.
$sbit=$num;
    &mov    ($_num,$num);
    &mov    ($_bp,$j);                              # i=0

    &mov    ("eax",$word);                          # ap[0]
    &mul    ($word);                                # ap[0]*ap[0]
    &mov    (&DWP($frame,"esp"),"eax");             # tp[0]=
    &mov    ($sbit,"edx");
    &shr    ("edx",1);
    &and    ($sbit,1);
    &inc    ($j);
&set_label("sqr",16);
    &mov    ("eax",&DWP(0,$inp,$j,4));              # ap[j]
    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[j]*ap[0]
    &add    ("eax",$carry);
    &lea    ($j,&DWP(1,$j));
    &adc    ("edx",0);
    &lea    ($carry,&DWP(0,$sbit,"eax",2));
    &shr    ("eax",31);
    &cmp    ($j,$_num);
    &mov    ($sbit,"eax");
    &mov    (&DWP($frame-4,"esp",$j,4),$carry);     # tp[j]=
    &jl     (&label("sqr"));

    &mov    ("eax",&DWP(0,$inp,$j,4));              # ap[num-1]
    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[num-1]*ap[0]
    &add    ("eax",$carry);
    &mov    ($word,$_n0);
    &adc    ("edx",0);
    &mov    ($inp,$_np);
    &lea    ($carry,&DWP(0,$sbit,"eax",2));
    &imul   ($word,&DWP($frame,"esp"));             # n0*tp[0]
    &shr    ("eax",31);
    &mov    (&DWP($frame,"esp",$j,4),$carry);       # tp[num-1]=

    &lea    ($carry,&DWP(0,"eax","edx",2));
    &mov    ("eax",&DWP(0,$inp));                   # np[0]
    &shr    ("edx",31);
    &mov    (&DWP($frame+4,"esp",$j,4),$carry);     # tp[num]=
    &mov    (&DWP($frame+8,"esp",$j,4),"edx");      # tp[num+1]=

    &mul    ($word);                                # np[0]*m
    &add    ("eax",&DWP($frame,"esp"));             # +=tp[0]
    &mov    ($num,$j);
    &adc    ("edx",0);
    &mov    ("eax",&DWP(4,$inp));                   # np[1]
    &mov    ($j,1);

# Two words are handled per iteration of this loop.
&set_label("3rdmadd",16);
    &mov    ($carry,"edx");
    &mul    ($word);                                # np[j]*m
    &add    ($carry,&DWP($frame,"esp",$j,4));       # +=tp[j]
    &adc    ("edx",0);
    &add    ($carry,"eax");
    &mov    ("eax",&DWP(4,$inp,$j,4));              # np[j+1]
    &adc    ("edx",0);
    &mov    (&DWP($frame-4,"esp",$j,4),$carry);     # tp[j-1]=

    &mov    ($carry,"edx");
    &mul    ($word);                                # np[j+1]*m
    &add    ($carry,&DWP($frame+4,"esp",$j,4));     # +=tp[j+1]
    &lea    ($j,&DWP(2,$j));
    &adc    ("edx",0);
    &add    ($carry,"eax");
    &mov    ("eax",&DWP(0,$inp,$j,4));              # np[j+2]
    &adc    ("edx",0);
    &cmp    ($j,$num);
    &mov    (&DWP($frame-8,"esp",$j,4),$carry);     # tp[j]=
    &jl     (&label("3rdmadd"));

    &mov    ($carry,"edx");
    &mul    ($word);                                # np[j]*m
    &add    ($carry,&DWP($frame,"esp",$num,4));     # +=tp[num-1]
    &adc    ("edx",0);
    &add    ($carry,"eax");
    &adc    ("edx",0);
    &mov    (&DWP($frame-4,"esp",$num,4),$carry);   # tp[num-2]=

    &mov    ($j,$_bp);                              # i
    &xor    ("eax","eax");
    &mov    ($inp,$_ap);
    &add    ("edx",&DWP($frame+4,"esp",$num,4));    # carry+=tp[num]
    &adc    ("eax",&DWP($frame+8,"esp",$num,4));    # +=tp[num+1]
    &mov    (&DWP($frame,"esp",$num,4),"edx");      # tp[num-1]=
    &cmp    ($j,$num);
    &mov    (&DWP($frame+4,"esp",$num,4),"eax");    # tp[num]=
    &je     (&label("common_tail"));

    &mov    ($word,&DWP(4,$inp,$j,4));              # ap[i]
    &lea    ($j,&DWP(1,$j));
    &mov    ("eax",$word);
    &mov    ($_bp,$j);                              # ++i
    &mul    ($word);                                # ap[i]*ap[i]
    &add    ("eax",&DWP($frame,"esp",$j,4));        # +=tp[i]
    &adc    ("edx",0);
    &mov    (&DWP($frame,"esp",$j,4),"eax");        # tp[i]=
    &xor    ($carry,$carry);
    &cmp    ($j,$num);
    &lea    ($j,&DWP(1,$j));                        # lea keeps the flags from cmp
    &je     (&label("sqrlast"));

    &mov    ($sbit,"edx");                          # zaps $num
    &shr    ("edx",1);
    &and    ($sbit,1);
&set_label("sqradd",16);
    &mov    ("eax",&DWP(0,$inp,$j,4));              # ap[j]
    &mov    ($carry,"edx");
    &mul    ($word);                                # ap[j]*ap[i]
    &add    ("eax",$carry);
    &lea    ($carry,&DWP(0,"eax","eax"));
    &adc    ("edx",0);
    &shr    ("eax",31);
    &add    ($carry,&DWP($frame,"esp",$j,4));       # +=tp[j]
    &lea    ($j,&DWP(1,$j));
    &adc    ("eax",0);
    &add    ($carry,$sbit);
    &adc    ("eax",0);
    &cmp    ($j,$_num);
    &mov    (&DWP($frame-4,"esp",$j,4),$carry);     # tp[j]=
    &mov    ($sbit,"eax");
    &jle    (&label("sqradd"));

    &mov    ($carry,"edx");
    &lea    ("edx",&DWP(0,$sbit,"edx",2));
    &shr    ($carry,31);
&set_label("sqrlast");
    &mov    ($word,$_n0);
    &mov    ($inp,$_np);
    &imul   ($word,&DWP($frame,"esp"));             # n0*tp[0]

    &add    ("edx",&DWP($frame,"esp",$j,4));        # +=tp[num]
    &mov    ("eax",&DWP(0,$inp));                   # np[0]
    &adc    ($carry,0);
    &mov    (&DWP($frame,"esp",$j,4),"edx");        # tp[num]=
    &mov    (&DWP($frame+4,"esp",$j,4),$carry);     # tp[num+1]=

    &mul    ($word);                                # np[0]*m
    &add    ("eax",&DWP($frame,"esp"));             # +=tp[0]
    &lea    ($num,&DWP(-1,$j));                     # reload the $num register from j
    &adc    ("edx",0);
    &mov    ($j,1);
    &mov    ("eax",&DWP(4,$inp));                   # np[1]

    &jmp    (&label("3rdmadd"));
}

# ---- common tail --------------------------------------------------------
# Shared by all code paths. Computes rp[] = tp[] - np[] word by word with
# borrow propagation, then uses the final borrow as a mask to pick either
# tp (borrow) or rp (no borrow) as the copy source. That vector is copied
# into rp while the temporary vector on the stack is overwritten. Finally
# esp is restored from $_sp and eax is set to 1.
# (Stray diff-viewer line numbers that had been interleaved with these
# statements were removed; the instruction sequence itself is unchanged.)
&set_label("common_tail",16);
    &mov    ($np,$_np);                     # load modulus pointer
    &mov    ($rp,$_rp);                     # load result pointer
    &lea    ($tp,&DWP($frame,"esp"));       # [$ap and $bp are zapped]

    &mov    ("eax",&DWP(0,$tp));            # tp[0]
    &mov    ($j,$num);                      # j=num-1
    &xor    ($i,$i);                        # i=0 and clear CF!

&set_label("sub",16);
    &sbb    ("eax",&DWP(0,$np,$i,4));
    &mov    (&DWP(0,$rp,$i,4),"eax");       # rp[i]=tp[i]-np[i]
    &dec    ($j);                           # doesn't affect CF!
    &mov    ("eax",&DWP(4,$tp,$i,4));       # tp[i+1]
    &lea    ($i,&DWP(1,$i));                # i++
    &jge    (&label("sub"));                # flags still those of dec

    &sbb    ("eax",0);                      # handle upmost overflow bit
    &and    ($tp,"eax");
    &not    ("eax");
    &mov    ($np,$rp);
    &and    ($np,"eax");
    &or     ($tp,$np);                      # tp=carry?tp:rp

&set_label("copy",16);                      # copy or in-place refresh
    &mov    ("eax",&DWP(0,$tp,$num,4));
    &mov    (&DWP(0,$rp,$num,4),"eax");     # rp[i]=tp[i]
    &mov    (&DWP($frame,"esp",$num,4),$j); # zap temporary vector
    &dec    ($num);
    &jge    (&label("copy"));

    &mov    ("esp",$_sp);                   # pull saved stack pointer
    &mov    ("eax",1);
&set_label("just_leave");
&function_end("bn_mul_mont");

# Emit the identification string and finish the perlasm output.
# (Stray diff-viewer line numbers between these two statements were removed.)
&asciz("Montgomery Multiplication for x86, CRYPTOGAMS by <appro\@openssl.org>");

&asm_finish();

Older »