3
# ====================================================================
4
# Written by Andy Polyakov <appro@fy.chalmers.se> for the OpenSSL
5
# project. The module is, however, dual licensed under OpenSSL and
6
# CRYPTOGAMS licenses depending on where you obtain it. For further
7
# details see http://www.openssl.org/~appro/cryptogams/.
8
# ====================================================================
12
# "Teaser" Montgomery multiplication module for UltraSPARC. Why FPU?
13
# Because unlike integer multiplier, which simply stalls whole CPU,
14
# FPU is fully pipelined and can effectively emit 48 bit partial
15
# product every cycle. Why not blended SPARC v9? One can argue that
16
# making this module dependent on UltraSPARC VIS extension limits its
17
# binary compatibility. Well yes, it does exclude SPARC64 prior-V(!)
18
# implementations from compatibility matrix. But the rest, whole Sun
19
# UltraSPARC family and brand new Fujitsu's SPARC64 V, all support
20
# VIS extension instructions used in this module. This is considered
21
# good enough to not care about HAL SPARC64 users [if any] who have
22
# integer-only pure SPARCv9 module to "fall down" to.
24
# USI&II cores currently exhibit uniform 2x improvement [over pre-
25
# bn_mul_mont codebase] for all key lengths and benchmarks. On USIII
26
# performance improves by a few percent for shorter keys and worsens by a few
27
# percent for longer keys. This is because USIII integer multiplier
28
# is >3x faster than USI&II one, which is harder to match [but see
29
# TODO list below]. It should also be noted that SPARC64 V features
30
# out-of-order execution, which *might* mean that integer multiplier
31
# is pipelined, which in turn *might* be impossible to match... On
32
# additional note, SPARC64 V implements FP Multiply-Add instruction,
33
# which is perfectly usable in this context... In other words, as far
34
# as Fujitsu SPARC64 V goes, talk to the author:-)
36
# The implementation implies following "non-natural" limitations on
38
# - num may not be less than 4;
39
# - num has to be even;
40
# Failure to meet either condition has no fatal effects, simply
41
# doesn't give any performance gain.
44
# - modulo-schedule inner loop for better performance (on in-order
45
# execution core such as UltraSPARC this shall result in further
46
# noticeable(!) improvement);
47
# - dedicated squaring procedure[?];
49
######################################################################
52
# Modulo-scheduled inner loops allow to interleave floating point and
53
# integer instructions and minimize Read-After-Write penalties. This
54
# results in *further* 20-50% performance improvement [depending on
55
# key length, more for longer keys] on USI&II cores and 30-80% - on
58
$fname="bn_mul_mont_fpu";
60
for (@ARGV) { $bits=64 if (/\-m64/ || /\-xarch\=v9/); }
67
$frame=128; # 96 rounded up to largest known cache-line
71
# In order to provide for 32-/64-bit ABI duality, I keep integers wider
72
# than 32 bit in %g1-%g4 and %o0-%o5. %l0-%l7 and %i0-%i5 are used
73
# exclusively for pointers, indexes and other small values...
75
$rp="%i0"; # BN_ULONG *rp,
76
$ap="%i1"; # const BN_ULONG *ap,
77
$bp="%i2"; # const BN_ULONG *bp,
78
$np="%i3"; # const BN_ULONG *np,
79
$n0="%i4"; # const BN_ULONG *n0,
80
$num="%i5"; # int num);
83
$ap_l="%l1"; # a[num],n[num] are smashed to 32-bit words and saved
84
$ap_h="%l2"; # to these four vectors as double-precision FP values.
85
$np_l="%l3"; # This way a bunch of fxtods are eliminated in second
86
$np_h="%l4"; # loop and L1-cache aliasing is minimized...
89
$mask="%l7"; # 16-bit mask, 0xffff
91
$n0="%g4"; # reassigned(!) to "64-bit" register
92
$carry="%i4"; # %i4 reused(!) for a carry bit
94
# FP register naming chart
109
$ba="%f0"; $bb="%f2"; $bc="%f4"; $bd="%f6";
110
$na="%f8"; $nb="%f10"; $nc="%f12"; $nd="%f14";
111
$alo="%f16"; $alo_="%f17"; $ahi="%f18"; $ahi_="%f19";
112
$nlo="%f20"; $nlo_="%f21"; $nhi="%f22"; $nhi_="%f23";
114
$dota="%f24"; $dotb="%f26";
116
$aloa="%f32"; $alob="%f34"; $aloc="%f36"; $alod="%f38";
117
$ahia="%f40"; $ahib="%f42"; $ahic="%f44"; $ahid="%f46";
118
$nloa="%f48"; $nlob="%f50"; $nloc="%f52"; $nlod="%f54";
119
$nhia="%f56"; $nhib="%f58"; $nhic="%f60"; $nhid="%f62";
121
$ASI_FL16_P=0xD2; # magic ASI value to engage 16-bit FP load
124
.section ".text",#alloc,#execinstr
129
save %sp,-$frame-$locals,%sp
134
andcc $num,1,%g0 ! $num has to be even...
136
clr %i0 ! signal "unsupported input value"
139
sethi %hi(0xffff),$mask
140
ld [%i4+0],$n0 ! $n0 reassigned, remember?
141
or $mask,%lo(0xffff),$mask
144
or %o0,$n0,$n0 ! $n0=n0[1].n0[0]
146
sll $num,3,$num ! num*=8
148
add %sp,$bias,%o0 ! real top of stack
150
add %o1,$num,%o1 ! %o1=num*5
152
and %o0,-2048,%o0 ! optimize TLB utilization
153
sub %o0,$bias,%sp ! alloca(5*num*8)
155
rd %asi,%o7 ! save %asi
156
add %sp,$bias+$frame+$locals,$tp
158
add $ap_l,$num,$ap_l ! [an]p_[lh] point at the vectors' ends !
163
wr %g0,$ASI_FL16_P,%asi ! setup %asi for 16-bit FP loads
165
add $rp,$num,$rp ! readjust input pointers to point
166
add $ap,$num,$ap ! at the ends too...
170
stx %o7,[%sp+$bias+$frame+48] ! save %asi
172
sub %g0,$num,$i ! i=-num
173
sub %g0,$num,$j ! j=-num
178
ld [%o3+4],%g1 ! bp[0]
180
ld [%o4+4],%g5 ! ap[0]
189
mulx %o1,%o0,%o0 ! ap[0]*bp[0]
190
mulx $n0,%o0,%o0 ! ap[0]*bp[0]*n0
191
stx %o0,[%sp+$bias+$frame+0]
193
ld [%o3+0],$alo_ ! load a[j] as pair of 32-bit words
197
ld [%o5+0],$nlo_ ! load n[j] as pair of 32-bit words
202
! transfer b[i] to FPU as 4x16-bit values
212
! transfer ap[0]*b[0]*n0 to FPU as 4x16-bit values
213
ldda [%sp+$bias+$frame+6]%asi,$na
215
ldda [%sp+$bias+$frame+4]%asi,$nb
217
ldda [%sp+$bias+$frame+2]%asi,$nc
219
ldda [%sp+$bias+$frame+0]%asi,$nd
222
std $alo,[$ap_l+$j] ! save smashed ap[j] in double format
226
std $nlo,[$np_l+$j] ! save smashed np[j] in double format
236
faddd $aloa,$nloa,$nloa
239
faddd $alob,$nlob,$nlob
242
faddd $aloc,$nloc,$nloc
245
faddd $alod,$nlod,$nlod
248
faddd $ahia,$nhia,$nhia
251
faddd $ahib,$nhib,$nhib
254
faddd $ahic,$nhic,$dota ! $nhic
255
faddd $ahid,$nhid,$dotb ! $nhid
257
faddd $nloc,$nhia,$nloc
258
faddd $nlod,$nhib,$nlod
265
std $nloa,[%sp+$bias+$frame+0]
267
std $nlob,[%sp+$bias+$frame+8]
269
std $nloc,[%sp+$bias+$frame+16]
271
std $nlod,[%sp+$bias+$frame+24]
273
ld [%o4+0],$alo_ ! load a[j] as pair of 32-bit words
277
ld [%o5+0],$nlo_ ! load n[j] as pair of 32-bit words
287
ldx [%sp+$bias+$frame+0],%o0
289
ldx [%sp+$bias+$frame+8],%o1
291
ldx [%sp+$bias+$frame+16],%o2
293
ldx [%sp+$bias+$frame+24],%o3
297
std $alo,[$ap_l+$j] ! save smashed ap[j] in double format
301
faddd $aloa,$nloa,$nloa
304
std $nlo,[$np_l+$j] ! save smashed np[j] in double format
308
faddd $alob,$nlob,$nlob
312
add %o7,%o3,%o3 ! %o3.%o2[0..15].%o1[0..15].%o0[0..15]
313
faddd $aloc,$nloc,$nloc
323
!or %o7,%o0,%o0 ! 64-bit result
324
srlx %o3,16,%g1 ! 34-bit carry
327
faddd $alod,$nlod,$nlod
330
faddd $ahia,$nhia,$nhia
333
faddd $ahib,$nhib,$nhib
336
faddd $dota,$nloa,$nloa
337
faddd $dotb,$nlob,$nlob
338
faddd $ahic,$nhic,$dota ! $nhic
339
faddd $ahid,$nhid,$dotb ! $nhid
341
faddd $nloc,$nhia,$nloc
342
faddd $nlod,$nhib,$nlod
349
std $nloa,[%sp+$bias+$frame+0]
350
std $nlob,[%sp+$bias+$frame+8]
352
std $nloc,[%sp+$bias+$frame+16]
354
std $nlod,[%sp+$bias+$frame+24]
356
.align 32 ! incidentally already aligned !
360
ld [%o4+0],$alo_ ! load a[j] as pair of 32-bit words
364
ld [%o5+0],$nlo_ ! load n[j] as pair of 32-bit words
374
ldx [%sp+$bias+$frame+0],%o0
376
ldx [%sp+$bias+$frame+8],%o1
378
ldx [%sp+$bias+$frame+16],%o2
380
ldx [%sp+$bias+$frame+24],%o3
384
std $alo,[$ap_l+$j] ! save smashed ap[j] in double format
388
faddd $aloa,$nloa,$nloa
391
std $nlo,[$np_l+$j] ! save smashed np[j] in double format
395
faddd $alob,$nlob,$nlob
399
add %o7,%o3,%o3 ! %o3.%o2[0..15].%o1[0..15].%o0[0..15]
401
faddd $aloc,$nloc,$nloc
407
faddd $alod,$nlod,$nlod
413
faddd $ahia,$nhia,$nhia
417
or %o7,%o0,%o0 ! 64-bit result
418
faddd $ahib,$nhib,$nhib
421
faddd $dota,$nloa,$nloa
422
srlx %o3,16,%g1 ! 34-bit carry
423
faddd $dotb,$nlob,$nlob
427
stx %o0,[$tp] ! tp[j-1]=
429
faddd $ahic,$nhic,$dota ! $nhic
430
faddd $ahid,$nhid,$dotb ! $nhid
432
faddd $nloc,$nhia,$nloc
433
faddd $nlod,$nhib,$nlod
440
std $nloa,[%sp+$bias+$frame+0]
441
std $nlob,[%sp+$bias+$frame+8]
442
std $nloc,[%sp+$bias+$frame+16]
443
std $nlod,[%sp+$bias+$frame+24]
453
ldx [%sp+$bias+$frame+0],%o0
454
ldx [%sp+$bias+$frame+8],%o1
455
ldx [%sp+$bias+$frame+16],%o2
456
ldx [%sp+$bias+$frame+24],%o3
459
std $dota,[%sp+$bias+$frame+32]
461
std $dotb,[%sp+$bias+$frame+40]
465
add %o7,%o3,%o3 ! %o3.%o2[0..15].%o1[0..15].%o0[0..15]
474
or %o7,%o0,%o0 ! 64-bit result
475
ldx [%sp+$bias+$frame+32],%o4
477
ldx [%sp+$bias+$frame+40],%o5
478
srlx %o3,16,%g1 ! 34-bit carry
482
stx %o0,[$tp] ! tp[j-1]=
496
stx %o4,[$tp] ! tp[num-1]=
502
sub %g0,$num,$j ! j=-num
503
add %sp,$bias+$frame+$locals,$tp
508
ld [%o3+4],%g1 ! bp[i]
510
ld [%o4+4],%g5 ! ap[0]
517
ldx [$tp],%o2 ! tp[0]
520
mulx $n0,%o0,%o0 ! (ap[0]*bp[i]+t[0])*n0
521
stx %o0,[%sp+$bias+$frame+0]
523
! transfer b[i] to FPU as 4x16-bit values
529
! transfer (ap[0]*b[i]+t[0])*n0 to FPU as 4x16-bit values
530
ldda [%sp+$bias+$frame+6]%asi,$na
532
ldda [%sp+$bias+$frame+4]%asi,$nb
534
ldda [%sp+$bias+$frame+2]%asi,$nc
536
ldda [%sp+$bias+$frame+0]%asi,$nd
538
ldd [$ap_l+$j],$alo ! load a[j] in double format
542
ldd [$np_l+$j],$nlo ! load n[j] in double format
552
faddd $aloa,$nloa,$nloa
555
faddd $alob,$nlob,$nlob
558
faddd $aloc,$nloc,$nloc
561
faddd $alod,$nlod,$nlod
564
faddd $ahia,$nhia,$nhia
567
faddd $ahib,$nhib,$nhib
570
faddd $ahic,$nhic,$dota ! $nhic
571
faddd $ahid,$nhid,$dotb ! $nhid
573
faddd $nloc,$nhia,$nloc
574
faddd $nlod,$nhib,$nlod
581
std $nloa,[%sp+$bias+$frame+0]
582
std $nlob,[%sp+$bias+$frame+8]
583
std $nloc,[%sp+$bias+$frame+16]
585
std $nlod,[%sp+$bias+$frame+24]
587
ldd [$ap_l+$j],$alo ! load a[j] in double format
589
ldd [$np_l+$j],$nlo ! load n[j] in double format
597
ldx [%sp+$bias+$frame+0],%o0
598
faddd $aloa,$nloa,$nloa
600
ldx [%sp+$bias+$frame+8],%o1
602
ldx [%sp+$bias+$frame+16],%o2
603
faddd $alob,$nlob,$nlob
605
ldx [%sp+$bias+$frame+24],%o3
609
faddd $aloc,$nloc,$nloc
614
faddd $alod,$nlod,$nlod
619
faddd $ahia,$nhia,$nhia
621
add %o7,%o3,%o3 ! %o3.%o2[0..15].%o1[0..15].%o0[0..15]
627
faddd $ahib,$nhib,$nhib
630
faddd $dota,$nloa,$nloa
632
faddd $dotb,$nlob,$nlob
635
faddd $ahic,$nhic,$dota ! $nhic
637
faddd $ahid,$nhid,$dotb ! $nhid
638
or %o7,%o0,%o0 ! 64-bit result
640
faddd $nloc,$nhia,$nloc
643
faddd $nlod,$nhib,$nlod
644
srlx %o3,16,%g1 ! 34-bit carry
653
std $nloa,[%sp+$bias+$frame+0]
654
std $nlob,[%sp+$bias+$frame+8]
656
std $nloc,[%sp+$bias+$frame+16]
657
bz,pn %icc,.Linnerskip
658
std $nlod,[%sp+$bias+$frame+24]
664
ldd [$ap_l+$j],$alo ! load a[j] in double format
666
ldd [$np_l+$j],$nlo ! load n[j] in double format
674
ldx [%sp+$bias+$frame+0],%o0
675
faddd $aloa,$nloa,$nloa
677
ldx [%sp+$bias+$frame+8],%o1
679
ldx [%sp+$bias+$frame+16],%o2
680
faddd $alob,$nlob,$nlob
682
ldx [%sp+$bias+$frame+24],%o3
686
faddd $aloc,$nloc,$nloc
691
faddd $alod,$nlod,$nlod
696
faddd $ahia,$nhia,$nhia
698
add %o7,%o3,%o3 ! %o3.%o2[0..15].%o1[0..15].%o0[0..15]
703
faddd $ahib,$nhib,$nhib
706
faddd $dota,$nloa,$nloa
708
faddd $dotb,$nlob,$nlob
711
faddd $ahic,$nhic,$dota ! $nhic
713
faddd $ahid,$nhid,$dotb ! $nhid
714
or %o7,%o0,%o0 ! 64-bit result
715
faddd $nloc,$nhia,$nloc
717
ldx [$tp+8],%o7 ! tp[j]
718
faddd $nlod,$nhib,$nlod
719
srlx %o3,16,%g1 ! 34-bit carry
729
stx %o0,[$tp] ! tp[j-1]
732
std $nloa,[%sp+$bias+$frame+0]
733
std $nlob,[%sp+$bias+$frame+8]
734
std $nloc,[%sp+$bias+$frame+16]
736
std $nlod,[%sp+$bias+$frame+24]
744
ldx [%sp+$bias+$frame+0],%o0
745
ldx [%sp+$bias+$frame+8],%o1
746
ldx [%sp+$bias+$frame+16],%o2
747
ldx [%sp+$bias+$frame+24],%o3
750
std $dota,[%sp+$bias+$frame+32]
752
std $dotb,[%sp+$bias+$frame+40]
756
add %o7,%o3,%o3 ! %o3.%o2[0..15].%o1[0..15].%o0[0..15]
765
ldx [%sp+$bias+$frame+32],%o4
766
or %o7,%o0,%o0 ! 64-bit result
767
ldx [%sp+$bias+$frame+40],%o5
769
ldx [$tp+8],%o7 ! tp[j]
770
srlx %o3,16,%g1 ! 34-bit carry
778
stx %o0,[$tp] ! tp[j-1]
792
stx %o4,[$tp] ! tp[num-1]
801
add $tp,8,$tp ! adjust tp to point at the end
803
sub %g0,$num,%o7 ! n=-num
805
subcc %g0,%g0,%g0 ! clear %icc.c
822
sub %g0,$num,%o7 ! n=-num
843
sub %g0,$num,%o7 ! n=-num
854
ldx [%sp+$bias+$frame+48],%o7
855
wr %g0,%o7,%asi ! restore %asi
861
.type $fname,#function
862
.size $fname,(.-$fname)
863
.asciz "Montgomery Multipltication for UltraSPARC, CRYPTOGAMS by <appro\@openssl.org>"
867
$code =~ s/\`([^\`]*)\`/eval($1)/gem;
869
# Below substitution makes it possible to compile without demanding
870
# VIS extensions on command line, e.g. -xarch=v9 vs. -xarch=v9a. I
871
# dare to do this, because VIS capability is detected at run-time now
872
# and this routine is not called on a CPU not capable of executing it. Do
873
# note that fzeros is not the only VIS dependency! Another dependency
874
# is implicit and is just _a_ numerical value loaded to %asi register,
875
# which assembler can't recognize as VIS specific...
876
$code =~ s/fzeros\s+%f([0-9]+)/
877
sprintf(".word\t0x%x\t! fzeros %%f%d",0x81b00c20|($1<<25),$1)