diff options
author | Andy Polyakov <appro@openssl.org> | 2010-11-29 20:52:43 +0000 |
---|---|---|
committer | Andy Polyakov <appro@openssl.org> | 2010-11-29 20:52:43 +0000 |
commit | e822c756b66024d49ab936bf77b745206660fcd2 (patch) | |
tree | c5c6cd2bec509720a0753e245bd3731e99c6de83 /crypto/modes/asm/ghash-s390x.pl | |
parent | 300b1d76fe27541c662ca606a6a201b2718e0c65 (diff) |
s390x assembler pack: adapt for -m31 build, see commentary in Configure
for more details.
Diffstat (limited to 'crypto/modes/asm/ghash-s390x.pl')
-rw-r--r-- | crypto/modes/asm/ghash-s390x.pl | 29 |
1 files changed, 26 insertions, 3 deletions
diff --git a/crypto/modes/asm/ghash-s390x.pl b/crypto/modes/asm/ghash-s390x.pl index d7689de541..16ad034fc1 100644 --- a/crypto/modes/asm/ghash-s390x.pl +++ b/crypto/modes/asm/ghash-s390x.pl @@ -18,6 +18,26 @@ # and the result should be close to 12. In the lack of instruction- # level profiling data it's impossible to tell why... +# November 2010. +# +# Adapt for -m31 build. If kernel supports what's called "highgprs" +# feature on Linux [see /proc/cpuinfo], it's possible to use 64-bit +# instructions and achieve "64-bit" performance even in 31-bit legacy +# application context. The feature is not specific to any particular +# processor, as long as it's "z-CPU". Latter implies that the code +# remains z/Architecture specific. On z990 it was measured to perform +# 2.8x better than 32-bit code generated by gcc 4.3. + +$flavour = shift; + +if ($flavour =~ /3[12]/) { + $SIZE_T=4; + $g=""; +} else { + $SIZE_T=8; + $g="g"; +} + while (($output=shift) && ($output!~/^\w[\w\-]*\.\w+$/)) {} open STDOUT,">$output"; @@ -74,7 +94,7 @@ $code.=<<___ if(!$softonly); .Lsoft_gmult: ___ $code.=<<___; - stmg %r6,%r14,48($sp) + stm${g} %r6,%r14,6*$SIZE_T($sp) aghi $Xi,-1 lghi $len,1 @@ -109,8 +129,11 @@ $code.=<<___ if(!$softonly); .align 32 .Lsoft_ghash: ___ +$cdoe.=<<___ if ($flavour =~ /3[12]/); + llgfr $len,$len +___ $code.=<<___; - stmg %r6,%r14,48($sp) + stm${g} %r6,%r14,6*$SIZE_T($sp) aghi $Xi,-1 srlg $len,$len,4 @@ -209,7 +232,7 @@ $code.=<<___; xgr $Zhi,$tmp stg $Zlo,8+1($Xi) stg $Zhi,0+1($Xi) - lmg %r6,%r14,48($sp) + lm${g} %r6,%r14,6*$SIZE_T($sp) br %r14 .type gcm_ghash_4bit,\@function .size gcm_ghash_4bit,(.-gcm_ghash_4bit) |