From 5cd8ce42ec7f92beac8a7b9d7760f4c873747190 Mon Sep 17 00:00:00 2001 From: Andy Polyakov Date: Tue, 24 Jun 2014 08:06:05 +0200 Subject: ARMv8 assembly pack: add Cortex performance numbers. (cherry picked from commit 0f777aeb50b109052d41b8a55d97faecf728ea00) --- crypto/sha/asm/sha1-armv8.pl | 3 ++- crypto/sha/asm/sha512-armv8.pl | 10 ++++++++-- 2 files changed, 10 insertions(+), 3 deletions(-) (limited to 'crypto/sha') diff --git a/crypto/sha/asm/sha1-armv8.pl b/crypto/sha/asm/sha1-armv8.pl index c1f552b6b3..deb1238d36 100644 --- a/crypto/sha/asm/sha1-armv8.pl +++ b/crypto/sha/asm/sha1-armv8.pl @@ -14,7 +14,8 @@ # # hardware-assisted software(*) # Apple A7 2.31 4.13 (+14%) -# Cortex-A5x n/a n/a +# Cortex-A53 2.19 8.73 (+108%) +# Cortex-A57 2.35 7.88 (+74%) # # (*) Software results are presented mostly for reference purposes. diff --git a/crypto/sha/asm/sha512-armv8.pl b/crypto/sha/asm/sha512-armv8.pl index 6935ed6521..bd7a0a5662 100644 --- a/crypto/sha/asm/sha512-armv8.pl +++ b/crypto/sha/asm/sha512-armv8.pl @@ -14,12 +14,18 @@ # # SHA256-hw SHA256(*) SHA512 # Apple A7 1.97 10.5 (+33%) 6.73 (-1%(**)) -# Cortex-A5x n/a n/a n/a +# Cortex-A53 2.38 15.6 (+110%) 10.1 (+190%(***)) +# Cortex-A57 2.31 11.6 (+86%) 7.51 (+260%(***)) # # (*) Software SHA256 results are of lesser relevance, presented # mostly for informational purposes. # (**) The result is a trade-off: it's possible to improve it by -# 10%, but at the cost of 20% loss on Cortex-A5x. +# 10% (or by 1 cycle per round), but at the cost of 20% loss +# on Cortex-A53 (or by 4 cycles per round). +# (***) Super-impressive coefficients over gcc-generated code are +# indication of some compiler "pathology", most notably code +# generated with -mgeneral-regs-only is significanty faster +# and lags behind assembly only by 50-90%. $flavour=shift; $output=shift; -- cgit v1.2.3