summary | refs | log | tree | commit | diff | stats
path: root/crypto
diff options
context:
space:
mode:
author: Andy Polyakov <appro@openssl.org> 2015-12-21 14:26:12 +0100
committer: Andy Polyakov <appro@openssl.org> 2015-12-22 10:30:03 +0100
commit: b859d70d4a04db2e3b39b5c86cb6750d3c5b9593 (patch)
tree: 8e739dc3aeb492fc986b3e70ae7e29dded9011a2 /crypto
parent: sha/asm/sha256-armv4.pl: one of "universal" flags combination didn't compile. (diff)
download: openssl-b859d70d4a04db2e3b39b5c86cb6750d3c5b9593.tar.xz
          openssl-b859d70d4a04db2e3b39b5c86cb6750d3c5b9593.zip
bn/asm/bn-c64xplus.asm: update commentary.
Reviewed-by: Rich Salz <rsalz@openssl.org>
Diffstat (limited to 'crypto')
-rw-r--r-- crypto/bn/asm/bn-c64xplus.asm 5
1 files changed, 3 insertions, 2 deletions
diff --git a/crypto/bn/asm/bn-c64xplus.asm b/crypto/bn/asm/bn-c64xplus.asm
index 7cd58817e7..7b72bff4ac 100644
--- a/crypto/bn/asm/bn-c64xplus.asm
+++ b/crypto/bn/asm/bn-c64xplus.asm
@@ -284,8 +284,9 @@ _bn_mul_comba4:
.if 0
BNOP sploopNxM?,3
;; Above mentioned m*2*(n+1)+10 does not apply in n=m=4 case,
- ;; because of read-after-write penalties, it's rather
- ;; n*2*(n+3)+10, or 66 cycles [plus various overheads]...
+ ;; because of low-counter effect, when prologue phase finishes
+ ;; before SPKERNEL instruction is reached. As result it's 25%
+ ;; slower than expected...
MVK 4,B0 ; N, RILC
|| MVK 4,A0 ; M, outer loop counter
|| MV ARG1,A5 ; copy ap