ARMv8 assembly pack: add Qualcomm Kryo results.
author Andy Polyakov <appro@openssl.org>
Sat, 11 Nov 2017 22:49:16 +0000 (23:49 +0100)
committer Andy Polyakov <appro@openssl.org>
Mon, 13 Nov 2017 10:13:00 +0000 (11:13 +0100)
[skip ci]

Reviewed-by: Tim Hudson <tjh@openssl.org>
crypto/aes/asm/aesv8-armx.pl
crypto/chacha/asm/chacha-armv8.pl
crypto/modes/asm/ghashv8-armx.pl
crypto/poly1305/asm/poly1305-armv8.pl
crypto/sha/asm/keccak1600-armv8.pl
crypto/sha/asm/sha1-armv8.pl
crypto/sha/asm/sha512-armv8.pl

index 385b31fd54e4d7477e00b5616f0b79062f74b4e2..8b37cfc452a02d57f83f666b49a4960dc8570464 100755 (executable)
@@ -35,6 +35,7 @@
 # Cortex-A57(*)        1.95            0.85            0.93
 # Denver       1.96            0.86            0.80
 # Mongoose     1.33            1.20            1.20
+# Kryo         1.26            0.94            1.00
 #
 # (*)  original 3.64/1.34/1.32 results were for r0p0 revision
 #      and are still same even for updated module;
index db3776a2fc17b578085efbcb10f87d84213f0015..4a838bc2b32e204e0d0f3a3f7176a3f5b8e57dce 100755 (executable)
@@ -28,6 +28,7 @@
 # Denver               4.50/+82%       2.63            2.67(*)
 # X-Gene               9.50/+46%       8.82            8.89(*)
 # Mongoose             8.00/+44%       3.64            3.25
+# Kryo                 8.17/+50%       4.83            4.65
 #
 # (*)  it's expected that doubling interleave factor doesn't help
 #      all processors, only those with higher NEON latency and
index a2b0db29ff1841959459f2d8f4754b500a14d999..7187d28b78eafe3c4937e2585a7815531397c97e 100644 (file)
@@ -33,6 +33,7 @@
 # Cortex-A57   1.17            7.61
 # Denver       0.71            6.02
 # Mongoose     1.10            8.06
+# Kryo         1.16            8.00
 #
 # (*)  presented for reference/comparison purposes;
 
index 0fc8667ac7b1674fb55a9b5e753aa03fc6de36bd..ac06457b65301a4dd8b95e8aa30f12f5b02bd389 100755 (executable)
@@ -28,6 +28,7 @@
 # Denver       1.64/+50%       1.18(*)
 # X-Gene       2.13/+68%       2.27
 # Mongoose     1.77/+75%       1.12
+# Kryo         2.70/+55%       1.13
 #
 # (*)  estimate based on resources availability is less than 1.0,
 #      i.e. measured result is worse than expected, presumably binary
index 6ab28accd4de361a4c5718a425cf349b4916c5de..5e4cf77003ddd3b6c2c91988eb6e2a28541d582e 100755 (executable)
@@ -35,6 +35,7 @@
 # Cortex-A57   12
 # X-Gene       14
 # Mongoose     10
+# Kryo         12
 # Denver       7.8
 # Apple A7     7.2
 #
index 84a00bf2afe80b04f5f6e96d16cbba19a7784594..3ba871fedee65f0bce247e8da67a2c588dbbd134 100644 (file)
@@ -26,6 +26,7 @@
 # Denver       2.13                    3.97 (+0%)(**)
 # X-Gene                               8.80 (+200%)
 # Mongoose     2.05                    6.50 (+160%)
+# Kryo         1.88                    8.00 (+90%)
 #
 # (*)  Software results are presented mostly for reference purposes.
 # (**) Keep in mind that Denver relies on binary translation, which
index 88ad44ee5e57f77cce1bca383e9f704a9f93e6d0..a4755e6c364095a9cec2146357f4ae02649e6ca3 100644 (file)
@@ -27,6 +27,7 @@
 # Denver       2.01            10.5 (+26%)     6.70 (+8%)
 # X-Gene                       20.0 (+100%)    12.8 (+300%(***))
 # Mongoose     2.36            13.0 (+50%)     8.36 (+33%)
+# Kryo         1.92            17.4 (+30%)     11.2 (+8%)
 #
 # (*)  Software SHA256 results are of lesser relevance, presented
 #      mostly for informational purposes.