ARMv8 assembly pack: add Samsung Mongoose results.
author Andy Polyakov <appro@openssl.org>
Sun, 14 Aug 2016 20:37:58 +0000 (22:37 +0200)
committer Andy Polyakov <appro@openssl.org>
Tue, 16 Aug 2016 10:47:49 +0000 (12:47 +0200)
Reviewed-by: Tim Hudson <tjh@openssl.org>
crypto/aes/asm/aesv8-armx.pl
crypto/aes/asm/vpaes-armv8.pl
crypto/chacha/asm/chacha-armv8.pl
crypto/modes/asm/ghashv8-armx.pl
crypto/poly1305/asm/poly1305-armv8.pl
crypto/sha/asm/sha1-armv8.pl
crypto/sha/asm/sha512-armv8.pl

index aa36ed272405ff172c50cef012dc5d1bcf6a1d2a..9246dbb43722fbf09079eb1af87c47707dfbe2ae 100755 (executable)
@@ -34,6 +34,7 @@
 # Cortex-A53   1.32            1.29            1.46
 # Cortex-A57(*)        1.95            0.85            0.93
 # Denver       1.96            0.86            0.80
+# Mongoose     1.33            1.20            1.20
 #
 # (*)  original 3.64/1.34/1.32 results were for r0p0 revision
 #      and are still same even for updated module;
index 776a9b744f3d8ce8a52bcc755b86cc643569d633..d6b5f561c4cff586591ce27817ca6e6e0d039793 100755 (executable)
@@ -29,6 +29,7 @@
 # X-Gene            45.9(**)    45.8/57.7(**)    [33.1/37.6(**)     ]
 # Denver(***)       16.6(**)    15.1/17.8(**)    [8.80/9.93         ]
 # Apple A7(***)     22.7(**)    10.9/14.3        [8.45/10.0         ]
+# Mongoose(***)     26.3(**)    21.0/25.0(**)    [13.3/16.8         ]
 #
 # (*)  ECB denotes approximate result for parallelizeable modes
 #      such as CBC decrypt, CTR, etc.;
index 03e8616a035f81c772851cbcb0dc70003e1d25cf..f7e10747145026f336a7d847e51234a2147d7e26 100755 (executable)
@@ -27,6 +27,7 @@
 # Cortex-A57           8.06/+43%       4.90            4.43(**)
 # Denver               4.50/+82%       2.63            2.67(*)
 # X-Gene               9.50/+46%       8.82            8.89(*)
+# Mongoose             8.00/+44%       3.64            3.25
 #
 # (*)  it's expected that doubling interleave factor doesn't help
 #      all processors, only those with higher NEON latency and
index 5fcd0b9d032ba04189eefef8b81b6acfb63f61fa..cb4537b2217c7e9f5909ddefe46cd1a981d60909 100644 (file)
@@ -35,6 +35,7 @@
 # Cortex-A53   1.01            8.39
 # Cortex-A57   1.17            7.61
 # Denver       0.71            6.02
+# Mongoose     1.10            8.06
 #
 # (*)  presented for reference/comparison purposes;
 
index 98a96b799fa5977b2512078a242a954ee938dd47..607696cab2031397c3a3e01e73f1d4a8eec80794 100755 (executable)
@@ -27,6 +27,7 @@
 # Cortex-A57   2.70/+7%        1.14
 # Denver       1.64/+50%       1.18(*)
 # X-Gene       2.13/+68%       2.27
+# Mongoose     1.77/+75%       1.12
 #
 # (*)  estimate based on resources availability is less than 1.0,
 #      i.e. measured result is worse than expected, presumably binary
index 39609a45bd45174d24919811d3dab58d6d968280..84a00bf2afe80b04f5f6e96d16cbba19a7784594 100644 (file)
@@ -25,6 +25,7 @@
 # Cortex-A57   2.35                    7.88 (+74%)
 # Denver       2.13                    3.97 (+0%)(**)
 # X-Gene                               8.80 (+200%)
+# Mongoose     2.05                    6.50 (+160%)
 #
 # (*)  Software results are presented mostly for reference purposes.
 # (**) Keep in mind that Denver relies on binary translation, which
index ef517df64bf328bb4fabe9922e6e54e7af1762ae..c1aaf778f45a6ef72f6b8308c5fb0658207e8127 100644 (file)
@@ -25,6 +25,7 @@
 # Cortex-A57   2.31            11.6 (+86%)     7.51 (+260%(***))
 # Denver       2.01            10.5 (+26%)     6.70 (+8%)
 # X-Gene                       20.0 (+100%)    12.8 (+300%(***))
+# Mongoose     2.36            13.0 (+50%)     8.36 (+33%)
 # 
 # (*)  Software SHA256 results are of lesser relevance, presented
 #      mostly for informational purposes.