[arch-commits] Commit in libgcrypt/trunk (3 files)

Andreas Radke andyrtr at nymeria.archlinux.org
Fri Jan 17 09:20:21 UTC 2014


    Date: Friday, January 17, 2014 @ 10:20:21
  Author: andyrtr
Revision: 204313

upgpkg: libgcrypt 1.6.0-2

add post release fixes to properly detect AVX/AVX2 cpu extension and fix PBKDF2 slowness; FS#38533/FS#38538

Added:
  libgcrypt/trunk/fix_avx_detection.patch
  libgcrypt/trunk/fix_slow_PBKDF2.patch
Modified:
  libgcrypt/trunk/PKGBUILD

-------------------------+
 PKGBUILD                |   20 ++++-
 fix_avx_detection.patch |  159 ++++++++++++++++++++++++++++++++++++++++++++++
 fix_slow_PBKDF2.patch   |   75 +++++++++++++++++++++
 3 files changed, 251 insertions(+), 3 deletions(-)

Modified: PKGBUILD
===================================================================
--- PKGBUILD	2014-01-17 09:05:40 UTC (rev 204312)
+++ PKGBUILD	2014-01-17 09:20:21 UTC (rev 204313)
@@ -7,7 +7,7 @@
 
 pkgname=libgcrypt
 pkgver=1.6.0
-pkgrel=1
+pkgrel=2
 pkgdesc="General purpose cryptographic library based on the code from GnuPG"
 arch=(i686 x86_64)
 url="http://www.gnupg.org"
@@ -15,9 +15,23 @@
 depends=('libgpg-error>=1.10-2')
 options=('!emptydirs')
 install=$pkgname.install
-source=(ftp://ftp.gnupg.org/gcrypt/${pkgname}/${pkgname}-${pkgver}.tar.bz2)
-sha1sums=('43283c0b41c41e3d3bc13c2d8f937dfe2aaa1a77')
+source=(ftp://ftp.gnupg.org/gcrypt/${pkgname}/${pkgname}-${pkgver}.tar.bz2
+        fix_avx_detection.patch
+        fix_slow_PBKDF2.patch)
+sha1sums=('43283c0b41c41e3d3bc13c2d8f937dfe2aaa1a77'
+          '5219ee3d6e08155149f0fa410b07736d4f502d17'
+          'a27baab3f4bda7ff6fb493115f6bdd1c990184f1')
 
+prepare() {
+  cd ${pkgname}-${pkgver}
+  
+  # fix AVX/AVX2 detextion
+  patch -Np1 -i ${srcdir}/fix_avx_detection.patch
+  
+  # fix slow PBKDF2
+  patch -Np1 -i ${srcdir}/fix_slow_PBKDF2.patch
+}
+
 build() {
   cd ${pkgname}-${pkgver}
   ./configure --prefix=/usr \

Added: fix_avx_detection.patch
===================================================================
--- fix_avx_detection.patch	                        (rev 0)
+++ fix_avx_detection.patch	2014-01-17 09:20:21 UTC (rev 204313)
@@ -0,0 +1,159 @@
+From: Jussi Kivilinna <jussi.kivilinna at iki.fi>
+Date: Sun, 12 Jan 2014 09:31:20 +0000 (+0200)
+Subject: Fix buggy/incomplete detection of AVX/AVX2 support
+X-Git-Url: http://git.gnupg.org/cgi-bin/gitweb.cgi?p=libgcrypt.git;a=commitdiff_plain;h=8302d66d140d5c78c5e808fa1555ed7a8ee27921
+
+Fix buggy/incomplete detection of AVX/AVX2 support
+
+* configure.ac: Also check for 'xgetbv' instruction in AVX and AVX2
+inline assembly checks.
+* src/hwf-x86.c [__i386__] (get_xgetbv): New function.
+[__x86_64__] (get_xgetbv): New function.
+[HAS_X86_CPUID] (detect_x86_gnuc): Check for OSXSAVE and OS support for
+XMM&YMM registers and enable AVX/AVX2 only if XMM&YMM registers are
+supported by OS.
+--
+
+This patch is based on original patch and bug report by Panagiotis Christopoulos:
+
+  Adding better detection of AVX/AVX2 support
+
+  After upgrading libgcrypt from 1.5.3 to 1.6.0 on a remote XEN system (linode) my
+  gpg2 stopped working properly, throwing SIGILL signals when doing sha512
+  operations etc. I managed to debug this with the help of Doublas Freed
+  (dwfreed at mtu.edu) and it seems that the current AVX detection just checks for
+  bit 28 on cpuid but the check still works  on systems that have disabled the avx/avx2
+  instructions for some reason (eg. performance/unstability) resulting in SIGILLs
+  (eg. when trying _gcry_sha512_transform_amd64_avx() ).
+  From Intel resources[1][2], I found additional checks for better AVX
+  detection and applied them in the following patch. Please review/change
+  accordingly and commit some better AVX detection mechanism. The AVX part is
+  tested but could not test the AVX2 one, because I lack proper hardware. I can
+  provide additional information upon request. Use the patch only as a guideline,
+  as it's not thoroughly tested.
+
+  [1] http://software.intel.com/en-us/blogs/2011/04/14/is-avx-enabled
+  [2] http://www.intel.com/content/dam/www/public/us/en/documents/manuals/64-ia-32-architectures-software-developer-manual-325462.pdf (sections 14.3 
+and 14.7.1)
+
+Reported-by: Panagiotis Christopoulos (pchrist) <pchrist at gentoo.org>
+Cc: Doublas Freed <dwfreed at mtu.edu>
+Cc: Tim Harder <radhermit at gentoo.org>
+Signed-off-by: Jussi Kivilinna <jussi.kivilinna at iki.fi>
+(cherry picked from commit bbcb12187afb1756cb27296166b57fa19ee45d4d)
+---
+
+diff --git a/configure.ac b/configure.ac
+index a47e13e..3387b9a 100644
+--- a/configure.ac
++++ b/configure.ac
+@@ -1035,7 +1035,7 @@ AC_CACHE_CHECK([whether GCC inline assembler supports AVX instructions],
+        [gcry_cv_gcc_inline_asm_avx=no
+         AC_COMPILE_IFELSE([AC_LANG_SOURCE(
+           [[void a(void) {
+-              __asm__("vaesdeclast (%[mem]),%%xmm0,%%xmm7\n\t"::[mem]"r"(0):);
++              __asm__("xgetbv; vaesdeclast (%[mem]),%%xmm0,%%xmm7\n\t"::[mem]"r"(0):);
+             }]])],
+           [gcry_cv_gcc_inline_asm_avx=yes])])
+ if test "$gcry_cv_gcc_inline_asm_avx" = "yes" ; then
+@@ -1052,7 +1052,7 @@ AC_CACHE_CHECK([whether GCC inline assembler supports AVX2 instructions],
+        [gcry_cv_gcc_inline_asm_avx2=no
+         AC_COMPILE_IFELSE([AC_LANG_SOURCE(
+           [[void a(void) {
+-              __asm__("vpbroadcastb %%xmm7,%%ymm1\n\t":::"cc");
++              __asm__("xgetbv; vpbroadcastb %%xmm7,%%ymm1\n\t":::"cc");
+             }]])],
+           [gcry_cv_gcc_inline_asm_avx2=yes])])
+ if test "$gcry_cv_gcc_inline_asm_avx2" = "yes" ; then
+diff --git a/src/hwf-x86.c b/src/hwf-x86.c
+index 4e82558..0591b4f 100644
+--- a/src/hwf-x86.c
++++ b/src/hwf-x86.c
+@@ -95,6 +95,21 @@ get_cpuid(unsigned int in, unsigned int *eax, unsigned int *ebx,
+   if (edx)
+     *edx = regs[3];
+ }
++
++static unsigned int
++get_xgetbv(void)
++{
++  unsigned int t_eax;
++
++  asm volatile
++    ("xgetbv\n\t"
++     : "=a" (t_eax)
++     : "c" (0)
++    );
++
++  return t_eax;
++}
++
+ #endif /* i386 && GNUC */
+ 
+ 
+@@ -129,6 +144,21 @@ get_cpuid(unsigned int in, unsigned int *eax, unsigned int *ebx,
+   if (edx)
+     *edx = regs[3];
+ }
++
++static unsigned int
++get_xgetbv(void)
++{
++  unsigned int t_eax;
++
++  asm volatile
++    ("xgetbv\n\t"
++     : "=a" (t_eax)
++     : "c" (0)
++    );
++
++  return t_eax;
++}
++
+ #endif /* x86-64 && GNUC */
+ 
+ 
+@@ -138,9 +168,12 @@ detect_x86_gnuc (void)
+ {
+   char vendor_id[12+1];
+   unsigned int features;
++  unsigned int os_supports_avx_avx2_registers = 0;
+   unsigned int max_cpuid_level;
+   unsigned int result = 0;
+ 
++  (void)os_supports_avx_avx2_registers;
++
+   if (!is_cpuid_available())
+     return 0;
+ 
+@@ -215,10 +248,20 @@ detect_x86_gnuc (void)
+   if (features & 0x02000000)
+      result |= HWF_INTEL_AESNI;
+ #endif /*ENABLE_AESNI_SUPPORT*/
++#if defined(ENABLE_AVX_SUPPORT) || defined(ENABLE_AVX2_SUPPORT)
++  /* Test bit 27 for OSXSAVE (required for AVX/AVX2).  */
++  if (features & 0x08000000)
++    {
++      /* Check that OS has enabled both XMM and YMM state support.  */
++      if ((get_xgetbv() & 0x6) == 0x6)
++        os_supports_avx_avx2_registers = 1;
++    }
++#endif
+ #ifdef ENABLE_AVX_SUPPORT
+   /* Test bit 28 for AVX.  */
+   if (features & 0x10000000)
+-     result |= HWF_INTEL_AVX;
++    if (os_supports_avx_avx2_registers)
++      result |= HWF_INTEL_AVX;
+ #endif /*ENABLE_AVX_SUPPORT*/
+ #ifdef ENABLE_DRNG_SUPPORT
+   /* Test bit 30 for RDRAND.  */
+@@ -242,6 +285,7 @@ detect_x86_gnuc (void)
+ #ifdef ENABLE_AVX2_SUPPORT
+       /* Test bit 5 for AVX2.  */
+       if (features & 0x00000020)
++        if (os_supports_avx_avx2_registers)
+           result |= HWF_INTEL_AVX2;
+ #endif /*ENABLE_AVX_SUPPORT*/
+     }
+

Added: fix_slow_PBKDF2.patch
===================================================================
--- fix_slow_PBKDF2.patch	                        (rev 0)
+++ fix_slow_PBKDF2.patch	2014-01-17 09:20:21 UTC (rev 204313)
@@ -0,0 +1,75 @@
+From: Milan Broz <gmazyland at gmail.com>
+Date: Mon, 13 Jan 2014 20:30:42 +0000 (+0100)
+Subject: PBKDF2: Use gcry_md_reset to speed up calculation.
+X-Git-Url: http://git.gnupg.org/cgi-bin/gitweb.cgi?p=libgcrypt.git;a=commitdiff_plain;h=ead3a097a9ee5908e562e6ec683707c38191acf3
+
+PBKDF2: Use gcry_md_reset to speed up calculation.
+
+* cipher/kdf.c (_gcry_kdf_pkdf2): Use gcry_md_reset
+to speed up calculation.
+--
+
+Current PBKDF2 implementation uses gcry_md_set_key in every iteration
+which is extremely slow (even in comparison with other implementations).
+
+Use gcry_md_reset instead and set key only once.
+
+With this test program:
+
+  char input[32000], salt[8], key[16];
+  gcry_kdf_derive(input, sizeof(input), GCRY_KDF_PBKDF2,
+                  gcry_md_map_name("sha1"),
+                  salt, sizeof(salt), 100000, sizeof(key), key);
+
+running time without patch:
+  real    0m11.165s
+  user    0m11.136s
+  sys     0m0.000s
+
+and with patch applied
+  real    0m0.230s
+  user    0m0.184s
+  sys     0m0.024s
+
+(The problem was found when cryptsetup started to use gcrypt internal PBKDF2
+and for very long keyfiles unlocking time increased drastically.
+See https://bugzilla.redhat.com/show_bug.cgi?id=1051733)
+
+Signed-off-by: Milan Broz <gmazyland at gmail.com>
+(cherry picked from commit 04cda6b7cc16f3f52c12d9d3e46c56701003496e)
+---
+
+diff --git a/cipher/kdf.c b/cipher/kdf.c
+index 503f068..af0dc48 100644
+--- a/cipher/kdf.c
++++ b/cipher/kdf.c
+@@ -175,19 +175,21 @@ _gcry_kdf_pkdf2 (const void *passphrase, size_t passphraselen,
+       return ec;
+     }
+ 
++  ec = _gcry_md_setkey (md, passphrase, passphraselen);
++  if (ec)
++    {
++      _gcry_md_close (md);
++      xfree (sbuf);
++      return ec;
++    }
++
+   /* Step 3 and 4. */
+   memcpy (sbuf, salt, saltlen);
+   for (lidx = 1; lidx <= l; lidx++)
+     {
+       for (iter = 0; iter < iterations; iter++)
+         {
+-          ec = _gcry_md_setkey (md, passphrase, passphraselen);
+-          if (ec)
+-            {
+-              _gcry_md_close (md);
+-              xfree (sbuf);
+-              return ec;
+-            }
++          _gcry_md_reset (md);
+           if (!iter) /* Compute U_1:  */
+             {
+               sbuf[saltlen]     = (lidx >> 24);
+




More information about the arch-commits mailing list