Skip to content
Snippets Groups Projects
Select Git revision
  • master
  • siv-mode
  • delete-des-compat
  • delete-rsa_blind
  • aes-struct-layout
  • master-updates
  • release-3.4-fixes
  • struct-layout
  • attribute-deprecated
  • rename-data-symbols
  • x86_64-sha_ni-sha256
  • ecc-params-tweak
  • delete-old-aes
  • cmac-support
  • x86_64-sha_ni-sha1
  • gcm-ctr-opt
  • ctr-opt
  • skein
  • api-opaque-fix
  • curve448
  • nettle_3.4.1_release_20181204
  • nettle_3.4.1rc1
  • nettle_3.4_release_20171119
  • nettle_3.4rc2
  • nettle_3.4rc1
  • nettle_3.3_release_20161001
  • nettle_3.2_release_20160128
  • nettle_3.1.1_release_20150424
  • nettle_3.1_release_20150407
  • nettle_3.1rc3
  • nettle_3.1rc2
  • nettle_3.1rc1
  • nettle_3.0_release_20140607
  • nettle_2.7.1_release_20130528
  • nettle_2.7_release_20130424
  • nettle_2.6_release_20130116
  • nettle_2.5_release_20120707
  • converted-master-branch-to-git
  • nettle_2.4_release_20110903
  • nettle_2.3_release_20110902
40 results

fat-setup.h

Blame
  • Forked from Nettle / nettle
    Source project has a limited visibility.
    • Yuriy M. Kaminskiy's avatar
      67bae1b9
      Add --enable-fat support for arm neon chacha20 · 67bae1b9
      Yuriy M. Kaminskiy authored and Niels Möller's avatar Niels Möller committed
      On BCM2837B0 (Cortex-A53) @1.4GHz (Raspberry Pi 3B+),
      Before:
      `gnutls-cli --benchmark-ciphers`
             CHACHA20-POLY1305 (16384) 51.54 MB/sec
      `gnutls-cli --benchmark-tls-ciphers`:
             ECDHE_RSA_CHACHA20_POLY1305 (payload 1400)  21.31 MB/sec
             ECDHE_RSA_CHACHA20_POLY1305 (payload 15360)  24.60 MB/sec
      `nettle-benchmark`
      		 chacha     encrypt   71.90
      		 chacha     decrypt   71.89
      	chacha_poly1305     encrypt   48.17
      	chacha_poly1305     decrypt   48.17
      	chacha_poly1305      update  146.03
      
      After:
      `gnutls-cli --benchmark-ciphers`
             CHACHA20-POLY1305 (16384) 68.44 MB/sec
      `gnutls-cli --benchmark-tls-ciphers`:
             ECDHE_RSA_CHACHA20_POLY1305 (payload 1400) 27.25 MB/sec
             ECDHE_RSA_CHACHA20_POLY1305 (payload 15360) 32.41 MB/sec
      `nettle-benchmark`
      		 chacha     encrypt  106.00
      		 chacha     decrypt  105.94
      	chacha_poly1305     encrypt   65.94
      	chacha_poly1305     decrypt   65.96
      	chacha_poly1305      update  175.24
      67bae1b9
      History
      Add --enable-fat support for arm neon chacha20
      Yuriy M. Kaminskiy authored and Niels Möller's avatar Niels Möller committed
      On BCM2837B0 (Cortex-A53) @1.4GHz (Raspberry Pi 3B+),
      Before:
      `gnutls-cli --benchmark-ciphers`
             CHACHA20-POLY1305 (16384) 51.54 MB/sec
      `gnutls-cli --benchmark-tls-ciphers`:
             ECDHE_RSA_CHACHA20_POLY1305 (payload 1400)  21.31 MB/sec
             ECDHE_RSA_CHACHA20_POLY1305 (payload 15360)  24.60 MB/sec
      `nettle-benchmark`
      		 chacha     encrypt   71.90
      		 chacha     decrypt   71.89
      	chacha_poly1305     encrypt   48.17
      	chacha_poly1305     decrypt   48.17
      	chacha_poly1305      update  146.03
      
      After:
      `gnutls-cli --benchmark-ciphers`
             CHACHA20-POLY1305 (16384) 68.44 MB/sec
      `gnutls-cli --benchmark-tls-ciphers`:
             ECDHE_RSA_CHACHA20_POLY1305 (payload 1400) 27.25 MB/sec
             ECDHE_RSA_CHACHA20_POLY1305 (payload 15360) 32.41 MB/sec
      `nettle-benchmark`
      		 chacha     encrypt  106.00
      		 chacha     decrypt  105.94
      	chacha_poly1305     encrypt   65.94
      	chacha_poly1305     decrypt   65.96
      	chacha_poly1305      update  175.24
    umac-poly128.c 3.12 KiB
    /* umac-poly128.c
    
       Copyright (C) 2013 Niels Möller
    
       This file is part of GNU Nettle.
    
       GNU Nettle is free software: you can redistribute it and/or
       modify it under the terms of either:
    
         * the GNU Lesser General Public License as published by the Free
           Software Foundation; either version 3 of the License, or (at your
           option) any later version.
    
       or
    
         * the GNU General Public License as published by the Free
           Software Foundation; either version 2 of the License, or (at your
           option) any later version.
    
       or both in parallel, as here.
    
       GNU Nettle is distributed in the hope that it will be useful,
       but WITHOUT ANY WARRANTY; without even the implied warranty of
       MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
       General Public License for more details.
    
       You should have received copies of the GNU General Public License and
       the GNU Lesser General Public License along with this program.  If
       not, see http://www.gnu.org/licenses/.
    */
    
    #if HAVE_CONFIG_H
    # include "config.h"
    #endif
    
    #include <assert.h>
    
    #include "umac.h"
    #include "umac-internal.h"
    
    /* Split a 64-bit value into its upper (HI) and lower (LO) 32-bit halves.
       The argument is parenthesized so the macros also expand correctly when
       given an expression containing low-precedence operators such as | or ^. */
    #define HI(x) ((x) >> 32)
    #define LO(x) ((x) & 0xffffffffUL)
    
    /* Multiply the 128-bit value in y by the 128-bit key k and store the
       result back into y.

       y[0] holds the most significant 64 bits and y[1] the least
       significant; k[0] is the most significant 32-bit key word and k[3] the
       least significant.  Everything at weight 2^128 and above is folded
       back down multiplied by UMAC_P128_OFFSET (the "reduce mod p" step),
       so the result fits in 128 bits. */
    static void
    poly128_mul (const uint32_t *k, uint64_t *y)
    {
      /* 32-bit limbs of y, least significant first. */
      const uint64_t a0 = LO (y[1]);
      const uint64_t a1 = HI (y[1]);
      const uint64_t a2 = LO (y[0]);
      const uint64_t a3 = HI (y[0]);

      /* Key limbs widened to 64 bits, least significant first. */
      const uint64_t b0 = k[3];
      const uint64_t b1 = k[2];
      const uint64_t b2 = k[1];
      const uint64_t b3 = k[0];

      /* Column sums of the schoolbook product.  eN has weight 2^(64 N) and
         oN has weight 2^(64 N + 32):

         +---+---+---+---+
         | e3| e2| e1| e0|
         +-+-+-+-+-+-+-+-+
        +  | o2| o1| o0|
        -+-+-+-+-+-+-+-+-+
      */
      uint64_t e0 = a0 * b0;
      uint64_t o0 = a0 * b1 + a1 * b0;
      uint64_t e1 = a0 * b2 + a1 * b1 + a2 * b0;
      uint64_t o1 = a0 * b3 + a1 * b2 + a2 * b1 + a3 * b0;
      uint64_t e2 = a1 * b3 + a2 * b2 + a3 * b1;
      uint64_t o2 = a2 * b3 + a3 * b2;
      uint64_t e3 = a3 * b3;

      uint64_t add_lo, add_hi;

      /* Fold the upper columns (e3, e2, o2 and the top half of o1) into the
         lower ones.  The order matters: the last line reads o1 after it has
         been updated by the first. */
      o1 += UMAC_P128_OFFSET * HI (e3);
      e1 += UMAC_P128_OFFSET * (LO (e3) + HI (o2));
      o0 += UMAC_P128_OFFSET * (HI (e2) + LO (o2));
      e0 += UMAC_P128_OFFSET * (LO (e2) + HI (o1));

      /* Left to add:

         +---+---+
         | e1| e0|
         +-+-+-+-+
         o1| o0|
         +-+---+

         The top half of o0 lines up with e1; the original author notes
         that this addition cannot carry. */
      e1 += HI (o0);

      /* Align the remaining halves of the odd columns with e0 and e1.  The
         top half of o1 is dropped here; it was already folded into e0. */
      add_lo = o0 << 32;
      add_hi = o1 << 32;

      /* Remaining 128-bit addition:

         +---+---+
         | e1| e0|
         +-+-+---+
        +| hi| lo|
        -+---+---+
      */
      e0 += add_lo;
      e1 += (e0 < add_lo);
      e1 += add_hi;
      if (e1 < add_hi)
        {
          /* Carry out of bit 128: fold it back in as UMAC_P128_OFFSET. */
          e0 += UMAC_P128_OFFSET;
          e1 += (e0 < UMAC_P128_OFFSET);
        }

      y[0] = e1;
      y[1] = e0;
    }
    
    /* One step of the 128-bit polynomial evaluation: update the accumulator
       y (y[0] = high 64 bits, y[1] = low 64 bits) with the 128-bit message
       block (mh, ml) under key k, i.e. y <- y * k + m with carries folded
       back in via UMAC_P128_OFFSET.

       When the top 32 bits of mh are all ones, an extra step runs first:
       y is multiplied by k and decremented by one (wrapping around to
       (UMAC_P128_HI, UMAC_P128_LO - 1) when y is zero), and
       UMAC_P128_OFFSET is subtracted from the message block.
       NOTE(review): this looks like the "marker" handling of the UMAC POLY
       algorithm -- confirm against the specification. */
    void
    _umac_poly128 (const uint32_t *k, uint64_t *y, uint64_t mh, uint64_t ml)
    {
      uint64_t sum_hi, sum_lo, cy;

      if ((mh >> 32) == 0xffffffff)
        {
          poly128_mul (k, y);

          /* Subtract one from the 128-bit value (y[0], y[1]). */
          if (y[1] == 0 && y[0] == 0)
            {
              /* Zero wraps around to the top of the range. */
              y[0] = UMAC_P128_HI;
              y[1] = UMAC_P128_LO-1;
            }
          else if (y[1] == 0)
            {
              /* Borrow from the high word. */
              y[0]--;
              y[1] = UMAC_P128_HI;
            }
          else
            {
              y[1]--;
            }

          /* 128-bit subtraction of the offset from the message block; the
             borrow must be computed before ml is modified. */
          mh -= (ml < UMAC_P128_OFFSET);
          ml -= UMAC_P128_OFFSET;
        }
      assert (mh < UMAC_P128_HI || ml < UMAC_P128_LO);

      poly128_mul (k, y);

      /* 128-bit addition y + m, tracking the carry out of the top word. */
      sum_lo = y[1] + ml;
      cy = (sum_lo < ml);
      sum_hi = y[0] + cy;
      cy = (sum_hi < cy);
      sum_hi += mh;
      cy += (sum_hi < mh);
      assert (cy <= 1);
      if (cy)
        {
          /* Carry out of bit 128: fold it back in as UMAC_P128_OFFSET. */
          sum_lo += UMAC_P128_OFFSET;
          sum_hi += sum_lo < UMAC_P128_OFFSET;
        }

      y[0] = sum_hi;
      y[1] = sum_lo;
    }