From d27373b5f0bd958862144495bdc5ef452c432fef Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Niels=20M=C3=B6ller?= <nisse@lysator.liu.se>
Date: Thu, 5 Feb 2004 17:01:47 +0100
Subject: [PATCH] New file. About three times faster than the optimized C code.

Rev: src/nettle/x86/arcfour-crypt.asm:1.1
---
 x86/arcfour-crypt.asm | 75 +++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 75 insertions(+)
 create mode 100644 x86/arcfour-crypt.asm

diff --git a/x86/arcfour-crypt.asm b/x86/arcfour-crypt.asm
new file mode 100644
index 00000000..9f2f8eb4
--- /dev/null
+++ b/x86/arcfour-crypt.asm
@@ -0,0 +1,75 @@
+C nettle, low-level cryptographics library
+C 
+C Copyright (C) 2004, Niels Möller
+C  
+C The nettle library is free software; you can redistribute it and/or modify
+C it under the terms of the GNU Lesser General Public License as published by
+C the Free Software Foundation; either version 2.1 of the License, or (at your
+C option) any later version.
+C 
+C The nettle library is distributed in the hope that it will be useful, but
+C WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+C or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
+C License for more details.
+C 
+C You should have received a copy of the GNU Lesser General Public License
+C along with the nettle library; see the file COPYING.LIB.  If not, write to
+C the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
+C MA 02111-1307, USA.
+
+	.file "arcfour.asm"
+
+	C arcfour_crypt(struct arcfour_ctx *ctx,
+	C               unsigned length, uint8_t *dst,
+	C               const uint8_t *src)
+	.text
+	.align 16
+	.globl nettle_arcfour_crypt
+	.type  nettle_arcfour_crypt,@function
+nettle_arcfour_crypt:
+	C save all registers that need to be saved
+	pushl	%ebx		C  16(%esp)
+	pushl	%ebp		C  12(%esp)
+	pushl	%esi		C  8(%esp)
+	pushl	%edi		C  4(%esp)
+
+	C ctx = 20(%esp)
+	C length = 24(%esp)
+	C dst = 28(%esp)
+	C src = 32(%esp)
+
+	movl	24(%esp), %edx		C  length
+	testl	%edx,%edx
+	jz	.Lend
+
+	movl	20(%esp), %ebp		C  ctx
+	movl	28(%esp), %edi
+	movl	32(%esp), %esi
+	addl	%esi, %edx		C  Keep src + length
+	
+	movzbl  256(%ebp), %eax		C  i
+	movzbl  257(%ebp), %ebx		C  j
+.Lloop:
+	incb	%al
+	movzbl  (%ebp, %eax), %ecx	C  si. Clears high bytes
+	addb    %cl, %bl
+	movb    (%ebp, %ebx), %ch	C  sj
+	movb    %ch, (%ebp, %eax)
+	addb    %ch, %cl
+	xorb    %ch, %ch		C  Clear, so it can be used
+					C  for indexing.
+	movb    (%ebp, %ecx), %cl
+	xorb    (%esi), %cl
+	incl    %esi
+	movb    %cl, (%edi)
+	incl    %edi
+	cmpl	%esi, %edx
+	jne	.Lloop
+.Lend:
+	popl	%edi
+	popl	%esi
+	popl	%ebp
+	popl	%ebx
+	ret
+.Leord:
+	.size	nettle_arcfour_crypt,.Leord-aes_decrypt
-- 
GitLab