Commentary update motivating code update in 0.9.7.

author Andy Polyakov <appro@openssl.org>

Wed, 4 May 2005 14:51:38 +0000 (14:51 +0000)

committer Andy Polyakov <appro@openssl.org>

Wed, 4 May 2005 14:51:38 +0000 (14:51 +0000)
author Andy Polyakov <appro@openssl.org>
Wed, 4 May 2005 14:51:38 +0000 (14:51 +0000)
committer Andy Polyakov <appro@openssl.org>
Wed, 4 May 2005 14:51:38 +0000 (14:51 +0000)
diff --git a/crypto/rc4/asm/rc4-x86_64.pl b/crypto/rc4/asm/rc4-x86_64.pl

index f96df377b5c791565a26181214abb8f8110d9bd8..4b990cba077e21ac5233724af0e1f1d9d1045dcf 100755 (executable)
--- a/crypto/rc4/asm/rc4-x86_64.pl
+++ b/crypto/rc4/asm/rc4-x86_64.pl
@@ -45,9 +45,9 @@
  # achieves respectful 432MBps on 2.8GHz processor now. For reference.
  # If executed on Xeon, current RC4_CHAR code-path is 2.7x faster than
  # RC4_INT code-path. While if executed on Opteron, it's only 25%
-# slower slower than the RC4_INT one [meaning that if detecting CPU
-# is not desired, then RC4_CHAR code-path should be preferred, as it
-# provides better *all-round* performance].
+# slower than the RC4_INT one [meaning that if CPU µ-arch detection
+# is not implemented, then this final RC4_CHAR code-path should be
+# preferred, as it provides better *all-round* performance].
  
  $output=shift;
  open STDOUT,"| $^X ../perlasm/x86_64-xlate.pl $output";
@@ -184,7 +184,7 @@ $code.=<<___;
         add     $TX[0]#b,$YY#b
         lea     1($XX[0]),$XX[1]
         movzb   ($dat,$YY),$TY#d
-       movzb   $XX[1]#b,$XX[1]
+       movzb   $XX[1]#b,$XX[1]#d
         movzb   ($dat,$XX[1]),$TX[1]#d
         movb    $TX[0]#b,($dat,$YY)
         cmp     $XX[1],$YY
author	Andy Polyakov <appro@openssl.org>
	Wed, 4 May 2005 14:51:38 +0000 (14:51 +0000)
committer	Andy Polyakov <appro@openssl.org>
	Wed, 4 May 2005 14:51:38 +0000 (14:51 +0000)