提交 81ee80ab 编写于 作者: A Andy Polyakov

+45% RC4 performance boost on Intel EM64T core. An unrolled loop providing
a further +35% will follow...

Submitted by: Zou Nanhai
上级 7d727231
......@@ -181,7 +181,7 @@ $code.=<<___;
.align 16
.LRC4_CHAR:
-inc $XX#b
+add \$1,$XX#b
movzb `&PTR("BYTE:[$dat+$XX]")`,$TX#d
add $TX#b,$YY#b
movzb `&PTR("BYTE:[$dat+$YY]")`,$TY#d
......@@ -191,9 +191,9 @@ $code.=<<___;
movzb `&PTR("BYTE:[$dat+$TY]")`,$TY#d
xorb `&PTR("BYTE:[$inp]")`,$TY#b
movb $TY#b,`&PTR("BYTE:[$out]")`
-inc $inp
-inc $out
-dec $len
+lea 1($inp),$inp
+lea 1($out),$out
+sub \$1,$len
jnz .LRC4_CHAR
jmp .Lexit
___
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册