From 2d9a6642a92bc783a85d645562621357a902fab7 Mon Sep 17 00:00:00 2001 From: sigsegv7 Date: Mon, 18 Sep 2023 00:54:22 -0400 Subject: Optimize with SSE2/SSE3 and 128 bit inversions Signed-off-by: sigsegv7 --- src/sse_accel.S | 45 +++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 45 insertions(+) create mode 100644 src/sse_accel.S (limited to 'src/sse_accel.S') diff --git a/src/sse_accel.S b/src/sse_accel.S new file mode 100644 index 0000000..928caaf --- /dev/null +++ b/src/sse_accel.S @@ -0,0 +1,45 @@ +/* + * Copyright (c) 2023 Ian Marco Moffett and the VegaOS team. + * All rights reserved. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions are met: + * + * 1. Redistributions of source code must retain the above copyright notice, + * this list of conditions and the following disclaimer. + * 2. Redistributions in binary form must reproduce the above copyright + * notice, this list of conditions and the following disclaimer in the + * documentation and/or other materials provided with the distribution. + * 3. Neither the name of VegaOS nor the names of its + * contributors may be used to endorse or promote products derived from + * this software without specific prior written permission. + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" + * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE + * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE + * ARE DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

    .section .text
    .globl accel_invert128

/*
 * accel_invert128(uint64_t addr)
 *
 * Bitwise-inverts the 128 bits (16 bytes) stored at `addr`, in place.
 *
 * In:    %rdi = addr. The memory is accessed with movdqu, so 16-byte
 *        alignment is not required.
 * Out:   The 16 bytes at addr hold the complement of their previous
 *        contents. %rax is left equal to addr.
 *        NOTE(review): whether callers treat %rax as a return value is
 *        not visible here - confirm against the C prototype.
 * Clobb: %rax, %xmm0, %xmm1
 */
accel_invert128:
    movq    %rdi, %rax
    movdqu  (%rax), %xmm0           /* xmm0 = *addr */

    /* Comparing a register with itself sets every byte to 0xFF */
    pcmpeqb %xmm1, %xmm1            /* xmm1 = all 1s */

    /*
     * AT&T operand order is src, dst. The destination must be %xmm0,
     * the register stored below; XORing into %xmm1 instead would leave
     * %xmm0 (and therefore the memory) unchanged.
     */
    pxor    %xmm1, %xmm0            /* xmm0 = ~xmm0 */

    movdqu  %xmm0, (%rax)           /* *addr = ~(*addr) */
    retq

/* -- cgit v1.2.3 */