You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
71 lines
3.0 KiB
71 lines
3.0 KiB
/*-*- mode:unix-assembly; indent-tabs-mode:t; tab-width:8; coding:utf-8 -*-│ |
|
│vi: set et ft=asm ts=8 tw=8 fenc=utf-8 :vi│ |
|
╞══════════════════════════════════════════════════════════════════════════════╡ |
|
│ Copyright 2020 Justine Alexandra Roberts Tunney │ |
|
│ │ |
|
│ This program is free software; you can redistribute it and/or modify │ |
|
│ it under the terms of the GNU General Public License as published by │ |
|
│ the Free Software Foundation; version 2 of the License. │ |
|
│ │ |
|
│ This program is distributed in the hope that it will be useful, but │ |
|
│ WITHOUT ANY WARRANTY; without even the implied warranty of │ |
|
│ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU │ |
|
│ General Public License for more details. │ |
|
│ │ |
|
│ You should have received a copy of the GNU General Public License │ |
|
│ along with this program; if not, write to the Free Software │ |
|
│ Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA │ |
|
│ 02110-1301 USA │ |
|
╚─────────────────────────────────────────────────────────────────────────────*/ |
|
#include "libc/macros.h" |
|
|
|
/ Generates lookup table for computing CRC-32 byte-by-byte. |
|
/ |
|
/ void crc32init(uint32_t table[256], uint32_t polynomial) { |
|
/ uint32_t d, i, r; |
|
/ for (d = 0; d < 256; ++d) { |
|
/ r = d; |
|
/ for (i = 0; i < 8; ++i) { |
|
/ r = r >> 1 ^ (r & 1 ? polynomial : 0); |
|
/ } |
|
/ table[d] = r; |
|
/ } |
|
/ } |
|
/ |
|
/ @param rdi is pointer to uint32_t[256] array |
|
/ @param esi 32-bit binary polynomial config |
|
/ @note imposes ~300ns one-time cost |
|
crc32init: |
|
push %rbp |
|
mov %rsp,%rbp |
|
.profilable |
|
lea 256*4(%rdi),%rdx |
|
movd %esi,%xmm0 |
|
pshufd $0,%xmm0,%xmm0 # (uint32_t[]){esi,esi,esi,esi} → %xmm0 |
|
pushpop 4,%rax |
|
movd %eax,%xmm2 # (int[]){4,4,4,4} → %xmm2 |
|
pshufd $0,%xmm2,%xmm2 |
|
0: sub $4,%rsp # (int[]){0,1,2,3} → %xmm1 |
|
dec %eax |
|
mov %eax,(%rsp) |
|
jnz 0b |
|
movdqu (%rsp),%xmm1 |
|
1: mov $8,%ecx |
|
movdqa %xmm1,%xmm3 |
|
2: movdqa %xmm3,%xmm4 |
|
psrld $1,%xmm4 |
|
pslld $31,%xmm3 |
|
psrad $31,%xmm3 |
|
pand %xmm0,%xmm3 |
|
pxor %xmm4,%xmm3 |
|
movdqa %xmm3,%xmm4 |
|
.loop 2b |
|
movdqu %xmm3,(%rdi) |
|
add $16,%rdi |
|
paddd %xmm2,%xmm1 |
|
cmp %rdx,%rdi |
|
jb 1b |
|
leave |
|
ret |
|
.endfn crc32init,globl |
|
.source __FILE__
|
|
|