From 17748f18b9f46a39c1cc38cfc9e6b4bf93da1a22 Mon Sep 17 00:00:00 2001
From: Jeroen van Rijn
Date: Thu, 24 Jun 2021 19:06:39 +0200
Subject: [PATCH] Adler32 speedup.

---
 core/hash/hash.odin | 64 ++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 58 insertions(+), 6 deletions(-)

diff --git a/core/hash/hash.odin b/core/hash/hash.odin
index 6740629be..36dda9333 100644
--- a/core/hash/hash.odin
+++ b/core/hash/hash.odin
@@ -1,16 +1,68 @@
 package hash
 
 import "core:mem"
+import "intrinsics"
 
+// adler32 computes the Adler-32 checksum of `data`.
+//
+// The low 16 bits of `seed` initialise the running byte sum `a` and the high
+// 16 bits initialise the running sum of sums `b`; the result is packed the
+// same way, as `(b << 16) | a`, with both sums reduced modulo 65521.
+// Because the seed and result share a layout, a returned checksum can be
+// passed back as `seed` to continue over further data.
 @(optimization_mode="speed")
-adler32 :: proc(data: []byte, seed := u32(1)) -> u32 {
+adler32 :: proc(data: []byte, seed := u32(1)) -> u32 #no_bounds_check {
+
 	ADLER_CONST :: 65521;
-	a, b: u32 = seed & 0xFFFF, seed >> 16;
-	#no_bounds_check for x in data {
-		a = (a + u32(x)) % ADLER_CONST;
-		b = (b + a) % ADLER_CONST;
+
+	buffer := raw_data(data);
+	a, b: u64 = u64(seed) & 0xFFFF, u64(seed) >> 16;
+	buf := data[:];
+
+	// Step byte-by-byte until `buffer` sits on an 8-byte boundary.
+	// NOTE(review): the unrolled loop below still reads single bytes through
+	// `buf`, so this alignment step looks optional - confirm before removing.
+	for len(buf) != 0 && uintptr(buffer) & 7 != 0 {
+		a = (a + u64(buf[0]));
+		b = (b + a);
+		buffer = intrinsics.ptr_offset(buffer, 1);
+		buf = buf[1:];
 	}
-	return (b << 16) | a;
+
+	// The alignment loop accumulates without reducing. Reduce here so the
+	// result stays correct (and independent of the data's address) when that
+	// loop consumes the whole input and neither loop below gets to run.
+	a %= ADLER_CONST;
+	b %= ADLER_CONST;
+
+	// Process 8 bytes per iteration, deferring the modulo to once per chunk
+	// of at most 5552 bytes.
+	for len(buf) > 7 {
+		count := min(len(buf), 5552);
+		for count > 7 {
+			a += u64(buf[0]); b += a;
+			a += u64(buf[1]); b += a;
+			a += u64(buf[2]); b += a;
+			a += u64(buf[3]); b += a;
+			a += u64(buf[4]); b += a;
+			a += u64(buf[5]); b += a;
+			a += u64(buf[6]); b += a;
+			a += u64(buf[7]); b += a;
+
+			buf = buf[8:];
+			count -= 8;
+		}
+		a %= ADLER_CONST;
+		b %= ADLER_CONST;
+	}
+
+	// Fewer than 8 bytes remain; reduce after every byte.
+	for len(buf) != 0 {
+		a = (a + u64(buf[0])) % ADLER_CONST;
+		b = (b + a) % ADLER_CONST;
+		buf = buf[1:];
+	}
+	return (u32(b) << 16) | u32(a);
 }
 
 @(optimization_mode="speed")