| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111 |
- // Package rollinghash/adler32 implements a rolling version of hash/adler32
- package adler32
- import (
- "hash"
- vanilla "hash/adler32"
- "github.com/chmduquesne/rollinghash"
- )
- const (
- Mod = 65521
- Size = 4
- )
- type digest struct {
- a, b uint32
- // window is treated like a circular buffer, where the oldest element
- // is indicated by d.oldest
- window []byte
- oldest int
- n uint32
- vanilla hash.Hash32
- }
- // Reset resets the Hash to its initial state.
- func (d *digest) Reset() {
- d.window = d.window[:0] // Reset the size but don't reallocate
- d.a = 1
- d.b = 0
- d.oldest = 0
- }
- // New returns a new rollinghash.Hash32 computing the rolling Adler-32
- // checksum. The window is copied from the last Write(). This window is
- // only used to determine which is the oldest element (leaving the
- // window). The calls to Roll() do not recompute the whole checksum.
- func New() rollinghash.Hash32 {
- return &digest{
- a: 1,
- b: 0,
- window: make([]byte, 0),
- oldest: 0,
- vanilla: vanilla.New(),
- }
- }
- // Size returns the number of bytes Sum will return.
- func (d *digest) Size() int { return Size }
- // BlockSize returns the hash's underlying block size.
- // The Write method must be able to accept any amount
- // of data, but it may operate more efficiently if all
- // writes are a multiple of the block size.
- func (d *digest) BlockSize() int { return 1 }
- // Write (via the embedded io.Writer interface) adds more data to the
- // running hash. It never returns an error.
- func (d *digest) Write(p []byte) (int, error) {
- // Copy the window, avoiding allocations where possible
- if len(d.window) != len(p) {
- if cap(d.window) >= len(p) {
- d.window = d.window[:len(p)]
- } else {
- d.window = make([]byte, len(p))
- }
- }
- copy(d.window, p)
- // Piggy-back on the core implementation
- d.vanilla.Reset()
- d.vanilla.Write(p)
- s := d.vanilla.Sum32()
- d.a, d.b = s&0xffff, s>>16
- d.n = uint32(len(p)) % Mod
- return len(d.window), nil
- }
- func (d *digest) Sum32() uint32 {
- return d.b<<16 | d.a
- }
- func (d *digest) Sum(b []byte) []byte {
- v := d.Sum32()
- return append(b, byte(v>>24), byte(v>>16), byte(v>>8), byte(v))
- }
- // Roll updates the checksum of the window from the leaving byte and the
- // entering byte. See
- // http://stackoverflow.com/questions/40985080/why-does-my-rolling-adler32-checksum-not-work-in-go-modulo-arithmetic
- func (d *digest) Roll(b byte) {
- if len(d.window) == 0 {
- d.window = make([]byte, 1)
- d.window[0] = b
- }
- // extract the entering/leaving bytes and update the circular buffer.
- enter := uint32(b)
- leave := uint32(d.window[d.oldest])
- d.window[d.oldest] = b
- d.oldest += 1
- if d.oldest >= len(d.window) {
- d.oldest = 0
- }
- // compute
- d.a = (d.a + Mod + enter - leave) % Mod
- d.b = (d.b + (d.n*leave/Mod+1)*Mod + d.a - (d.n * leave) - 1) % Mod
- }
|