265 lines
9.4 KiB
Go
265 lines
9.4 KiB
Go
package mishmash
|
|
|
|
import (
|
|
"fmt"
|
|
"hash"
|
|
"os"
|
|
"strconv"
|
|
"strings"
|
|
)
|
|
|
|
// Constants shared by the Mishmash hash implementations.
const (
	// UINT32_RESULTS_MASK keeps the low 32 bits of the uint64 accumulator used
	// by Mishmash.
	UINT32_RESULTS_MASK uint64 = 0xFFFFFFFF

	// NUM_PRIMES is the number of entries in a PrimesSet.
	NUM_PRIMES = 256

	// MISHMASH128_DEFAULT_LEFT and MISHMASH128_DEFAULT_RIGHT are the default
	// accumulator values used by the 128-bit Mishmash.
	MISHMASH128_DEFAULT_LEFT  uint64 = 0
	MISHMASH128_DEFAULT_RIGHT uint64 = 0x8888888888888888
)
|
|
|
|
// PrimesSet is a fixed-size array of NUM_PRIMES uint32 values intended to
// hold prime numbers.
type PrimesSet [NUM_PRIMES]uint32
|
|
|
|
func (p *PrimesSet) Select(n uint64) uint32 {
|
|
return (*p)[n&(NUM_PRIMES-1)]
|
|
}
|
|
|
|
// allows loading a primeset from a file - useful for experimenting with new primes
|
|
func LoadPrimesSet(filename string) (PrimesSet, error) {
|
|
f, err := os.ReadFile(filename)
|
|
if err != nil {
|
|
return PrimesSet{}, fmt.Errorf("error reading %s: %w", filename, err)
|
|
}
|
|
fields := strings.Fields(string(f))
|
|
if want, got := NUM_PRIMES, len(fields); want != got {
|
|
return PrimesSet{}, fmt.Errorf("error: requires %d primes (got %d)", want, got)
|
|
}
|
|
results := PrimesSet{}
|
|
for i, s := range fields {
|
|
if n, err := strconv.ParseUint(s, 10, 32); err != nil {
|
|
return PrimesSet{}, fmt.Errorf("error parsing %s: %w", s, err)
|
|
} else {
|
|
results[i] = uint32(n)
|
|
}
|
|
}
|
|
return results, nil
|
|
}
|
|
|
|
// ThePrimes is the default PrimesSet. It is the set passed to Engine by
// Mishmash, Mishmash32.Write and Mishmash64.Write.
// The table below holds NUM_PRIMES (256) entries, listed eight per row.
|
|
var ThePrimes = PrimesSet{
|
|
3825240899, 3652005211, 2966014067, 3432177659, 3109134187, 3139884271, 3108258589, 2277840529,
|
|
3748140223, 4206444373, 2684505017, 3883989821, 4076539213, 3880335997, 2603229667, 2358458953,
|
|
4061135443, 3826856503, 2671898833, 3266747401, 3403611587, 2483486933, 3889003891, 2820911959,
|
|
2318077829, 3470930861, 3231587809, 3225029887, 4123396483, 3422817119, 3612514831, 2170177423,
|
|
3058754837, 3000926393, 2825656217, 3387930461, 3532314017, 3245479361, 3466327211, 4080294503,
|
|
4252034179, 2302986211, 3394476707, 3697851029, 3957195257, 2862308587, 4285266071, 3681357247,
|
|
3157577413, 3839398561, 3097979117, 3590787463, 3354450497, 3110291879, 3938796493, 3196834463,
|
|
2374254481, 2702597567, 3046228397, 3461690719, 2641445467, 2401060583, 2483505539, 2775297373,
|
|
2262447391, 3118976533, 3014355683, 3355176449, 4055753381, 2277045713, 3098402119, 3894957487,
|
|
2770620887, 4125228329, 2575044467, 4162428989, 3294651817, 2308925797, 3698223103, 2150023273,
|
|
3075614681, 2410764047, 3624889381, 3264455489, 3241969651, 3001767217, 3407799859, 2998917373,
|
|
2629826653, 2714272271, 3987786247, 2880807353, 3608804803, 2231694917, 3790372403, 4156893413,
|
|
2563320007, 2423350621, 2735169119, 4021079791, 4150641413, 2907916357, 3772971647, 2481168307,
|
|
2842943119, 2234753693, 3966637117, 2732029457, 3207475039, 3533605151, 2349367747, 3336108011,
|
|
2431060103, 2263416899, 2350941683, 3869512277, 3880987697, 3062735029, 2512894603, 3669845519,
|
|
2235487739, 3201016501, 2438124943, 4170458909, 2938134889, 4231610087, 3187120061, 2378420137,
|
|
3365835877, 3078766697, 3704906059, 3541986781, 3969072823, 3510542281, 2306290751, 3898737419,
|
|
2898069347, 4092904481, 2484285403, 2721169823, 4293617527, 2928584759, 2213966141, 2335957513,
|
|
3367371923, 2965261109, 4175805451, 3541995157, 2964065479, 3997902791, 3053542259, 2168926237,
|
|
3253268639, 2620083509, 3314283407, 3873087809, 2636771209, 2737638653, 3209154931, 3414204793,
|
|
3451689091, 2638985941, 2899591693, 2654878441, 2748067627, 3395485733, 2679070523, 3100687721,
|
|
2520033701, 2980087373, 2873947007, 2565436501, 2400053783, 4163039563, 3517993571, 4263192407,
|
|
3385597069, 2768101117, 3502890653, 3092130347, 3748553827, 4109944849, 2418961109, 3398621741,
|
|
3073383031, 2167592489, 2950739053, 3529429811, 3167420899, 4254703357, 3344014309, 3725480141,
|
|
3745944539, 3456003191, 2832137237, 4202217191, 3730577581, 2837794231, 2155546451, 2539211039,
|
|
2256984649, 2458975411, 2986340839, 3412432363, 3596817463, 2973444983, 2409734297, 3273292601,
|
|
3302556869, 3630727567, 3670056499, 3300959521, 3949319809, 3047032057, 3412226563, 2147483647,
|
|
2914045411, 2882644273, 4065606553, 2735903059, 3195020617, 3887229457, 3232900987, 3409357867,
|
|
3037985513, 3162012463, 3340137193, 2186608547, 4018093523, 4153387103, 2566863161, 3087918809,
|
|
3332247019, 3579407009, 3082973791, 4178339461, 3269728331, 2270495261, 2400046513, 2641204147,
|
|
2593078337, 2398468271, 3861488311, 3766456459, 2970457213, 3491800771, 3797865553, 2756555203,
|
|
3154883449, 3782386073, 3324965471, 4088422453, 3784508591, 3903657481, 3010059277, 2936392909,
|
|
|
|
}
|
|
|
|
// the mishmash engine - allows use of any prime set to allow experimentation
|
|
func Engine(buffer []byte, length int, accumulator uint64, primes *PrimesSet) uint64 {
|
|
for _, b := range buffer[:length] {
|
|
accumulator1 := uint64(primes.Select(accumulator) + uint32(b))
|
|
accumulator2 := ^accumulator * uint64(primes.Select(uint64(b)))
|
|
accumulator3 := accumulator >> (32 + ((b & 0x1F) ^ (b >> 5)))
|
|
accumulator = accumulator1 + accumulator2 + accumulator3
|
|
}
|
|
return accumulator
|
|
}
|
|
|
|
// general mishmash function - carried over from C++ for feature parity
|
|
func Mishmash(buffer []byte, length int) uint32 {
|
|
accumulator := Engine(buffer, length, 0, &ThePrimes)
|
|
return uint32(accumulator & UINT32_RESULTS_MASK)
|
|
}
|
|
|
|
// general mishmash function - carried over from C++ for feature parity
|
|
func MishmashString(buffer string) uint32 {
|
|
return Mishmash([]byte(buffer), len(buffer))
|
|
}
|
|
|
|
// Mishmash32 is the 32-bit Mishmash hash state.
// *Mishmash32 implements the hash.Hash and hash.Hash32 interfaces.
type Mishmash32 struct {
	// accumulator is the running 64-bit hash state.
	accumulator uint64
}
|
|
|
|
// returns the uint32 hash as a byte slice
|
|
func (m *Mishmash32) Bytes() []byte {
|
|
hash := m.Sum32()
|
|
return []byte{
|
|
byte((hash & 0xFF000000) >> 24),
|
|
byte((hash & 0x00FF0000) >> 16),
|
|
byte((hash & 0x0000FF00) >> 8),
|
|
byte((hash & 0x000000FF)),
|
|
}
|
|
}
|
|
|
|
func New32() hash.Hash32 {
|
|
return &Mishmash32{}
|
|
}
|
|
|
|
// Sum appends the current hash to b and returns the resulting slice.
|
|
// It does not change the underlying hash state.
|
|
func (m *Mishmash32) Sum(p []byte) []byte {
|
|
return append(p, m.Bytes()...)
|
|
}
|
|
|
|
// returns the current uint32 hash
|
|
func (m *Mishmash32) Sum32() uint32 {
|
|
return uint32(m.accumulator & UINT32_RESULTS_MASK)
|
|
}
|
|
|
|
// reset accumulator
|
|
func (m *Mishmash32) Reset() {
|
|
m.accumulator = 0
|
|
}
|
|
|
|
// returns the number of bytes Sum() will return
|
|
func (m *Mishmash32) Size() int {
|
|
return 4
|
|
}
|
|
|
|
// BlockSize returns the hash's underlying block size.
|
|
// The Write method must be able to accept any amount
|
|
// of data, but it may operate more efficiently if all writes
|
|
// are a multiple of the block size.
|
|
func (m *Mishmash32) BlockSize() int {
|
|
return 1
|
|
}
|
|
|
|
// Write (via the embedded io.Writer interface) adds more data to the running hash.
|
|
// It never returns an error.
|
|
func (m *Mishmash32) Write(p []byte) (int, error) {
|
|
m.accumulator = Engine(p, len(p), m.accumulator, &ThePrimes)
|
|
return len(p), nil
|
|
}
|
|
|
|
// Mishmash64 is the 64-bit Mishmash hash state.
// *Mishmash64 implements the hash.Hash and hash.Hash64 interfaces.
type Mishmash64 struct {
	// accumulator is the running 64-bit hash state.
	accumulator uint64
}
|
|
|
|
// returns the uint64 hash as a byte slice
|
|
func (m *Mishmash64) Bytes() []byte {
|
|
hash := m.accumulator
|
|
return []byte{
|
|
byte((hash & 0xFF00000000000000) >> 56),
|
|
byte((hash & 0x00FF000000000000) >> 48),
|
|
byte((hash & 0x0000FF0000000000) >> 40),
|
|
byte((hash & 0x000000FF00000000) >> 32),
|
|
byte((hash & 0x00000000FF000000) >> 24),
|
|
byte((hash & 0x0000000000FF0000) >> 16),
|
|
byte((hash & 0x000000000000FF00) >> 8),
|
|
byte((hash & 0x00000000000000FF)),
|
|
}
|
|
}
|
|
|
|
func New64() hash.Hash64 {
|
|
return &Mishmash64{}
|
|
}
|
|
|
|
// Sum appends the current hash to b and returns the resulting slice.
|
|
// It does not change the underlying hash state.
|
|
func (m *Mishmash64) Sum(p []byte) []byte {
|
|
return append(p, m.Bytes()...)
|
|
}
|
|
|
|
// returns the current uint64 hash
|
|
func (m *Mishmash64) Sum64() uint64 {
|
|
return m.accumulator
|
|
}
|
|
|
|
// resets the accumulator to 0
|
|
func (m *Mishmash64) Reset() {
|
|
m.accumulator = 0
|
|
}
|
|
|
|
// returns the number of bytes Sum() will return
|
|
func (m *Mishmash64) Size() int {
|
|
return 8
|
|
}
|
|
|
|
// BlockSize returns the hash's underlying block size.
|
|
// The Write method must be able to accept any amount
|
|
// of data, but it may operate more efficiently if all writes
|
|
// are a multiple of the block size.
|
|
func (m *Mishmash64) BlockSize() int {
|
|
return 1
|
|
}
|
|
|
|
// Write (via the embedded io.Writer interface) adds more data to the running hash.
|
|
// It never returns an error.
|
|
func (m *Mishmash64) Write(p []byte) (int, error) {
|
|
m.accumulator = Engine(p, len(p), m.accumulator, &ThePrimes)
|
|
return len(p), nil
|
|
}
|
|
|
|
// experimental and subject to change
|
|
// *Mishmash128 implements the hash.Hash interface
|
|
type Mishmash128 struct {
|
|
hash1, hash2 Mishmash64
|
|
}
|
|
|
|
func (m *Mishmash128) Bytes() []byte {
|
|
return append(m.hash1.Bytes(), m.hash2.Bytes()...)
|
|
}
|
|
|
|
func New128() hash.Hash {
|
|
hash := &Mishmash128{}
|
|
hash.Reset()
|
|
return hash
|
|
}
|
|
|
|
// Sum appends the current hash to b and returns the resulting slice.
|
|
// It does not change the underlying hash state.
|
|
func (m *Mishmash128) Sum(b []byte) []byte {
|
|
return append(b, m.Bytes()...)
|
|
}
|
|
|
|
func (m *Mishmash128) Reset() {
|
|
m.hash1.accumulator, m.hash2.accumulator = MISHMASH128_DEFAULT_LEFT, MISHMASH128_DEFAULT_RIGHT
|
|
}
|
|
|
|
// returns the number of bytes Sum() will return
|
|
func (m *Mishmash128) Size() int {
|
|
return 16
|
|
}
|
|
|
|
// BlockSize returns the hash's underlying block size.
|
|
// The Write method must be able to accept any amount
|
|
// of data, but it may operate more efficiently if all writes
|
|
// are a multiple of the block size.
|
|
func (m *Mishmash128) BlockSize() int {
|
|
return 1
|
|
}
|
|
|
|
// Write (via the embedded io.Writer interface) adds more data to the running hash.
|
|
// It never returns an error.
|
|
func (m *Mishmash128) Write(p []byte) (int, error) {
|
|
m.hash1.Write(p)
|
|
m.hash2.Write(p)
|
|
return len(p), nil
|
|
}
|