123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444 |
- /**
- xxHash64 implementation in pure Javascript
- Copyright (C) 2016, Pierre Curto
- MIT license
- */
- var UINT64 = require('cuint').UINT64
- /*
- * Constants
- */
- var PRIME64_1 = UINT64( '11400714785074694791' )
- var PRIME64_2 = UINT64( '14029467366897019727' )
- var PRIME64_3 = UINT64( '1609587929392839161' )
- var PRIME64_4 = UINT64( '9650029242287828579' )
- var PRIME64_5 = UINT64( '2870177450012600261' )
- /**
- * Convert string to proper UTF-8 array
- * @param str Input string
- * @returns {Uint8Array} UTF8 array is returned as uint8 array
- */
- function toUTF8Array (str) {
- var utf8 = []
- for (var i=0, n=str.length; i < n; i++) {
- var charcode = str.charCodeAt(i)
- if (charcode < 0x80) utf8.push(charcode)
- else if (charcode < 0x800) {
- utf8.push(0xc0 | (charcode >> 6),
- 0x80 | (charcode & 0x3f))
- }
- else if (charcode < 0xd800 || charcode >= 0xe000) {
- utf8.push(0xe0 | (charcode >> 12),
- 0x80 | ((charcode>>6) & 0x3f),
- 0x80 | (charcode & 0x3f))
- }
- // surrogate pair
- else {
- i++;
- // UTF-16 encodes 0x10000-0x10FFFF by
- // subtracting 0x10000 and splitting the
- // 20 bits of 0x0-0xFFFFF into two halves
- charcode = 0x10000 + (((charcode & 0x3ff)<<10)
- | (str.charCodeAt(i) & 0x3ff))
- utf8.push(0xf0 | (charcode >>18),
- 0x80 | ((charcode>>12) & 0x3f),
- 0x80 | ((charcode>>6) & 0x3f),
- 0x80 | (charcode & 0x3f))
- }
- }
- return new Uint8Array(utf8)
- }
- /**
- * XXH64 object used as a constructor or a function
- * @constructor
- * or
- * @param {Object|String} input data
- * @param {Number|UINT64} seed
- * @return ThisExpression
- * or
- * @return {UINT64} xxHash
- */
- function XXH64 () {
- if (arguments.length == 2)
- return new XXH64( arguments[1] ).update( arguments[0] ).digest()
- if (!(this instanceof XXH64))
- return new XXH64( arguments[0] )
- init.call(this, arguments[0])
- }
- /**
- * Initialize the XXH64 instance with the given seed
- * @method init
- * @param {Number|Object} seed as a number or an unsigned 32 bits integer
- * @return ThisExpression
- */
- function init (seed) {
- this.seed = seed instanceof UINT64 ? seed.clone() : UINT64(seed)
- this.v1 = this.seed.clone().add(PRIME64_1).add(PRIME64_2)
- this.v2 = this.seed.clone().add(PRIME64_2)
- this.v3 = this.seed.clone()
- this.v4 = this.seed.clone().subtract(PRIME64_1)
- this.total_len = 0
- this.memsize = 0
- this.memory = null
- return this
- }
- XXH64.prototype.init = init
- /**
- * Add data to be computed for the XXH64 hash
- * @method update
- * @param {String|Buffer|ArrayBuffer} input as a string or nodejs Buffer or ArrayBuffer
- * @return ThisExpression
- */
- XXH64.prototype.update = function (input) {
- var isString = typeof input == 'string'
- var isArrayBuffer
- // Convert all strings to utf-8 first (issue #5)
- if (isString) {
- input = toUTF8Array(input)
- isString = false
- isArrayBuffer = true
- }
- if (typeof ArrayBuffer !== "undefined" && input instanceof ArrayBuffer)
- {
- isArrayBuffer = true
- input = new Uint8Array(input);
- }
- var p = 0
- var len = input.length
- var bEnd = p + len
- if (len == 0) return this
- this.total_len += len
- if (this.memsize == 0)
- {
- if (isString) {
- this.memory = ''
- } else if (isArrayBuffer) {
- this.memory = new Uint8Array(32)
- } else {
- this.memory = new Buffer(32)
- }
- }
- if (this.memsize + len < 32) // fill in tmp buffer
- {
- // XXH64_memcpy(this.memory + this.memsize, input, len)
- if (isString) {
- this.memory += input
- } else if (isArrayBuffer) {
- this.memory.set( input.subarray(0, len), this.memsize )
- } else {
- input.copy( this.memory, this.memsize, 0, len )
- }
- this.memsize += len
- return this
- }
- if (this.memsize > 0) // some data left from previous update
- {
- // XXH64_memcpy(this.memory + this.memsize, input, 16-this.memsize);
- if (isString) {
- this.memory += input.slice(0, 32 - this.memsize)
- } else if (isArrayBuffer) {
- this.memory.set( input.subarray(0, 32 - this.memsize), this.memsize )
- } else {
- input.copy( this.memory, this.memsize, 0, 32 - this.memsize )
- }
- var p64 = 0
- if (isString) {
- var other
- other = UINT64(
- (this.memory.charCodeAt(p64+1) << 8) | this.memory.charCodeAt(p64)
- , (this.memory.charCodeAt(p64+3) << 8) | this.memory.charCodeAt(p64+2)
- , (this.memory.charCodeAt(p64+5) << 8) | this.memory.charCodeAt(p64+4)
- , (this.memory.charCodeAt(p64+7) << 8) | this.memory.charCodeAt(p64+6)
- )
- this.v1.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p64 += 8
- other = UINT64(
- (this.memory.charCodeAt(p64+1) << 8) | this.memory.charCodeAt(p64)
- , (this.memory.charCodeAt(p64+3) << 8) | this.memory.charCodeAt(p64+2)
- , (this.memory.charCodeAt(p64+5) << 8) | this.memory.charCodeAt(p64+4)
- , (this.memory.charCodeAt(p64+7) << 8) | this.memory.charCodeAt(p64+6)
- )
- this.v2.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p64 += 8
- other = UINT64(
- (this.memory.charCodeAt(p64+1) << 8) | this.memory.charCodeAt(p64)
- , (this.memory.charCodeAt(p64+3) << 8) | this.memory.charCodeAt(p64+2)
- , (this.memory.charCodeAt(p64+5) << 8) | this.memory.charCodeAt(p64+4)
- , (this.memory.charCodeAt(p64+7) << 8) | this.memory.charCodeAt(p64+6)
- )
- this.v3.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p64 += 8
- other = UINT64(
- (this.memory.charCodeAt(p64+1) << 8) | this.memory.charCodeAt(p64)
- , (this.memory.charCodeAt(p64+3) << 8) | this.memory.charCodeAt(p64+2)
- , (this.memory.charCodeAt(p64+5) << 8) | this.memory.charCodeAt(p64+4)
- , (this.memory.charCodeAt(p64+7) << 8) | this.memory.charCodeAt(p64+6)
- )
- this.v4.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- } else {
- var other
- other = UINT64(
- (this.memory[p64+1] << 8) | this.memory[p64]
- , (this.memory[p64+3] << 8) | this.memory[p64+2]
- , (this.memory[p64+5] << 8) | this.memory[p64+4]
- , (this.memory[p64+7] << 8) | this.memory[p64+6]
- )
- this.v1.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p64 += 8
- other = UINT64(
- (this.memory[p64+1] << 8) | this.memory[p64]
- , (this.memory[p64+3] << 8) | this.memory[p64+2]
- , (this.memory[p64+5] << 8) | this.memory[p64+4]
- , (this.memory[p64+7] << 8) | this.memory[p64+6]
- )
- this.v2.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p64 += 8
- other = UINT64(
- (this.memory[p64+1] << 8) | this.memory[p64]
- , (this.memory[p64+3] << 8) | this.memory[p64+2]
- , (this.memory[p64+5] << 8) | this.memory[p64+4]
- , (this.memory[p64+7] << 8) | this.memory[p64+6]
- )
- this.v3.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p64 += 8
- other = UINT64(
- (this.memory[p64+1] << 8) | this.memory[p64]
- , (this.memory[p64+3] << 8) | this.memory[p64+2]
- , (this.memory[p64+5] << 8) | this.memory[p64+4]
- , (this.memory[p64+7] << 8) | this.memory[p64+6]
- )
- this.v4.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- }
- p += 32 - this.memsize
- this.memsize = 0
- if (isString) this.memory = ''
- }
- if (p <= bEnd - 32)
- {
- var limit = bEnd - 32
- do
- {
- if (isString) {
- var other
- other = UINT64(
- (input.charCodeAt(p+1) << 8) | input.charCodeAt(p)
- , (input.charCodeAt(p+3) << 8) | input.charCodeAt(p+2)
- , (input.charCodeAt(p+5) << 8) | input.charCodeAt(p+4)
- , (input.charCodeAt(p+7) << 8) | input.charCodeAt(p+6)
- )
- this.v1.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p += 8
- other = UINT64(
- (input.charCodeAt(p+1) << 8) | input.charCodeAt(p)
- , (input.charCodeAt(p+3) << 8) | input.charCodeAt(p+2)
- , (input.charCodeAt(p+5) << 8) | input.charCodeAt(p+4)
- , (input.charCodeAt(p+7) << 8) | input.charCodeAt(p+6)
- )
- this.v2.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p += 8
- other = UINT64(
- (input.charCodeAt(p+1) << 8) | input.charCodeAt(p)
- , (input.charCodeAt(p+3) << 8) | input.charCodeAt(p+2)
- , (input.charCodeAt(p+5) << 8) | input.charCodeAt(p+4)
- , (input.charCodeAt(p+7) << 8) | input.charCodeAt(p+6)
- )
- this.v3.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p += 8
- other = UINT64(
- (input.charCodeAt(p+1) << 8) | input.charCodeAt(p)
- , (input.charCodeAt(p+3) << 8) | input.charCodeAt(p+2)
- , (input.charCodeAt(p+5) << 8) | input.charCodeAt(p+4)
- , (input.charCodeAt(p+7) << 8) | input.charCodeAt(p+6)
- )
- this.v4.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- } else {
- var other
- other = UINT64(
- (input[p+1] << 8) | input[p]
- , (input[p+3] << 8) | input[p+2]
- , (input[p+5] << 8) | input[p+4]
- , (input[p+7] << 8) | input[p+6]
- )
- this.v1.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p += 8
- other = UINT64(
- (input[p+1] << 8) | input[p]
- , (input[p+3] << 8) | input[p+2]
- , (input[p+5] << 8) | input[p+4]
- , (input[p+7] << 8) | input[p+6]
- )
- this.v2.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p += 8
- other = UINT64(
- (input[p+1] << 8) | input[p]
- , (input[p+3] << 8) | input[p+2]
- , (input[p+5] << 8) | input[p+4]
- , (input[p+7] << 8) | input[p+6]
- )
- this.v3.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- p += 8
- other = UINT64(
- (input[p+1] << 8) | input[p]
- , (input[p+3] << 8) | input[p+2]
- , (input[p+5] << 8) | input[p+4]
- , (input[p+7] << 8) | input[p+6]
- )
- this.v4.add( other.multiply(PRIME64_2) ).rotl(31).multiply(PRIME64_1);
- }
- p += 8
- } while (p <= limit)
- }
- if (p < bEnd)
- {
- // XXH64_memcpy(this.memory, p, bEnd-p);
- if (isString) {
- this.memory += input.slice(p)
- } else if (isArrayBuffer) {
- this.memory.set( input.subarray(p, bEnd), this.memsize )
- } else {
- input.copy( this.memory, this.memsize, p, bEnd )
- }
- this.memsize = bEnd - p
- }
- return this
- }
- /**
- * Finalize the XXH64 computation. The XXH64 instance is ready for reuse for the given seed
- * @method digest
- * @return {UINT64} xxHash
- */
- XXH64.prototype.digest = function () {
- var input = this.memory
- var isString = typeof input == 'string'
- var p = 0
- var bEnd = this.memsize
- var h64, h
- var u = new UINT64
- if (this.total_len >= 32)
- {
- h64 = this.v1.clone().rotl(1)
- h64.add( this.v2.clone().rotl(7) )
- h64.add( this.v3.clone().rotl(12) )
- h64.add( this.v4.clone().rotl(18) )
- h64.xor( this.v1.multiply(PRIME64_2).rotl(31).multiply(PRIME64_1) )
- h64.multiply(PRIME64_1).add(PRIME64_4)
- h64.xor( this.v2.multiply(PRIME64_2).rotl(31).multiply(PRIME64_1) )
- h64.multiply(PRIME64_1).add(PRIME64_4)
- h64.xor( this.v3.multiply(PRIME64_2).rotl(31).multiply(PRIME64_1) )
- h64.multiply(PRIME64_1).add(PRIME64_4)
- h64.xor( this.v4.multiply(PRIME64_2).rotl(31).multiply(PRIME64_1) )
- h64.multiply(PRIME64_1).add(PRIME64_4)
- }
- else
- {
- h64 = this.seed.clone().add( PRIME64_5 )
- }
- h64.add( u.fromNumber(this.total_len) )
- while (p <= bEnd - 8)
- {
- if (isString) {
- u.fromBits(
- (input.charCodeAt(p+1) << 8) | input.charCodeAt(p)
- , (input.charCodeAt(p+3) << 8) | input.charCodeAt(p+2)
- , (input.charCodeAt(p+5) << 8) | input.charCodeAt(p+4)
- , (input.charCodeAt(p+7) << 8) | input.charCodeAt(p+6)
- )
- } else {
- u.fromBits(
- (input[p+1] << 8) | input[p]
- , (input[p+3] << 8) | input[p+2]
- , (input[p+5] << 8) | input[p+4]
- , (input[p+7] << 8) | input[p+6]
- )
- }
- u.multiply(PRIME64_2).rotl(31).multiply(PRIME64_1)
- h64
- .xor(u)
- .rotl(27)
- .multiply( PRIME64_1 )
- .add( PRIME64_4 )
- p += 8
- }
- if (p + 4 <= bEnd) {
- if (isString) {
- u.fromBits(
- (input.charCodeAt(p+1) << 8) | input.charCodeAt(p)
- , (input.charCodeAt(p+3) << 8) | input.charCodeAt(p+2)
- , 0
- , 0
- )
- } else {
- u.fromBits(
- (input[p+1] << 8) | input[p]
- , (input[p+3] << 8) | input[p+2]
- , 0
- , 0
- )
- }
- h64
- .xor( u.multiply(PRIME64_1) )
- .rotl(23)
- .multiply( PRIME64_2 )
- .add( PRIME64_3 )
- p += 4
- }
- while (p < bEnd)
- {
- u.fromBits( isString ? input.charCodeAt(p++) : input[p++], 0, 0, 0 )
- h64
- .xor( u.multiply(PRIME64_5) )
- .rotl(11)
- .multiply(PRIME64_1)
- }
- h = h64.clone().shiftRight(33)
- h64.xor(h).multiply(PRIME64_2)
- h = h64.clone().shiftRight(29)
- h64.xor(h).multiply(PRIME64_3)
- h = h64.clone().shiftRight(32)
- h64.xor(h)
- // Reset the state
- this.init( this.seed )
- return h64
- }
- module.exports = XXH64
|