Calculate the simhash value for a list of tokens


A Node.js module to calculate the simhash of a list of tokens.

npm install simhash

Simhash is a hash that returns similar hashes for similar inputs, in contrast to most other hashing algorithms, where a small change in the input yields a completely different hash.

// uses crc32 as the default hashing algorithm
var simhash = require('simhash')();
var result1 = simhash(['a', 'list', 'of', 'a', 'couple', 'of', 'tokens']);
// result1 is [0,0,0,1,0,0,1,1,1,0,1,1,0,1,1,0,1,0,0,0,1,1,0,1,0,1,0,1,0,0,1,0]
var result2 = simhash(['a', 'list', 'of', 'a', 'couple', 'of', 'tokens', '!']);
// result2 is [0,0,0,1,0,0,0,1,1,0,0,1,0,1,1,0,1,0,0,0,1,1,0,1,0,1,0,1,0,0,1,0]

You can also choose an algorithm other than the default crc32:

var simhash = require('simhash')('md5');
var result = simhash(['a', 'list', 'of', 'a', 'couple', 'of', 'tokens']);