123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211 |
- (function() {
- 'use strict';
/**
 * Extend an Object with other Objects' properties.
 *
 * The source objects are specified as additional arguments. Own enumerable
 * properties of each source are copied (shallowly) onto `dst` in argument
 * order, so a later source overrides an earlier one. Sources that are
 * `null` or `undefined` contribute nothing.
 *
 * @param {Object} dst the object to extend (mutated in place).
 *
 * @return {Object} the final object (the same reference as `dst`).
 */
var _extend = function(dst) {
  // Borrow hasOwnProperty from Object.prototype instead of calling it on the
  // source: a source created with Object.create(null), or one that has its
  // own "hasOwnProperty" key, would otherwise throw.
  var hasOwn = Object.prototype.hasOwnProperty;
  // index 0 is dst itself, sources start at 1
  for (var i = 1; i < arguments.length; ++i) {
    var src = arguments[i];
    for (var p in src) {
      if (hasOwn.call(src, p)) dst[p] = src[p];
    }
  }
  return dst;
};
/**
 * Schedule `func` to run later instead of running it now.
 *
 * `setImmediate` is used when the environment provides it; otherwise the
 * call falls back to a zero-delay `setTimeout`.
 *
 * @param {Function} func the function to run later.
 * @return the handle returned by whichever scheduler was used.
 */
var _defer = function(func) {
  var canUseSetImmediate = (typeof setImmediate === 'function');
  return canUseSetImmediate ? setImmediate(func) : setTimeout(func, 0);
};
/**
 * Levenshtein (edit) distance between two strings.
 *
 * Based on the algorithm at http://en.wikipedia.org/wiki/Levenshtein_distance.
 * Only one row of the distance matrix (plus two scalar cells) is kept in
 * memory at a time.
 */
var Levenshtein = {
  /**
   * Calculate levenshtein distance of the two strings.
   *
   * Characters are compared with `charAt`, i.e. one UTF-16 code unit at a time.
   *
   * @param str1 String the first string.
   * @param str2 String the second string.
   * @return Integer the levenshtein distance (0 and above).
   */
  get: function(str1, str2) {
    // base cases
    if (str1 === str2) return 0;
    if (str1.length === 0) return str2.length;
    if (str2.length === 0) return str1.length;

    // prevRow is the previous matrix row; curCol/nextCol walk the current row
    var prevRow = new Array(str2.length + 1),
        curCol, nextCol, i, j, tmp;

    // initialise previous row
    for (i = 0; i < prevRow.length; ++i) {
      prevRow[i] = i;
    }

    // calculate current row distance from previous row
    for (i = 0; i < str1.length; ++i) {
      nextCol = i + 1;

      for (j = 0; j < str2.length; ++j) {
        curCol = nextCol;

        // substitution
        nextCol = prevRow[j] + ((str1.charAt(i) === str2.charAt(j)) ? 0 : 1);
        // insertion
        tmp = curCol + 1;
        if (nextCol > tmp) {
          nextCol = tmp;
        }
        // deletion
        tmp = prevRow[j + 1] + 1;
        if (nextCol > tmp) {
          nextCol = tmp;
        }

        // copy current col value into previous (in preparation for next iteration)
        prevRow[j] = curCol;
      }

      // copy last col value into previous (in preparation for next iteration)
      prevRow[j] = nextCol;
    }

    return nextCol;
  },

  /**
   * Asynchronously calculate levenshtein distance of the two strings.
   *
   * The work is done in time slices; between slices control is handed back
   * through `_defer`. Note that `cb` is invoked synchronously for the base
   * cases (equal or empty strings) and whenever the whole calculation fits
   * inside the first slice.
   *
   * @param str1 String the first string.
   * @param str2 String the second string.
   * @param cb Function callback function with signature: function(err, int distance).
   *   On success `err` is null. If the progress callback throws, `cb` is called
   *   once with the string 'Progress callback: ' + the thrown value and the
   *   calculation stops.
   * @param [options] Object additional options.
   * @param [options.progress] Function progress callback with signature: function(percentComplete).
   *   Called after each slice that did not finish the calculation. Values that
   *   are not functions are ignored.
   * @param [options.timeSlice] Number maximum time in milliseconds to compute before
   *   yielding (default 1000). At least one matrix cell is processed per slice.
   *   Values that are not non-negative numbers fall back to the default.
   */
  getAsync: function(str1, str2, cb, options) {
    options = _extend({}, {
      progress: null,
      timeSlice: 1000
    }, options);

    // Only a callable progress handler is used. A plain `!== null` test would
    // let `{progress: undefined}` through and abort a perfectly good
    // calculation with a TypeError from the progress call.
    var progress = (typeof options.progress === 'function') ? options.progress : null;
    var timeSlice = (typeof options.timeSlice === 'number' && options.timeSlice >= 0) ?
        options.timeSlice : 1000;

    // base cases
    if (str1 === str2) return cb(null, 0);
    if (str1.length === 0) return cb(null, str2.length);
    if (str2.length === 0) return cb(null, str1.length);

    // prevRow is the previous matrix row; curCol/nextCol walk the current row
    var prevRow = new Array(str2.length + 1),
        curCol, nextCol,
        i, j, tmp,
        startTime;

    // initialise previous row
    for (i = 0; i < prevRow.length; ++i) {
      prevRow[i] = i;
    }

    // state carried across slices: the next cell to compute is (i, j + 1)
    nextCol = 1;
    i = 0;
    j = -1;

    var __calculate = function() {
      // reset timer
      startTime = Date.now();

      // keep going until the time slice has elapsed (always at least one cell)
      do {
        // reached end of current row?
        if (str2.length <= (++j)) {
          // copy current into previous (in preparation for next iteration)
          prevRow[j] = nextCol;

          // if already done all chars
          if (str1.length <= (++i)) {
            return cb(null, nextCol);
          }
          // else if we have more left to do
          else {
            nextCol = i + 1;
            j = 0;
          }
        }

        // calculation
        curCol = nextCol;

        // substitution
        nextCol = prevRow[j] + ((str1.charAt(i) === str2.charAt(j)) ? 0 : 1);
        // insertion
        tmp = curCol + 1;
        if (nextCol > tmp) {
          nextCol = tmp;
        }
        // deletion
        tmp = prevRow[j + 1] + 1;
        if (nextCol > tmp) {
          nextCol = tmp;
        }

        // copy current into previous (in preparation for next iteration)
        prevRow[j] = curCol;
      } while (Date.now() - startTime < timeSlice);

      // send a progress update?
      if (progress !== null) {
        try {
          progress.call(null, (i * 100.0 / str1.length));
        } catch (err) {
          // String() rather than err.toString(): the thrown value may be
          // null or undefined, which have no toString method.
          return cb('Progress callback: ' + String(err));
        }
      }

      // next iteration
      _defer(__calculate);
    };

    __calculate();
  }
};
/**
 * Expose `Levenshtein` through the first environment detected, checked in
 * this order: AMD loader, CommonJS module, web worker, browser main thread.
 * Nothing is exported when none of them is detected.
 */
var _publish = function() {
  // amd
  if (typeof define !== "undefined" && define !== null && define.amd) {
    define(function() {
      return Levenshtein;
    });
    return;
  }

  // commonjs
  if (typeof module !== "undefined" && module !== null && typeof exports !== "undefined" && module.exports === exports) {
    module.exports = Levenshtein;
    return;
  }

  // web worker
  if (typeof self !== "undefined" && typeof self.postMessage === 'function' && typeof self.importScripts === 'function') {
    self.Levenshtein = Levenshtein;
    return;
  }

  // browser main thread
  if (typeof window !== "undefined" && window !== null) {
    window.Levenshtein = Levenshtein;
  }
};
_publish();
- }());
|