︙ | | | ︙ | |
119
120
121
122
123
124
125
126
127
128
129
130
131
132
|
} else {
table[i+1][j+1] = 0;
}
}
}
return longestCommonSubstring;
},
distanceDamerauLevenshtein: function (s1, s2) {
// distance of Damerau-Levenshtein between <s1> and <s2>
// https://fr.wikipedia.org/wiki/Distance_de_Damerau-Levenshtein
try {
let nLen1 = s1.length;
let nLen2 = s2.length;
|
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
>
|
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
|
} else {
table[i+1][j+1] = 0;
}
}
}
return longestCommonSubstring;
},
distanceDamerauLevenshteinX: function (s1, s2) {
// distance of Damerau-Levenshtein between <s1> and <s2>
// https://fr.wikipedia.org/wiki/Distance_de_Damerau-Levenshtein
try {
let nLen1 = s1.length;
let nLen2 = s2.length;
let matrix = [];
for (let i = 0; i <= nLen1+1; i++) {
matrix[i] = new Array(nLen2 + 2);
}
for (let i = 0; i <= nLen1+1; i++) {
matrix[i][0] = i;
}
for (let j = 0; j <= nLen2+1; j++) {
matrix[0][j] = j;
}
for (let i = 1; i <= nLen1; i++) {
for (let j = 1; j <= nLen2; j++) {
//let nCost = (s1[i-1] === s2[j-1]) ? 0 : 1;
let nCost = char_player.distanceBetweenChars(s1[i-1], s2[j-1]);
matrix[i][j] = Math.min(
matrix[i-1][j] + 1, // Deletion
matrix[i][j-1] + 1, // Insertion
matrix[i-1][j-1] + nCost // Substitution
);
if (i > 1 && j > 1 && s1[i] == s2[j-1] && s1[i-1] == s2[j]) {
matrix[i][j] = Math.min(matrix[i][j], matrix[i-2][j-2] + nCost); // Transposition
}
}
}
return matrix[nLen1][nLen2];
}
catch (e) {
console.error(e);
}
},
distanceDamerauLevenshtein: function (s1, s2) {
// distance of Damerau-Levenshtein between <s1> and <s2>
// https://fr.wikipedia.org/wiki/Distance_de_Damerau-Levenshtein
try {
let nLen1 = s1.length;
let nLen2 = s2.length;
|
︙ | | | ︙ | |
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
|
catch (e) {
console.error(e);
}
},
distanceJaroWinkler: function(a, b, boost = .666) {
// https://github.com/thsig/jaro-winkler-JS
//if (a == b) { return 1.0; }
let a_len = a.length;
let b_len = b.length;
let a_flag = [];
let b_flag = [];
let search_range = Math.floor(Math.max(a_len, b_len) / 2) - 1;
let minv = Math.min(a_len, b_len);
|
|
|
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
|
catch (e) {
console.error(e);
}
},
distanceJaroWinkler: function(a, b, boost = .666) {
// https://github.com/thsig/jaro-winkler-JS
if (a == b) { return 1.0; }
let a_len = a.length;
let b_len = b.length;
let a_flag = [];
let b_flag = [];
let search_range = Math.floor(Math.max(a_len, b_len) / 2) - 1;
let minv = Math.min(a_len, b_len);
|
︙ | | | ︙ | |
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
|
lcss += local_cs;
return Math.round(Math.max(l1, l2) - lcss);
},
showDistance: function (s1, s2) {
console.log(`${s1} ≠ ${s2}`);
let nDL = this.distanceDamerauLevenshtein(s1, s2);
let nS4 = this.distanceSift4(s1, s2);
let fJW = this.distanceJaroWinkler(s1, s2);
console.log(`DL: ${nDL} — S4: ${nS4} — JW: ${fJW}`);
},
// Suffix only
defineSuffixCode: function (sFlex, sStem) {
/*
Returns a string defining how to get stem from flexion
"n(sfx)"
|
>
|
|
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
|
lcss += local_cs;
return Math.round(Math.max(l1, l2) - lcss);
},
showDistance: function (s1, s2) {
console.log(`${s1} ≠ ${s2}`);
let nDL = this.distanceDamerauLevenshtein(s1, s2);
let fDLX = this.distanceDamerauLevenshteinX(s1, s2);
let nS4 = this.distanceSift4(s1, s2);
let fJW = this.distanceJaroWinkler(s1, s2);
console.log(`DL: ${nDL} DLX: ${fDLX} — S4: ${nS4} — JW: ${fJW}`);
},
// Suffix only
defineSuffixCode: function (sFlex, sStem) {
/*
Returns a string defining how to get stem from flexion
"n(sfx)"
|
︙ | | | ︙ | |
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
|
if (typeof exports !== 'undefined') {
    // CommonJS environment: expose the public functions of str_transform
    // on the module's exports object, in the order listed below.
    for (const sName of [
        "simplifyWord",
        "numbersToExponent",
        "spellingNormalization",
        "longestCommonSubstring",
        "distanceDamerauLevenshtein",
        "distanceJaroWinkler",
        "showDistance",
        "changeWordWithSuffixCode",
        "changeWordWithAffixCode",
        "defineAffixCode",
        "defineSuffixCode"
    ]) {
        exports[sName] = str_transform[sName];
    }
}
|
>
|
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
|
if (typeof exports !== 'undefined') {
    // CommonJS environment: expose the public functions of str_transform
    // on the module's exports object, in the order listed below.
    for (const sName of [
        "simplifyWord",
        "numbersToExponent",
        "spellingNormalization",
        "longestCommonSubstring",
        "distanceDamerauLevenshteinX",
        "distanceDamerauLevenshtein",
        "distanceJaroWinkler",
        "showDistance",
        "changeWordWithSuffixCode",
        "changeWordWithAffixCode",
        "defineAffixCode",
        "defineSuffixCode"
    ]) {
        exports[sName] = str_transform[sName];
    }
}
|