Disable keyers that are superseded by others.

This commit is contained in:
Antonin Delpeuch 2018-12-30 21:20:17 +01:00
parent 22cf0517b9
commit 626c17c649
2 changed files with 12 additions and 4 deletions

View File

@ -46,12 +46,15 @@ public class KeyerFactory {
static final private List<String> _keyerNames = new LinkedList<>();
static {
// Some keyers are disabled as they are superseded by others
// See https://github.com/OpenRefine/OpenRefine/pull/1906
put("fingerprint", new FingerprintKeyer());
put("ngram-fingerprint", new NGramFingerprintKeyer());
put("metaphone", new MetaphoneKeyer());
put("double-metaphone", new DoubleMetaphoneKeyer());
// put("metaphone", new MetaphoneKeyer());
// put("double-metaphone", new DoubleMetaphoneKeyer());
put("metaphone3", new Metaphone3Keyer());
put("soundex", new SoundexKeyer());
// put("soundex", new SoundexKeyer());
put("cologne-phonetic", new ColognePhoneticKeyer());
}

View File

@ -55,13 +55,18 @@ public class DistanceFactory {
static {
put("levenshtein", new VicinoDistance(new LevenshteinDistance()));
put("ppm", new VicinoDistance(new PPMDistance()));
// Distances not activated as they are not very useful:
// See https://github.com/OpenRefine/OpenRefine/pull/1906
/*
put("jaccard", new VicinoDistance(new JaccardDistance()));
put("jaro", new VicinoDistance(new JaroDistance()));
put("jaro-winkler", new VicinoDistance(new JaroWinklerDistance()));
put("jaro-winkler-tfidf", new VicinoDistance(new JaroWinklerTFIDFDistance()));
put("gzip", new VicinoDistance(new GZipDistance()));
put("bzip2", new VicinoDistance(new BZip2Distance()));
put("ppm", new VicinoDistance(new PPMDistance()));
*/
}
/**