1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
|
package com.rockymadden.stringmetric
object Metric {
import Transform.StringTransform
/**
 * Base abstraction for comparing two values of the same type.
 *
 * @tparam A type of both values passed to `compare`
 * @tparam B type wrapped in the `Option` that `compare` returns
 */
trait Metric[A, B] {
/**
 * Compares `a` against `b`.
 *
 * @return an optional result; when an implementation yields `None` is decided by that
 *         implementation and is not specified by this trait
 */
def compare(a: A, b: A): Option[B]
}
/**
 * A `Metric` over `Array[Char]` inputs that additionally offers a `String` overload.
 *
 * Implementations must therefore provide both `compare(Array[Char], Array[Char])`
 * (inherited) and `compare(String, String)` (declared here).
 *
 * @tparam A type wrapped in the `Option` returned by both `compare` overloads
 */
trait StringMetric[A] extends Metric[Array[Char], A] {
/** Overload of `compare` that accepts `String` arguments instead of `Array[Char]`. */
def compare(a: String, b: String): Option[A]
}
/**
 * Shortcuts to the individual metric implementations found under `similarity` and `phonetic`.
 *
 * Two flavours are exposed:
 *  - capitalised aliases (`Hamming`, `NGram`, ...) that refer to the implementation itself, and
 *  - `compareWithXxx` helpers that run a single `Array[Char]` comparison through that alias.
 *
 * Helpers whose metric is configurable take the configuration in a first parameter list and
 * build the metric from it on every call before delegating to its `compare`.
 */
object StringMetric {
  // --- Aliases to the underlying implementations -------------------------------------------
  val DiceSorensen = similarity.DiceSorensenMetric
  val Hamming = similarity.HammingMetric
  val Jaccard = similarity.JaccardMetric
  val Jaro = similarity.JaroMetric
  val JaroWinkler = similarity.JaroWinklerMetric
  val Levenshtein = similarity.LevenshteinMetric
  val Metaphone = phonetic.MetaphoneMetric
  val NGram = similarity.NGramMetric
  val Nysiis = phonetic.NysiisMetric
  val Overlap = similarity.OverlapMetric
  val RefinedNysiis = phonetic.RefinedNysiisMetric
  val RefinedSoundex = phonetic.RefinedSoundexMetric
  val Soundex = phonetic.SoundexMetric
  val WeightedLevenshtein = similarity.WeightedLevenshteinMetric

  // --- One-shot comparison helpers ---------------------------------------------------------

  /** Builds `DiceSorensen(n)` and compares `a` with `b`. */
  def compareWithDiceSorensen(n: Int)(a: Array[Char], b: Array[Char]) =
    DiceSorensen(n).compare(a, b)

  /** Compares `a` with `b` using `Hamming`. */
  def compareWithHamming(a: Array[Char], b: Array[Char]) =
    Hamming.compare(a, b)

  /** Builds `Jaccard(n)` and compares `a` with `b`. */
  def compareWithJaccard(n: Int)(a: Array[Char], b: Array[Char]) =
    Jaccard(n).compare(a, b)

  /** Compares `a` with `b` using `Jaro`. */
  def compareWithJaro(a: Array[Char], b: Array[Char]) =
    Jaro.compare(a, b)

  /** Compares `a` with `b` using `JaroWinkler`. */
  def compareWithJaroWinkler(a: Array[Char], b: Array[Char]) =
    JaroWinkler.compare(a, b)

  /** Compares `a` with `b` using `Levenshtein`. */
  def compareWithLevenshtein(a: Array[Char], b: Array[Char]) =
    Levenshtein.compare(a, b)

  /** Compares `a` with `b` using `Metaphone`. */
  def compareWithMetaphone(a: Array[Char], b: Array[Char]) =
    Metaphone.compare(a, b)

  /** Builds `NGram(n)` and compares `a` with `b`. */
  def compareWithNGram(n: Int)(a: Array[Char], b: Array[Char]) =
    NGram(n).compare(a, b)

  /** Compares `a` with `b` using `Nysiis`. */
  def compareWithNysiis(a: Array[Char], b: Array[Char]) =
    Nysiis.compare(a, b)

  /** Builds `Overlap(n)` and compares `a` with `b`. */
  def compareWithOverlap(n: Int)(a: Array[Char], b: Array[Char]) =
    Overlap(n).compare(a, b)

  /** Compares `a` with `b` using `RefinedNysiis`. */
  def compareWithRefinedNysiis(a: Array[Char], b: Array[Char]) =
    RefinedNysiis.compare(a, b)

  /** Compares `a` with `b` using `RefinedSoundex`. */
  def compareWithRefinedSoundex(a: Array[Char], b: Array[Char]) =
    RefinedSoundex.compare(a, b)

  /** Compares `a` with `b` using `Soundex`. */
  def compareWithSoundex(a: Array[Char], b: Array[Char]) =
    Soundex.compare(a, b)

  /** Builds `WeightedLevenshtein(delete, insert, substitute)` and compares `a` with `b`. */
  def compareWithWeightedLevenshtein(delete: BigDecimal, insert: BigDecimal, substitute: BigDecimal)(
    a: Array[Char],
    b: Array[Char]
  ) = WeightedLevenshtein(delete, insert, substitute).compare(a, b)
}
/**
 * Adds optional behaviour on top of an existing `StringMetric` without modifying it.
 *
 * @param sm the metric being decorated; every decorated variant delegates to it
 * @tparam A type wrapped in the `Option` returned by the metric's `compare`
 */
final class StringMetricDecorator[A](val sm: StringMetric[A]) {
  /**
   * A view of `sm` that caches results per `(a, b)` argument pair.
   *
   * The cache is keyed on the ordered pair, so `(a, b)` and `(b, a)` are stored separately.
   * Entries are only ever added, and no synchronization is performed around the cache.
   */
  val withMemoization: StringMetric[A] = new StringMetric[A] {
    private val base: StringMetric[A] = sm
    private var memo: Map[(String, String), Option[A]] = Map()

    // `Array[Char].toString` returns the JVM identity string ("[C@..."), not the characters,
    // so the String must be built from the array contents for both the key and the delegate call.
    override def compare(a: Array[Char], b: Array[Char]): Option[A] =
      compare(new String(a), new String(b))

    override def compare(a: String, b: String): Option[A] = {
      val key = (a, b)
      memo.getOrElse(key, {
        // Cache miss: compute once via the wrapped metric and remember the outcome (including None).
        val result = base.compare(a, b)
        memo = memo + (key -> result)
        result
      })
    }
  }

  /**
   * Given a `StringTransform`, produces a view of `sm` that applies the transform to both
   * arguments before delegating to `sm`'s `Array[Char]` comparison. The `String` overload
   * converts its arguments with `toCharArray` and goes through the same path.
   */
  val withTransform: (StringTransform => StringMetric[A]) = (st) => new StringMetric[A] {
    private val base: StringMetric[A] = sm
    private val transform: StringTransform = st

    override def compare(a: Array[Char], b: Array[Char]): Option[A] =
      base.compare(transform(a), transform(b))

    override def compare(a: String, b: String): Option[A] =
      compare(a.toCharArray, b.toCharArray)
  }
}
}
|