summaryrefslogtreecommitdiff
path: root/core/src/main/scala/com/rockymadden/stringmetric/Metric.scala
blob: f217f521b4963deb7172dceb795ed1a1a77c6dc6 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
package com.rockymadden.stringmetric

object Metric {
	import Transform.StringTransform


	/**
	 * Base contract for a metric that compares two values of the same type.
	 *
	 * @tparam A the type of the two values being compared
	 * @tparam B the type of the comparison result
	 */
	trait Metric[A, B] {
		/**
		 * Compares `a` with `b`.
		 *
		 * @param a the first value
		 * @param b the second value
		 * @return the comparison result wrapped in an `Option`; when an implementation yields `None`
		 *         is decided by that implementation and is not specified here
		 */
		def compare(a: A, b: A): Option[B]
	}


	/**
	 * A [[Metric]] whose inputs are character arrays and which additionally accepts `String` input.
	 *
	 * Implementations must provide both the inherited `compare(Array[Char], Array[Char])` and the
	 * `String` overload declared here.
	 *
	 * @tparam A the type of the comparison result
	 */
	trait StringMetric[A] extends Metric[Array[Char], A] {
		/**
		 * Compares two strings.
		 *
		 * @param a the first string
		 * @param b the second string
		 * @return the comparison result wrapped in an `Option`; when an implementation yields `None`
		 *         is decided by that implementation and is not specified here
		 */
		def compare(a: String, b: String): Option[A]
	}


	/**
	 * Gathers the metric implementations from the `similarity` and `phonetic` packages under short
	 * names and offers one `compareWith...` convenience method per metric.
	 *
	 * The result type of every member is inferred from the underlying metric, which is defined
	 * outside this file.
	 */
	object StringMetric {
		// Short aliases for the metric implementations.
		val DiceSorensen = similarity.DiceSorensenMetric
		val Hamming = similarity.HammingMetric
		val Jaccard = similarity.JaccardMetric
		val Jaro = similarity.JaroMetric
		val JaroWinkler = similarity.JaroWinklerMetric
		val Levenshtein = similarity.LevenshteinMetric
		val Metaphone = phonetic.MetaphoneMetric
		val NGram = similarity.NGramMetric
		val Nysiis = phonetic.NysiisMetric
		val Overlap = similarity.OverlapMetric
		val RefinedNysiis = phonetic.RefinedNysiisMetric
		val RefinedSoundex = phonetic.RefinedSoundexMetric
		val Soundex = phonetic.SoundexMetric
		val WeightedLevenshtein = similarity.WeightedLevenshteinMetric

		// Each method below forwards both character arrays to `compare` on the aliased metric.
		// Metrics that need configuration are first applied to it in a leading parameter list, so
		// the configured comparison can be partially applied and reused.

		/** Compares `a` and `b` using `DiceSorensen(n)`; `n` is presumably the n-gram size (TODO confirm). */
		def compareWithDiceSorensen(n: Int)(a: Array[Char], b: Array[Char]) = DiceSorensen(n).compare(a, b)

		/** Compares `a` and `b` using `Hamming`. */
		def compareWithHamming(a: Array[Char], b: Array[Char]) = Hamming.compare(a, b)

		/** Compares `a` and `b` using `Jaccard(n)`; `n` is presumably the n-gram size (TODO confirm). */
		def compareWithJaccard(n: Int)(a: Array[Char], b: Array[Char]) = Jaccard(n).compare(a, b)

		/** Compares `a` and `b` using `Jaro`. */
		def compareWithJaro(a: Array[Char], b: Array[Char]) = Jaro.compare(a, b)

		/** Compares `a` and `b` using `JaroWinkler`. */
		def compareWithJaroWinkler(a: Array[Char], b: Array[Char]) = JaroWinkler.compare(a, b)

		/** Compares `a` and `b` using `Levenshtein`. */
		def compareWithLevenshtein(a: Array[Char], b: Array[Char]) = Levenshtein.compare(a, b)

		/** Compares `a` and `b` using `Metaphone`. */
		def compareWithMetaphone(a: Array[Char], b: Array[Char]) = Metaphone.compare(a, b)

		/** Compares `a` and `b` using `NGram(n)`; `n` is presumably the n-gram size (TODO confirm). */
		def compareWithNGram(n: Int)(a: Array[Char], b: Array[Char]) = NGram(n).compare(a, b)

		/** Compares `a` and `b` using `Nysiis`. */
		def compareWithNysiis(a: Array[Char], b: Array[Char]) = Nysiis.compare(a, b)

		/** Compares `a` and `b` using `Overlap(n)`; `n` is presumably the n-gram size (TODO confirm). */
		def compareWithOverlap(n: Int)(a: Array[Char], b: Array[Char]) = Overlap(n).compare(a, b)

		/** Compares `a` and `b` using `RefinedNysiis`. */
		def compareWithRefinedNysiis(a: Array[Char], b: Array[Char]) = RefinedNysiis.compare(a, b)

		/** Compares `a` and `b` using `RefinedSoundex`. */
		def compareWithRefinedSoundex(a: Array[Char], b: Array[Char]) = RefinedSoundex.compare(a, b)

		/** Compares `a` and `b` using `Soundex`. */
		def compareWithSoundex(a: Array[Char], b: Array[Char]) = Soundex.compare(a, b)

		/**
		 * Compares `a` and `b` using `WeightedLevenshtein(delete, insert, substitute)`.
		 *
		 * The three `BigDecimal` arguments are passed through unchanged; presumably they are the
		 * per-operation weights -- confirm against `similarity.WeightedLevenshteinMetric`.
		 */
		def compareWithWeightedLevenshtein(delete: BigDecimal, insert: BigDecimal, substitute: BigDecimal)
			(a: Array[Char], b: Array[Char]) =

			WeightedLevenshtein(delete, insert, substitute).compare(a, b)
	}

	/**
	 * Wraps a [[StringMetric]] and exposes decorated variants of it.
	 *
	 * @param sm the metric being decorated
	 * @tparam A the result type produced by the metric
	 */
	final class StringMetricDecorator[A](val sm: StringMetric[A]) {
		/**
		 * A variant of `sm` that remembers the result for every `(a, b)` pair it has been asked
		 * about and answers repeated questions from that cache.
		 *
		 * Both overloads share one cache keyed on the string contents. The cache is a plain `var`
		 * holding an immutable `Map`; it is never evicted and is updated without synchronization.
		 */
		val withMemoization: StringMetric[A] = new StringMetric[A] {
			private var memo: Map[(String, String), Option[A]] = Map.empty

			// `Array#toString` returns the JVM identity string (for example "[C@1b6d3586"), not the
			// characters, so the key must be built from the array contents instead.
			override def compare(a: Array[Char], b: Array[Char]): Option[A] =
				compare(new String(a), new String(b))

			override def compare(a: String, b: String): Option[A] = {
				val key = (a, b)

				memo.get(key) match {
					// A cached `None` is a valid result and is returned as such.
					case Some(cached) => cached
					case None =>
						val computed = sm.compare(a, b)
						memo = memo + (key -> computed)
						computed
				}
			}
		}

		/**
		 * Builds a variant of `sm` that applies the given transform to both inputs before
		 * delegating to `sm.compare(Array[Char], Array[Char])`.
		 *
		 * `String` inputs are converted with `toCharArray` and routed through the same path.
		 */
		val withTransform: (StringTransform => StringMetric[A]) = (st) => new StringMetric[A] {
			override def compare(a: Array[Char], b: Array[Char]): Option[A] = sm.compare(st(a), st(b))

			override def compare(a: String, b: String): Option[A] = compare(a.toCharArray, b.toCharArray)
		}
	}
}