summaryrefslogtreecommitdiff
path: root/src/compiler/scala/tools/util/EditDistance.scala
blob: a8d7408532d984a3b99412af9793fbc985214f4d (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
/* NSC -- new Scala compiler
 * Copyright 2005-2011 LAMP/EPFL
 * @author  Paul Phillips
 */

package scala.tools
package util

object EditDistance {
  def similarString(name: String, allowed: TraversableOnce[String]): String = {
    val suggested = suggestions(name, allowed.toSeq, maxDistance = 1, maxSuggestions = 2)
    if (suggested.isEmpty) ""
    else suggested.mkString(" (similar: ", ", ", ")")
  }

  def suggestions(a: String, bs: Seq[String], maxDistance: Int, maxSuggestions: Int): Seq[String] = (
    bs map (b => (b, distance(a, b)))
      filter (_._2 <= maxDistance)
      sortBy (_._2)
      take   (maxSuggestions)
      map    (_._1)
  )

  def distance(a: String, b: String): Int = levenshtein(a, b, transpositions = true)

  def levenshtein(s: String, t: String, transpositions: Boolean): Int = {
    val n = s.length
    val m = t.length
    if (n == 0) return m
    if (m == 0) return n

    val d = Array.ofDim[Int](n + 1, m + 1)
    0 to n foreach (x => d(x)(0) = x)
    0 to m foreach (x => d(0)(x) = x)

    for (i <- 1 to n ; val s_i = s(i - 1) ; j <- 1 to m) {
      val t_j   = t(j - 1)
      val cost  = if (s_i == t_j) 0 else 1

      val c1 = d(i - 1)(j) + 1
      val c2 = d(i)(j - 1) + 1
      val c3 = d(i - 1)(j - 1) + cost

      d(i)(j) = c1 min c2 min c3

      if (transpositions) {
        if (i > 1 && j > 1 && s(i - 1) == t(j - 2) && s(i - 2) == t(j - 1))
          d(i)(j) = d(i)(j) min (d(i - 2)(j - 2) + cost)
      }
    }

    d(n)(m)
  }
}