src/share/jaxws_classes/com/sun/xml/internal/bind/v2/util/EditDistance.java

changeset 0
373ffda63c9a
child 637
9c07ef4934dd
     1.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     1.2 +++ b/src/share/jaxws_classes/com/sun/xml/internal/bind/v2/util/EditDistance.java	Wed Apr 27 01:27:09 2016 +0800
     1.3 @@ -0,0 +1,143 @@
     1.4 +/*
     1.5 + * Copyright (c) 1997, 2011, Oracle and/or its affiliates. All rights reserved.
     1.6 + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
     1.7 + *
     1.8 + * This code is free software; you can redistribute it and/or modify it
     1.9 + * under the terms of the GNU General Public License version 2 only, as
    1.10 + * published by the Free Software Foundation.  Oracle designates this
    1.11 + * particular file as subject to the "Classpath" exception as provided
    1.12 + * by Oracle in the LICENSE file that accompanied this code.
    1.13 + *
    1.14 + * This code is distributed in the hope that it will be useful, but WITHOUT
    1.15 + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
    1.16 + * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
    1.17 + * version 2 for more details (a copy is included in the LICENSE file that
    1.18 + * accompanied this code).
    1.19 + *
    1.20 + * You should have received a copy of the GNU General Public License version
    1.21 + * 2 along with this work; if not, write to the Free Software Foundation,
    1.22 + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
    1.23 + *
    1.24 + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
    1.25 + * or visit www.oracle.com if you need additional information or have any
    1.26 + * questions.
    1.27 + */
    1.28 +
    1.29 +package com.sun.xml.internal.bind.v2.util;
    1.30 +
    1.31 +import java.util.AbstractMap;
    1.32 +import java.util.Arrays;
    1.33 +import java.util.Collection;
    1.34 +import java.util.WeakHashMap;
    1.35 +
    1.36 +/**
    1.37 + * Computes the string edit distance.
    1.38 + *
    1.39 + * <p>
    1.40 + * Refer to a computer science text book for the definition
    1.41 + * of the "string edit distance".
    1.42 + *
    1.43 + * @author
    1.44 + *     Kohsuke Kawaguchi (kohsuke.kawaguchi@sun.com)
    1.45 + */
    1.46 +public class EditDistance {
    1.47 +
    1.48 +    /**
    1.49 +     * Weak results cache to avoid additional computations.
    1.50 +     * Because of high complexity caching is required.
    1.51 +     */
    1.52 +    private static final WeakHashMap<AbstractMap.SimpleEntry<String,String>, Integer> CACHE = new WeakHashMap<AbstractMap.SimpleEntry<String, String>, Integer>();
    1.53 +
    1.54 +    /**
    1.55 +     * Computes the edit distance between two strings.
    1.56 +     *
    1.57 +     * <p>
    1.58 +     * The complexity is O(nm) where n=a.length() and m=b.length().
    1.59 +     */
    1.60 +    public static int editDistance( String a, String b ) {
    1.61 +        // let's check cache
    1.62 +        AbstractMap.SimpleEntry<String,String> entry = new AbstractMap.SimpleEntry<String, String>(a, b); // using this class to avoid creation of my own which will handle PAIR of values
    1.63 +        Integer result = null;
    1.64 +        if (CACHE.containsKey(entry))
    1.65 +            result = CACHE.get(entry); // looks like we have it
    1.66 +
    1.67 +        if (result == null) {
    1.68 +            result = new EditDistance(a, b).calc();
    1.69 +            CACHE.put(entry, result); // cache the result
    1.70 +        }
    1.71 +        return result;
    1.72 +    }
    1.73 +
    1.74 +    /**
    1.75 +     * Finds the string in the <code>group</code> closest to
    1.76 +     * <code>key</code> and returns it.
    1.77 +     *
    1.78 +     * @return null if group.length==0.
    1.79 +     */
    1.80 +    public static String findNearest( String key, String[] group ) {
    1.81 +        return findNearest(key, Arrays.asList(group));
    1.82 +    }
    1.83 +
    1.84 +    /**
    1.85 +     * Finds the string in the <code>group</code> closest to
    1.86 +     * <code>key</code> and returns it.
    1.87 +     *
    1.88 +     * @return null if group.length==0.
    1.89 +     */
    1.90 +    public static String findNearest( String key, Collection<String> group ) {
    1.91 +        int c = Integer.MAX_VALUE;
    1.92 +        String r = null;
    1.93 +
    1.94 +        for (String s : group) {
    1.95 +            int ed = editDistance(key,s);
    1.96 +            if( c>ed ) {
    1.97 +                c = ed;
    1.98 +                r = s;
    1.99 +            }
   1.100 +        }
   1.101 +        return r;
   1.102 +    }
   1.103 +
   1.104 +    /** cost vector. */
   1.105 +    private int[] cost;
   1.106 +    /** back buffer. */
   1.107 +    private int[] back;
   1.108 +
   1.109 +    /** Two strings to be compared. */
   1.110 +    private final String a,b;
   1.111 +
   1.112 +    private EditDistance( String a, String b ) {
   1.113 +        this.a=a;
   1.114 +        this.b=b;
   1.115 +        cost = new int[a.length()+1];
   1.116 +        back = new int[a.length()+1]; // back buffer
   1.117 +
   1.118 +        for( int i=0; i<=a.length(); i++ )
   1.119 +            cost[i] = i;
   1.120 +    }
   1.121 +
   1.122 +    /**
   1.123 +     * Swaps two buffers.
   1.124 +     */
   1.125 +    private void flip() {
   1.126 +        int[] t = cost;
   1.127 +        cost = back;
   1.128 +        back = t;
   1.129 +    }
   1.130 +
   1.131 +    private int min(int a,int b,int c) {
   1.132 +        return Math.min(a,Math.min(b,c));
   1.133 +    }
   1.134 +
   1.135 +    private int calc() {
   1.136 +        for( int j=0; j<b.length(); j++ ) {
   1.137 +            flip();
   1.138 +            cost[0] = j+1;
   1.139 +            for( int i=0; i<a.length(); i++ ) {
   1.140 +                int match = (a.charAt(i)==b.charAt(j))?0:1;
   1.141 +                cost[i+1] = min( back[i]+match, cost[i]+1, back[i+1]+1 );
   1.142 +            }
   1.143 +        }
   1.144 +        return cost[a.length()];
   1.145 +    }
   1.146 +}

mercurial