diff -r 88b85470e72c -r f50545b5e2f1 src/share/jaxws_classes/javax/xml/bind/WhiteSpaceProcessor.java --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/src/share/jaxws_classes/javax/xml/bind/WhiteSpaceProcessor.java Tue Mar 06 16:09:35 2012 -0800 @@ -0,0 +1,198 @@ +/* + * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. Oracle designates this + * particular file as subject to the "Classpath" exception as provided + * by Oracle in the LICENSE file that accompanied this code. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + */ + +package javax.xml.bind; + +/** + * Processes white space normalization. + * + * @since 1.0 + */ +abstract class WhiteSpaceProcessor { + +// benchmarking (see test/src/ReplaceTest.java in the CVS Attic) +// showed that this code is slower than the current code. +// +// public static String replace(String text) { +// final int len = text.length(); +// StringBuffer result = new StringBuffer(len); +// +// for (int i = 0; i < len; i++) { +// char ch = text.charAt(i); +// if (isWhiteSpace(ch)) +// result.append(' '); +// else +// result.append(ch); +// } +// +// return result.toString(); +// } + + public static String replace(String text) { + return replace( (CharSequence)text ).toString(); + } + + /** + * @since 2.0 + */ + public static CharSequence replace(CharSequence text) { + int i=text.length()-1; + + // look for the first whitespace char. + while( i>=0 && !isWhiteSpaceExceptSpace(text.charAt(i)) ) + i--; + + if( i<0 ) + // no such whitespace. replace(text)==text. + return text; + + // we now know that we need to modify the text. + // allocate a char array to do it. + StringBuilder buf = new StringBuilder(text); + + buf.setCharAt(i--,' '); + for( ; i>=0; i-- ) + if( isWhiteSpaceExceptSpace(buf.charAt(i))) + buf.setCharAt(i,' '); + + return new String(buf); + } + + /** + * Equivalent of {@link String#trim()}. + * @since 2.0 + */ + public static CharSequence trim(CharSequence text) { + int len = text.length(); + int start = 0; + + while( startstart && isWhiteSpace(text.charAt(end)) ) + end--; + + if(start==0 && end==len-1) + return text; // no change + else + return text.subSequence(start,end+1); + } + + public static String collapse(String text) { + return collapse( (CharSequence)text ).toString(); + } + + /** + * This is usually the biggest processing bottleneck. + * + * @since 2.0 + */ + public static CharSequence collapse(CharSequence text) { + int len = text.length(); + + // most of the texts are already in the collapsed form. + // so look for the first whitespace in the hope that we will + // never see it. + int s=0; + while(s 0 && result.charAt(len - 1) == ' ') + result.setLength(len - 1); + // whitespaces are already collapsed, + // so all we have to do is to remove the last one character + // if it's a whitespace. + + return result; + } + + /** + * Returns true if the specified string is all whitespace. + */ + public static final boolean isWhiteSpace(CharSequence s) { + for( int i=s.length()-1; i>=0; i-- ) + if(!isWhiteSpace(s.charAt(i))) + return false; + return true; + } + + /** returns true if the specified char is a white space character. */ + public static final boolean isWhiteSpace(char ch) { + // most of the characters are non-control characters. + // so check that first to quickly return false for most of the cases. + if( ch>0x20 ) return false; + + // other than we have to do four comparisons. + return ch == 0x9 || ch == 0xA || ch == 0xD || ch == 0x20; + } + + /** + * Returns true if the specified char is a white space character + * but not 0x20. + */ + protected static final boolean isWhiteSpaceExceptSpace(char ch) { + // most of the characters are non-control characters. + // so check that first to quickly return false for most of the cases. + if( ch>=0x20 ) return false; + + // other than we have to do four comparisons. + return ch == 0x9 || ch == 0xA || ch == 0xD; + } +}