blob: 613862f428bd3922787912724b3a4ecc2bb421f3 [file] [log] [blame]
/*
* Copyright (c) 2004, 2021 Oracle and/or its affiliates. All rights reserved.
*
* This program and the accompanying materials are made available under the
* terms of the Eclipse Distribution License v. 1.0, which is available at
* http://www.eclipse.org/org/documents/edl-v10.php.
*
* SPDX-License-Identifier: BSD-3-Clause
*/
package jakarta.xml.bind.annotation.adapters;
/**
* {@link XmlAdapter} to handle {@code xs:normalizedString}.
*
* <p>
* Replaces any tab, CR, and LF by a whitespace character ' ',
* as specified in <a href="http://www.w3.org/TR/xmlschema-2/#rf-whiteSpace">the whitespace facet 'replace'</a>
*
* @author Kohsuke Kawaguchi, Martin Grebac
* @since 1.6, JAXB 2.0
*/
public final class NormalizedStringAdapter extends XmlAdapter<String,String> {
public NormalizedStringAdapter() {}
/**
* Replace any tab, CR, and LF by a whitespace character ' ',
* as specified in <a href="http://www.w3.org/TR/xmlschema-2/#rf-whiteSpace">the whitespace facet 'replace'</a>
*/
@Override
public String unmarshal(String text) {
if(text==null) return null; // be defensive
int i=text.length()-1;
// look for the first whitespace char.
while( i>=0 && !isWhiteSpaceExceptSpace(text.charAt(i)) )
i--;
if( i<0 )
// no such whitespace. replace(text)==text.
return text;
// we now know that we need to modify the text.
// allocate a char array to do it.
char[] buf = text.toCharArray();
buf[i--] = ' ';
for( ; i>=0; i-- )
if( isWhiteSpaceExceptSpace(buf[i]))
buf[i] = ' ';
return new String(buf);
}
/**
* No-op.
*
* Just return the same string given as the parameter.
*/
@Override
public String marshal(String s) {
return s;
}
/**
* Returns true if the specified char is a white space character
* but not 0x20.
*/
protected static boolean isWhiteSpaceExceptSpace(char ch) {
// most of the characters are non-control characters.
// so check that first to quickly return false for most of the cases.
if( ch>=0x20 ) return false;
// other than we have to do four comparisons.
return ch == 0x9 || ch == 0xA || ch == 0xD;
}
}