/** * Removes leading and trailing whitespaces of the string * given as the parameter, then truncate any * sequnce of tab, CR, LF, and SP by a single whitespace character ' '. */ public String unmarshal(String text) { if(text==null) returnnull; // be defensive
intlen= text.length();
// most of the texts are already in the collapsed form. // so look for the first whitespace in the hope that we will // never see it. int s=0; while(s<len) { if(isWhiteSpace(text.charAt(s))) break; s++; } if(s==len) // the input happens to be already collapsed. return text;
// we now know that the input contains spaces. // let's sit down and do the collapsing normally.
StringBuilderresult=newStringBuilder(len /*allocate enough size to avoid re-allocation*/ );
booleaninStripMode=true; for (inti= s+1; i < len; i++) { charch= text.charAt(i); booleanb= isWhiteSpace(ch); if (inStripMode && b) continue; // skip this character
inStripMode = b; if (inStripMode) result.append(' '); else result.append(ch); }
// remove trailing whitespaces len = result.length(); if (len > 0 && result.charAt(len - 1) == ' ') result.setLength(len - 1); // whitespaces are already collapsed, // so all we have to do is to remove the last one character // if it's a whitespace.
// tran html encoding Strings1= result.toString(); return StringEscapeUtils.unescapeHtml(s1); }
/** * No-op. * * Just return the same string given as the parameter. */ public String marshal(String s) { return s; }
/** returns true if the specified char is a white space character. */ protectedstaticbooleanisWhiteSpace(char ch) { // most of the characters are non-control characters. // so check that first to quickly return false for most of the cases. if( ch>0x20 ) returnfalse;
// other than we have to do four comparisons. return ch == 0x9 || ch == 0xA || ch == 0xD || ch == 0x20; } }