public class LexerUtils
extends java.lang.Object
Modifier and Type | Method and Description |
---|---|
static java.lang.String | minimallyNormalizeCurrency(java.lang.String in) — Minimal currency normalization: at least converts the cp1252 euro symbol to its Unicode equivalent. |
static java.lang.String | normalizeAmp(java.lang.String in) — Converts an XML-escaped ampersand back into an ampersand. |
static java.lang.String | normalizeCurrency(java.lang.String in) |
static java.lang.String | processCp1252misc(java.lang.String arg) |
static java.lang.String | removeSoftHyphens(java.lang.String in) |
public static java.lang.String normalizeCurrency(java.lang.String in)
public static java.lang.String minimallyNormalizeCurrency(java.lang.String in)
public static java.lang.String removeSoftHyphens(java.lang.String in)
public static java.lang.String processCp1252misc(java.lang.String arg)
public static java.lang.String normalizeAmp(java.lang.String in)