public class StringUtils
extends org.apache.commons.lang3.StringUtils
| Modifier and Type | Field and Description |
|---|---|
static int |
NUM_OF_PADDED_SPACES |
| Constructor and Description |
|---|
StringUtils() |
| Modifier and Type | Method and Description |
|---|---|
static String |
cleanForPrint(String input) |
static String |
convert(byte[] data) |
static String |
convert(byte[] data,
int offset,
int length) |
static String |
convert(ByteBuffer value) |
static byte[] |
convert(char[] word) |
static byte[] |
convert(String word) |
static void |
convertToLowerCase(char[] inputFile)
This method is faster (for some unknown reason) than String.toLowerCase().
|
static String |
createStringContext(BowString ex,
int length) |
static boolean |
crossesParagraphBoundaries(String ngram) |
static String |
escapeFileName(String inputString) |
static String |
escapeNewLine(String inputString) |
static String |
escapePathName(String inputString) |
static String |
escapeTab(String inputString) |
static String |
getFirstNgram(BowString example,
int length) |
static String |
getLastNgram(BowString example,
int length) |
static BowStringImpl |
getNextWord(BowString err,
Set<String> wordsWithPunctuation) |
static int |
getPartition(char firstLetter,
int numOfPartitions) |
static int |
getPartition(String word,
int numOfPartitions) |
static String |
getPrefix(String word,
int length,
int reductionLevel) |
static BowStringImpl |
getPrevWord(BowString err,
Set<String> wordsWithPunctuation) |
static String |
getSuffix(BowString word,
int length,
int reductionLevel) |
static String |
getSuffix(String word,
int length,
int reductionLevel) |
static boolean |
isASCIIConsonant(char c) |
static boolean |
isASCIIVowel(char c) |
static boolean |
isCapital(char letter) |
static boolean |
isPossibleName(String ngram) |
static boolean |
mightBeUrlOrEmailOrHashTag(String fullString) |
static void |
normalizeQuotationMarks(char[] extracted) |
static String |
prepareWordForIndex(String word) |
static String |
reduceCharacterDiversityLevel(int level,
String text) |
static String |
reduceCharacterDiversityLevel0(char[] word) |
static String |
reduceCharacterDiversityLevel0(String word) |
static String |
reduceCharacterDiversityLevel1(BowString word) |
static String |
reduceCharacterDiversityLevel1(char[] text) |
static String |
reduceCharacterDiversityLevel1(String word) |
static String |
reduceCharacterDiversityLevel2(BowString word) |
static String |
reduceCharacterDiversityLevel2(String word) |
static String |
reduceCharacterDiversityLevel3(String word) |
static char |
removeAccent(char orig) |
static String |
removeAccents(char[] newS) |
static String |
removeAccents(String origWord) |
static String |
removeAccentsSlow(String str) |
static void |
removeHTML(MappedText mappedText) |
static String |
removeIncorrectDash(String origWord) |
static String |
removeRedundantWhiteSpace(String origString) |
static void |
replaceAll(String regex,
String repl,
MappedText mappedText) |
static void |
replaceAll(String regex,
String repl,
MappedText mappedText,
boolean keepMapping) |
static String |
replaceHTMLEntities(String line) |
static void |
replaceMatches(List<Match> matches,
MappedText mappedText) |
static void |
replaceMatches(List<Pair<Integer,Integer>> matches,
String repl,
MappedText mappedText) |
static void |
replaceMatches(List<Pair<Integer,Integer>> matches,
String repl,
MappedText mappedText,
boolean keepWorMapping) |
static void |
replaceString(int start,
int end,
String repl,
MappedText mappedText) |
static void |
split(MappedText mappedText,
int start,
int end) |
static List<BowString> |
splitInWords(String text,
Set<String> wordsWithPunct) |
static String |
unescapeFileName(String inputString) |
static String |
unescapeNewLine(String inputString) |
static String |
unescapePathName(String inputString) |
static String |
unescapeTab(String inputString) |
static String |
urlDecode(String input) |
static String |
urlEncode(String input) |
abbreviate, abbreviate, abbreviateMiddle, appendIfMissing, appendIfMissingIgnoreCase, capitalize, center, center, center, chomp, chomp, chop, contains, contains, containsAny, containsAny, containsIgnoreCase, containsNone, containsNone, containsOnly, containsOnly, containsWhitespace, countMatches, defaultIfBlank, defaultIfEmpty, defaultString, defaultString, deleteWhitespace, difference, endsWith, endsWithAny, endsWithIgnoreCase, equals, equalsIgnoreCase, getCommonPrefix, getJaroWinklerDistance, getLevenshteinDistance, getLevenshteinDistance, indexOf, indexOf, indexOf, indexOf, indexOfAny, indexOfAny, indexOfAny, indexOfAnyBut, indexOfAnyBut, indexOfDifference, indexOfDifference, indexOfIgnoreCase, indexOfIgnoreCase, isAllLowerCase, isAllUpperCase, isAlpha, isAlphanumeric, isAlphanumericSpace, isAlphaSpace, isAnyBlank, isAnyEmpty, isAsciiPrintable, isBlank, isEmpty, isNoneBlank, isNoneEmpty, isNotBlank, isNotEmpty, isNumeric, isNumericSpace, isWhitespace, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, join, lastIndexOf, lastIndexOf, lastIndexOf, lastIndexOf, lastIndexOfAny, lastIndexOfIgnoreCase, lastIndexOfIgnoreCase, lastOrdinalIndexOf, left, leftPad, leftPad, leftPad, length, lowerCase, lowerCase, mid, normalizeSpace, ordinalIndexOf, overlay, prependIfMissing, prependIfMissingIgnoreCase, remove, remove, removeEnd, removeEndIgnoreCase, removePattern, removeStart, removeStartIgnoreCase, repeat, repeat, repeat, replace, replace, replaceChars, replaceChars, replaceEach, replaceEachRepeatedly, replaceOnce, replacePattern, reverse, reverseDelimited, right, rightPad, rightPad, rightPad, split, split, split, split, splitByCharacterType, splitByCharacterTypeCamelCase, splitByWholeSeparator, splitByWholeSeparator, splitByWholeSeparatorPreserveAllTokens, splitByWholeSeparatorPreserveAllTokens, splitPreserveAllTokens, splitPreserveAllTokens, splitPreserveAllTokens, splitPreserveAllTokens, 
startsWith, startsWithAny, startsWithIgnoreCase, strip, strip, stripAccents, stripAll, stripAll, stripEnd, stripStart, stripToEmpty, stripToNull, substring, substring, substringAfter, substringAfterLast, substringBefore, substringBeforeLast, substringBetween, substringBetween, substringsBetween, swapCase, toEncodedString, toString, trim, trimToEmpty, trimToNull, uncapitalize, upperCase, upperCase
public static final int NUM_OF_PADDED_SPACES
public static void normalizeQuotationMarks(char[] extracted)
public static boolean isASCIIVowel(char c)
public static boolean isASCIIConsonant(char c)
public static void removeHTML(MappedText mappedText)
public static void replaceMatches(List<Match> matches, MappedText mappedText)
public static void replaceMatches(List<Pair<Integer,Integer>> matches, String repl, MappedText mappedText)
public static void replaceMatches(List<Pair<Integer,Integer>> matches, String repl, MappedText mappedText, boolean keepWorMapping)
public static void convertToLowerCase(char[] inputFile)
inputFile -
public static void split(MappedText mappedText, int start, int end)
public static void replaceString(int start,
int end,
String repl,
MappedText mappedText)
public static void replaceAll(String regex, String repl, MappedText mappedText)
public static void replaceAll(String regex, String repl, MappedText mappedText, boolean keepMapping)
public static byte[] convert(String word)
public static byte[] convert(char[] word)
public static String convert(byte[] data)
public static String convert(byte[] data, int offset, int length)
public static String convert(ByteBuffer value)
public static String removeAccents(char[] newS)
public static char removeAccent(char orig)
public static int getPartition(String word, int numOfPartitions)
public static int getPartition(char firstLetter,
int numOfPartitions)
public static boolean crossesParagraphBoundaries(String ngram)
public static boolean isPossibleName(String ngram)
public static String reduceCharacterDiversityLevel1(char[] text)
public static String reduceCharacterDiversityLevel0(char[] word)
public static String reduceCharacterDiversityLevel(int level, String text)
public static boolean mightBeUrlOrEmailOrHashTag(String fullString)
public static BowStringImpl getPrevWord(BowString err, Set<String> wordsWithPunctuation)
public static BowStringImpl getNextWord(BowString err, Set<String> wordsWithPunctuation)
public static boolean isCapital(char letter)
Copyright © 2015. All rights reserved.