/**
* 除去数字
*
* @param title
* @return
*/
private static String parseTitle(String title) {
char[] charArray = title.toCharArray();
char[] chars = null;// 除去数字后的数组
for (int i = 0; i < charArray.length; i++) {
char c = charArray[i];
if (isChinese(c) || Character.isLetter(c)) {
chars = new char[charArray.length - i];
System.arraycopy(charArray, i, chars, 0, charArray.length - i);
break;
}
}
return new String(chars);
}
/**
* 汉字在前,英文在后
* @param title
* @return
*/
public static String getCNTitle(String title) {
char[] chars = title.toCharArray();
char[] result = null;
int length = chars.length;
for (int i = length - 1; i >= 0; i--) {
char c = chars[i];
if (isChinese(c)) {
char cc = chars[i + 1];
if (Character.isDigit(cc)) {
result = new char[i + 2];
System.arraycopy(chars, 0, result, 0, i + 2);
break;
} else {
result = new char[i + 1];
System.arraycopy(chars, 0, result, 0, i + 1);
break;
}
}
}
String s = new String(result);
return replaceBlank(s);
}
public static String getENTitle(String title) {
char[] chars = title.toCharArray();
char[] result = null;
int length = chars.length;
for (int i = length - 1; i >= 0; i--) {
char c = chars[i];
if (isChinese(c)) {
char cc = chars[i + 1];
if (Character.isDigit(cc)) {
result = new char[length - i - 2];
System.arraycopy(chars, i + 2, result, 0, length - i - 2);
break;
} else {
result = new char[length - i - 1];
System.arraycopy(chars, i + 1, result, 0, length - i - 1);
break;
}
}
}
String s = new String(result);
return replaceBlank(s);
}
private static String replaceBlank(String s) {
Pattern p = Pattern.compile("\\s*|\t|\r|\n");
Matcher m = p.matcher(s);
String after = m.replaceAll("");
return after;
}
private static boolean isChinese(char c) {
Character.UnicodeBlock ub = Character.UnicodeBlock.of(c);
if (ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS
|| ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS
|| ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A
|| ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B
|| ub == Character.UnicodeBlock.CJK_SYMBOLS_AND_PUNCTUATION
|| ub == Character.UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS
|| ub == Character.UnicodeBlock.GENERAL_PUNCTUATION) {
return true;
}
return false;
}
Java中的字符串的中英文处理
最新推荐文章于 2023-03-07 14:50:09 发布