Sharing of tools to determine whether a string is Chinese or English in Java

Author：Eve Cole Update Time：2025-01-15 09:12:01

Go directly to the code:

Copy the code code as follows:
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
*
* 
* ClassName ShowChineseInUnicodeBlock
* 
* 
* Description provides an idea for determining whether a string is Chinese or English.
* 
*
* @author wangxu [email protected]
* 
* Date 2014-9-16 06:45:35 PM
* 
* @version V1.0
*
*/
public class ShowChineseInUnicodeBlock {
public static void main(String[] args) {
String str = "I love you!? ():;"",.";
char[] charArray = str.toCharArray();
for (int i = 0; i < charArray.length; i++) {
isChinese(charArray[i]);
}
String chinese = "Chinese god damn";
System.out.println(isContainChinese(chinese));
String english = "dfafdabac";
System.out.println(isEnglish(english));
}

/**
*
* 
* Title: isChinese
* 
* 
* Description: This function is used to print some characters to see what they belong to
* 
*
* @param c
*
*/
public static void isChinese(char c) {
Character.UnicodeBlock ub = Character.UnicodeBlock.of(c);
if (ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS) {
System.out.println(c + "--CJK_UNIFIED_IDEOGRAPHS");
} else if (ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS) {
System.out.println(c + "--CJK_COMPATIBILITY_IDEOGRAPHS");
} else if (ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A) {
// CJK Unified Ideographs Extension WikipediaUnicode extends Chinese characters
// CJK Unified Ideographs Extension A CJK Unified Ideographs Extension A; Ideographs Extension A
// CJK Unified Ideographs Extension B CJK Unified Ideographs Extension B
System.out.println(c + "--CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A");
} else if (ub == Character.UnicodeBlock.GENERAL_PUNCTUATION) {//General punctuation
System.out.println(c + "--GENERAL_PUNCTUATION");

} else if (ub == Character.UnicodeBlock.CJK_SYMBOLS_AND_PUNCTUATION) {
System.out.println(c + "--CJK_SYMBOLS_AND_PUNCTUATION");

} else if (ub == Character.UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS) {
System.out.println(c + "--HALFWIDTH_AND_FULLWIDTH_FORMS");

}
}

public static boolean isEnglish(String charaString) {
return charaString.matches("^[a-zA-Z]*");
}

public static boolean isContainChinese(String str) {//Detect whether it contains Chinese
String regEx = "[//u4E00-//u9FA5]+";
Pattern p = Pattern.compile(regEx);
Matcher m = p.matcher(str);
if (m.find()) {
return true;
} else {
return false;
}
}
}