Java中判断字符串是中文或者英文的工具类分享

时间:2022-06-16 22:33:03

直接上代码:

 

代码如下:


import java.util.regex.Matcher;
import java.util.regex.Pattern;

 

/**
 * Demonstrates one way to decide whether text is Chinese or English.
 *
 * <p>
 * Chinese detection is based on the Unicode block each code point belongs to
 * (see {@link Character.UnicodeBlock}); English detection is a plain ASCII
 * letter check.
 * </p>
 *
 * @author wangxu wangx89@126.com
 *         <p>
 *         Date 2014-9-16 06:45:35 PM
 *         </p>
 * @version V1.0
 */
public class ShowChineseInUnicodeBlock {

    /**
     * Matches a string made up solely of ASCII letters. Compiled once so that
     * repeated calls to {@link #isEnglish(String)} do not recompile the regex.
     */
    private static final Pattern ENGLISH_LETTERS = Pattern.compile("[a-zA-Z]*");

    /**
     * Small demo: prints the Unicode block of each character of a sample
     * string, then exercises {@link #isContainChinese(String)} and
     * {@link #isEnglish(String)}.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        String str = "我爱你,!?():;“”、。";
        for (char c : str.toCharArray()) {
            isChinese(c);
        }
        String chinese = "中国god damn";
        System.out.println(isContainChinese(chinese));
        String english = "dfafdabac";
        System.out.println(isEnglish(english));
    }

    /**
     * Prints which Chinese-related Unicode block a character belongs to, as
     * {@code <char>--<BLOCK_NAME>}. Characters outside the blocks listed below
     * produce no output. This is a diagnostic helper only; despite its name it
     * returns nothing.
     *
     * @param c the character to inspect
     */
    public static void isChinese(char c) {
        Character.UnicodeBlock ub = Character.UnicodeBlock.of(c);
        if (ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS) {
            System.out.println(c + "--CJK_UNIFIED_IDEOGRAPHS");
        } else if (ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS) {
            System.out.println(c + "--CJK_COMPATIBILITY_IDEOGRAPHS");
        } else if (ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A) {
            // CJK Unified Ideographs Extension A. Extension B lies outside the
            // Basic Multilingual Plane, so a single char can never be in it.
            System.out.println(c + "--CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A");
        } else if (ub == Character.UnicodeBlock.GENERAL_PUNCTUATION) {
            // General punctuation
            System.out.println(c + "--GENERAL_PUNCTUATION");
        } else if (ub == Character.UnicodeBlock.CJK_SYMBOLS_AND_PUNCTUATION) {
            System.out.println(c + "--CJK_SYMBOLS_AND_PUNCTUATION");
        } else if (ub == Character.UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS) {
            System.out.println(c + "--HALFWIDTH_AND_FULLWIDTH_FORMS");
        }
    }

    /**
     * Tells whether a string consists only of ASCII letters
     * ({@code a-z}, {@code A-Z}).
     *
     * @param charaString the string to test; may be {@code null}
     * @return {@code true} if every character is an ASCII letter (the empty
     *         string therefore yields {@code true}); {@code false} otherwise,
     *         including when {@code charaString} is {@code null}
     */
    public static boolean isEnglish(String charaString) {
        if (charaString == null) {
            return false;
        }
        return ENGLISH_LETTERS.matcher(charaString).matches();
    }

    /**
     * Checks whether a string contains at least one Chinese (Han) ideograph.
     *
     * <p>
     * The string is scanned by code point rather than by {@code char}, so
     * ideographs encoded as surrogate pairs are recognized as well.
     * Punctuation and symbols (for example the CJK Symbols and Punctuation
     * block) do not count as Chinese.
     * </p>
     *
     * @param str the string to inspect; may be {@code null}
     * @return {@code true} if any code point is a Han ideograph as defined by
     *         {@link #isHanIdeograph(int)}; {@code false} otherwise, including
     *         for {@code null} or empty input
     */
    public static boolean isContainChinese(String str) {
        if (str == null) {
            return false;
        }
        int i = 0;
        while (i < str.length()) {
            int codePoint = str.codePointAt(i);
            if (isHanIdeograph(codePoint)) {
                return true;
            }
            // Advance by 2 chars for a surrogate pair, 1 otherwise.
            i += Character.charCount(codePoint);
        }
        return false;
    }

    /**
     * Tells whether a code point lies in one of the ideograph blocks this
     * class treats as Chinese: CJK Unified Ideographs, its Extensions A and B,
     * CJK Compatibility Ideographs and the Compatibility Ideographs
     * Supplement. Ideographs in later extension blocks are not recognized.
     */
    private static boolean isHanIdeograph(int codePoint) {
        // of() may return null for code points outside any known block;
        // the identity comparisons below are null-safe.
        Character.UnicodeBlock ub = Character.UnicodeBlock.of(codePoint);
        return ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS
                || ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A
                || ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_B
                || ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS
                || ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS_SUPPLEMENT;
    }
}