具体代码如下所示:
/**
 * Tells whether a character lies in one of the Unicode blocks that this
 * utility treats as Chinese text.
 *
 * <p>The accepted blocks are CJK Unified Ideographs, CJK Compatibility
 * Ideographs, CJK Unified Ideographs Extension A, General Punctuation,
 * CJK Symbols and Punctuation, and Halfwidth and Fullwidth Forms. The
 * punctuation and full-width blocks are included so that punctuation
 * commonly found in Chinese text is not mistaken for garbage.
 *
 * @param c the character to classify
 * @return {@code true} if {@code c} belongs to one of the blocks listed above
 */
public static boolean ischinese(char c) {
    Character.UnicodeBlock ub = Character.UnicodeBlock.of(c);
    return ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS
            || ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS
            || ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A
            || ub == Character.UnicodeBlock.GENERAL_PUNCTUATION
            || ub == Character.UnicodeBlock.CJK_SYMBOLS_AND_PUNCTUATION
            || ub == Character.UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS;
}
/**
* 判断字符串是否是乱码
*
* @param strname 字符串
* @return 是否是乱码
*/
public static boolean ismessycode(string strname) {
pattern p = pattern.compile( "\s*|t*|r*|n*" );
matcher m = p.matcher(strname);
string after = m.replaceall( "" );
string temp = after.replaceall( "\p{p}" , "" );
char [] ch = temp.trim().tochararray();
float chlength = ch.length;
float count = 0 ;
for ( int i = 0 ; i < ch.length; i++) {
char c = ch[i];
if (!character.isletterordigit(c)) {
if (!ischinese(c)) {
count = count + 1 ;
}
}
}
float result = count / chlength;
if (result > 0.4 ) {
return true ;
} else {
return false ;
}
}
/**
 * Small demonstration: prints the verdict of {@code ismessycode} for a
 * mis-decoded sample string and for a well-formed Chinese string.
 *
 * @param args command-line arguments; not used
 */
public static void main(String[] args) {
    // Sample of text decoded with the wrong charset.
    System.out.println(ismessycode( "ã©å¸â©ã©â¡âºã¥â¹â³" ));
    // Ordinary Chinese text.
    System.out.println(ismessycode( "你好" ));
}
总结
以上就是小编给大家介绍的 Java 判断字符串是否含有乱码的实例代码,希望对大家有所帮助。如果大家有任何疑问,请给我留言,小编会及时回复大家的。在此也非常感谢大家对服务器之家网站的支持!
原文链接:https://blog.csdn.net/albg_boy/article/details/83988152