当前位置: 首页 > 工具软件 > Emojicon > 使用案例 >

判别是否包含了emojicon表情

王鹏飞
2023-12-01

public static String filterEmoji(String source) { 
          if (source != null )
          {
              Pattern emoji = Pattern.compile ( "[\ud83c\udc00-\ud83c\udfff]|[\ud83d\udc00-\ud83d\udfff]|[\u2600-\u27ff]" ,Pattern.UNICODE_CASE | Pattern . CASE_INSENSITIVE ) ;
              Matcher emojiMatcher = emoji.matcher(source);
              if ( emojiMatcher.find())
              {
                  source = emojiMatcher.replaceAll( "*" );
                  return source ;
              }
          return source;
         }
         return source; 
      }
 
如果没有改变的话,可以在该类中书写以下代码:
private static final long serialVersionUID = -5916500037685553487L;
    public void destroy() {
       // TODO Auto-generated method stub
    }

    @SuppressWarnings("unchecked")
    public void doFilter(ServletRequest request, ServletResponse response,
        FilterChain arg2) throws IOException, ServletException {
       HttpServletRequest servletrequest = (HttpServletRequest) request;
       //新加代码http://www.2cto.com/kf/201512/455191.html
       HttpServletResponse servletresponse = (HttpServletResponse) response;
       String param = "";
       String paramValue = "";

       servletresponse.setContentType("text/html");
       servletresponse.setCharacterEncoding("UTF-8");
       servletrequest.setCharacterEncoding("UTF-8");
       java.util.Enumeration params = request.getParameterNames();
       while (params.hasMoreElements()) {

        param = (String) params.nextElement();
        String[] values = servletrequest.getParameterValues(param);//获得每个参数的value
       
        for (int i = 0; i < values.length; i++) {

         paramValue = values[i];
        
         
         paramValue = paramValue.replaceAll("<script>", "(*");
         paramValue = paramValue.replaceAll("</script>", ")");
         paramValue = paramValue.replaceAll("[\ud83c\udc00-\ud83c\udfff]|[\ud83d\udc00-\ud83d\udfff]|[\u2600-\u27ff]", ""); //过滤emoji表情
        
         
        //这里还可以增加,如领导人 自动转义成****,可以从数据库中读取非法关键字。
         values[i] = paramValue;
        }

    //把转义后的参数重新放回request中
        request.setAttribute(param, paramValue);
       }
       //继续向下

       arg2.doFilter(request, response);

    }

    public void init(FilterConfig arg0) throws ServletException {
       // 初始化

    }
}
  





public static String filterEmoji(String source) {  

      if (!containsEmoji(source)) {  
       return source;// 如果不包含,直接返回  
      }  
        
      StringBuilder buf = null;  
      int len = source.length();  
      for (int i = 0; i < len; i++) {  
       char codePoint = source.charAt(i);  
       if (!isEmojiCharacter(codePoint)) {  
        if (buf == null) {  
         buf = new StringBuilder(source.length());  
        }  
        buf.append(codePoint);  
       } else {  
       }  
      }  
      if (buf == null) {  
       return "";  
      } else {  
       if (buf.length() == len) {// 这里的意义在于尽可能少的toString,因为会重新生成字符串  
        buf = null;  
        return source;  
       } else {  
        return buf.toString();  
       }  
      }  
     }  
       


    // 判别是否包含Emoji表情  
     private static boolean containsEmoji(String str) {  
      int len = str.length();  
      for (int i = 0; i < len; i++) {  
       if (isEmojiCharacter(str.charAt(i))) {  
        return true;  
       }  
      }  
      return false;  
     }  
       
     private static boolean isEmojiCharacter(char codePoint) {  
            return !((codePoint == 0x0) ||  
                    (codePoint == 0x9) ||  
                    (codePoint == 0xA) ||  
                    (codePoint == 0xD) ||  
                    ((codePoint >= 0x20) && (codePoint <= 0xD7FF)) ||  
                    ((codePoint >= 0xE000) && (codePoint <= 0xFFFD)) ||  
                    ((codePoint >= 0x10000) && (codePoint <= 0x10FFFF)));  
        }  


 类似资料: