功能非常强大的敏感字符处理Java类

jopen 11年前

敏感字符的处理,性能非常好,采用文件的方式,可通过代码增加敏感词等强大的功能

依赖apache的io 和lang包

package com.wiker;      import java.io.File;  import java.io.IOException;  import java.util.ArrayList;  import java.util.List;    import org.apache.commons.io.FileUtils;  import org.apache.commons.io.LineIterator;  import org.apache.commons.lang.StringUtils;    /**   * 敏感字词处理类   * @author Wiker   * @date 2010-1-11 下午10:51:30   */  public class BadWord {     private final static File wordfilter = new File("C:/wordfilter.txt");     private static long lastModified = 0L;   private static List<String> words = new ArrayList<String>();      private static void checkReload(){    if(wordfilter.lastModified() > lastModified){     synchronized(BadWord.class){      try{       lastModified = wordfilter.lastModified();       LineIterator lines = FileUtils.lineIterator(wordfilter, "utf-8");       while(lines.hasNext()){        String line = lines.nextLine();        if(StringUtils.isNotBlank(line))         words.add(StringUtils.trim(line).toLowerCase());       }      }catch(IOException e){       e.printStackTrace();      }     }    }   }      /**    * 检查敏感字内容    * @param contents    */   public static String check(String ...contents) {    if(!wordfilter.exists())     return null;    checkReload();    for(String word : words){     for(String content : contents)      if(content!=null && content.indexOf(word) >= 0)       return word;    }    return null;   }      /**    * 检查字符串是否包含敏感词    *    * @param content    * @return    */   public static boolean isContain(String content) {       if(!wordfilter.exists())           return false;       checkReload();       for(String word : words){              if(content!=null && content.indexOf(word) >= 0)                  return true;       }       return false;   }      /**    * 替换掉字符串中的敏感词    *    * @param str 等待替换的字符串    * @param replaceChar 替换字符    * @return    */   public static String replace(String str,String replaceChar){       checkReload();          for(String word : words){              if(str.indexOf(word)>=0){                  String reChar = "";                  for(int i=0;i<word.length();i++){                      reChar += replaceChar;                  }                  str = str.replaceAll(word, reChar);              }          }          return str;   }      public static List<String> lists() {    checkReload();    return words;   }      /**    * 添加敏感词    *    * @param word    * @throws IOException    */   public static void add(String word) throws IOException {    word = word.toLowerCase();    if(!words.contains(word)){     words.add(word);     FileUtils.writeLines(wordfilter, "UTF-8", words);     lastModified = wordfilter.lastModified();    }   }     /**    * 删除敏感词    *    * @param word    * @throws IOException    */   public static void delete(String word) throws IOException {    word = word.toLowerCase();    words.remove(word);    FileUtils.writeLines(wordfilter, "UTF-8", words);    lastModified = wordfilter.lastModified();   }      public static void main(String[] args) throws Exception{          System.out.println(BadWord.replace("中国共产党钓鱼岛","*"));          System.out.println(BadWord.isContain("岛"));          BadWord.add("傻逼");      }     }
来自:http://blog.csdn.net/wiker_yong/article/details/16823535