キーワードフィルタ
7380 ワード
package filter;
import java.io.BufferedReader;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Map;
import java.util.Map.Entry;
public class Test {
static int key_max = 0; //
static String[] keys = {" ", " ", " ", " ", " "};
static String tContent = " ";
static ArrayList first = new ArrayList();
static String[] sortFirst;
static char[] charFirst;
static HashMap> map = new HashMap>();
static HashMap sortMap = new HashMap();
static HashMap charMap = new HashMap();
static void init(String[] keys) {
ArrayList temp;
String key, value;
int length;
for (String k : keys) {
if (!first.contains(k.substring(0, 1))) {
first.add(k.substring(0, 1));
}
length = k.length();
if (length > key_max) key_max = length;
for (int i = 1; i < length; i ++) {
key = k.substring(0, i);
value = k.substring(i, i + 1);
if (i == 1 && !first.contains(key)) {
first.add(key);
}
// ,
if (map.containsKey(key)) {
if (!map.get(key).contains(value)) {
map.get(key).add(value);
}
}
//
else {
temp = new ArrayList();
temp.add(value);
map.put(key, temp);
}
}
}
sortFirst = first.toArray(new String[first.size()]);
Arrays.sort(sortFirst); //
charFirst = new char[first.size()];
for (int i = 0; i < charFirst.length; i ++) {
charFirst[i] = first.get(i).charAt(0);
}
Arrays.sort(charFirst); //
String[] sortValue;
ArrayList v;
Map.Entry> entry;
Iterator>> iter = map.entrySet().iterator();
while (iter.hasNext()) {
entry = (Map.Entry>) iter.next();
v = (ArrayList)entry.getValue();
sortValue = v.toArray(new String[v.size()]);
Arrays.sort(sortValue); //
sortMap.put(entry.getKey(), sortValue);
}
char[] charValue;
iter = map.entrySet().iterator();
while (iter.hasNext()) {
entry = (Map.Entry>) iter.next();
v = (ArrayList)entry.getValue();
charValue = new char[v.size()];
for (int i = 0; i < charValue.length; i ++) {
charValue[i] = v.get(i).charAt(0);
}
Arrays.sort(charValue); //
charMap.put(entry.getKey(), charValue);
}
}
/**
*
*/
public final static String test1(String content) {
for (String k : keys) {
if (content.indexOf(k) > -1)
return k;
}
return null;
}
/**
*
*/
public final static String test2(String content) {
boolean bFirst = false;
int length = content.length();
for (int i = 0; i < length; i ++) {
if (first.contains(content.substring(i, i + 1))) {
bFirst = true;
break;
}
}
return bFirst ? test1(content) : null;
}
/**
*
*/
public final static String test3(String content) {
String r = null, f, g, c = content;
ArrayList temps;
int length = c.length();
tag : for (int i = 0; i < length - 1; i++) {
f = c.substring(i, i + 1);
if (first.contains(f)) {
for (int j = i + 1; j < length; j++) {
f = c.substring(i, j);
g = c.substring(j, j + 1);
temps = map.get(f);
if (temps == null) { //
//System.out.println("ok");
r = f;
break tag;
}
if (temps.contains(g)) {
if (j == length - 1) {
//System.out.println("find!");
r = c.substring(i, j + 1);
break tag;
}
} else { //
break;
}
}
}
}
return r;
}
/**
*
*/
public final static String test4(String content) {
String r = null, f, g, c = content;
String[] temps;
int length = c.length();
tag : for (int i = 0; i < length - 1; i++) {
f = c.substring(i, i + 1);
//
if (Arrays.binarySearch(sortFirst, f) > -1) {
for (int j = i + 1; j < length; j++) {
f = c.substring(i, j);
g = c.substring(j, j + 1);
temps = sortMap.get(f);
if (temps == null) { //
//System.out.println("ok");
r = f;
break tag;
}
//
if (Arrays.binarySearch(temps, g) > -1) {
if (j == length - 1) {
//System.out.println("find!");
r = c.substring(i, j + 1);
break tag;
}
} else { //
break;
}
}
}
}
return r;
}
/**
*
*/
public final static String test5(String content) {
String r = null, f, c = content;
char g;
char[] temps;
int length = c.length();
tag : for (int i = 0; i < length - 1; i++) {
g = c.charAt(i);
//
if (Arrays.binarySearch(charFirst, g) > -1) {
for (int j = i + 1; j < length; j++) {
f = c.substring(i, j);
g = c.charAt(j);
temps = charMap.get(f);
if (temps == null) { //
//System.out.println("ok");
r = f;
break tag;
}
//
if (Arrays.binarySearch(temps, g) > -1) {
if (j == length - 1) {
//System.out.println("find!");
r = c.substring(i, j + 1);
break tag;
}
} else { //
break;
}
}
}
}
return r;
}
/**
*
*/
public final static String test6(String content) {
String r = null, c = content;
char g;
char[] temps;
char[] keys = new char[key_max];
int length = c.length(), index;
tag : for (int i = 0; i < length - 1; i++) {
index = 0;
g = c.charAt(i);
//
if (Arrays.binarySearch(filters, g) > -1) {
continue;
}
//
if (Arrays.binarySearch(charFirst, g) > -1) {
keys[index++] = g;
for (int j = i + 1; j < length; j++) {
g = c.charAt(j);
//
if (Arrays.binarySearch(filters, g) > -1) {
continue;
}
temps = charMap.get(String.valueOf(keys, 0, index));
if (temps == null) { //
//System.out.println("ok");
r = String.valueOf(keys, 0, index);
break tag;
}
//
if (Arrays.binarySearch(temps, g) > -1) {
if (j == length - 1) {
//System.out.println("find!");
keys[index++] = g;
r = String.valueOf(keys, 0, index);
break tag;
}
} else { //
break;
}
keys[index++] = g;
}
}
}
return r;
}
public static StringBuffer read(String file) throws IOException{
BufferedReader in = new BufferedReader(new InputStreamReader(new FileInputStream(file), "GBK"));
String line = null;
StringBuffer buffer = new StringBuffer();
while((line = in.readLine())!= null){
if(line.trim().length()==0){
continue;
}
buffer.append(line);
}
return buffer;
}
// [ 、 ]
static char[] filters = " `1234567890-=[]\\qwertyuiopasdfghjklzxcvbnmQWERTYUIOPASDFGHJKLZXCVBNM;',./~!@#$%^&*()_+{}:\"?>