package tf_idf;
import java.io.BufferedReader;
import java.io.FileReader;
import java.io.IOException;
import java.util.StringTokenizer;
import java.util.Vector;
/**
 * Reads a tagged text file and prints, for each processed line, the tokens
 * whose tag is in the accepted-tag list (currently only {@code "N"}).
 *
 * <p>Input handling, as implemented: the first line of the file is discarded
 * (header, "SOF"). The remaining lines are consumed in pairs: the first line
 * of each pair is only checked for end of input or the literal {@code "EOF"}
 * marker and is otherwise ignored; the second line of the pair is tokenized
 * and filtered. One output line is written to standard output per filtered
 * input line.
 *
 * <p>NOTE(review): the file is read with the platform default charset, as in
 * the original code; confirm that this matches the encoding of the data file.
 */
public class fileFilter {
    /** Accepted tags; a record contributes to the output only if its tag is listed here. */
    private final Vector<String> v = new Vector<String>();

    /**
     * Filters {@code orgFile} and prints the result to standard output.
     *
     * <p>I/O failures (including a missing input file) are reported with a
     * stack trace on standard error; they are not rethrown.
     *
     * @param orgFile  path of the input file to read
     * @param destFile currently unused; kept so that existing callers keep compiling
     */
    public fileFilter(String orgFile, String destFile) {
        v.add("N");

        // try-with-resources guarantees the reader (and the wrapped FileReader)
        // is closed on every exit path; the original never closed it.
        try (BufferedReader inFile = new BufferedReader(new FileReader(orgFile))) {
            inFile.readLine(); // skip the header line (SOF)

            String line;
            while ((line = inFile.readLine()) != null && !line.equals("EOF")) {
                // Only every second line carries the data to filter, so the line
                // read in the loop condition is dropped and its partner is used.
                line = inFile.readLine();
                if (line == null) {
                    // Unpaired trailing line and no EOF marker: nothing left to
                    // process. Without this guard the tokenizer would throw a
                    // NullPointerException.
                    break;
                }
                System.out.println(filterLine(line));
            }
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Extracts the tokens of one data line whose tag is in {@link #v}.
     *
     * <p>The line is expected to start with a line number terminated by
     * {@code ':'}, followed by records read as: one {@code ':'}-delimited
     * token (ignored), one {@code ':'}-delimited tag, and, only when the tag is
     * accepted, everything up to the next space. Because the tokenizer is
     * positioned on the {@code ':'} that follows the tag when the delimiter is
     * switched to a space, that {@code ':'} is part of the kept token.
     * NOTE(review): this leading {@code ':'} is preserved from the original
     * behavior; confirm against the real file format whether it is wanted.
     *
     * @param line one data line, never {@code null}
     * @return the kept tokens, each followed by a single space; empty if none
     */
    private String filterLine(String line) {
        StringBuilder kept = new StringBuilder();
        StringTokenizer st = new StringTokenizer(line, ":");
        try {
            st.nextToken(); // drop the line number

            // hasMoreTokens() uses whichever delimiter set was installed last
            // (":" or " "), exactly as in the original loop.
            while (st.hasMoreTokens()) {
                st.nextToken(":");              // first field of the record, not used
                String tag = st.nextToken(":"); // tag that decides whether to keep
                if (v.contains(tag)) {
                    kept.append(st.nextToken(" ")).append(" ");
                }
            }
        } catch (java.util.NoSuchElementException ignored) {
            // The line was empty or ended in the middle of a record. Keep what
            // was collected so far instead of aborting the whole run with an
            // unchecked exception.
        }
        return kept.toString();
    }

    /**
     * Runs the filter on a fixed sample file.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String args[]) {
        new fileFilter("C:\\tf_idf\\2_ds_posinfo.txt", "kk");
    }
}
// [blog page footer] No comments:
// [blog page footer] Post a comment