⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 tokenizer.java

📁 Practical AI in Java 人工智能编程
💻 JAVA
字号:
import java.io.StreamTokenizer;import java.io.StringReader;import java.io.Reader;import java.util.Vector;public class Tokenizer {    static public Vector getTokens(String ss) throws Exception {        return getTokens(new StringReader(ss));    }    static public Vector getTokens(Reader reader) throws Exception {        Vector words = new Vector();        StreamTokenizer str_tok = new StreamTokenizer(reader);        while (str_tok.nextToken() !=                StreamTokenizer.TT_EOF) {            String s;            switch (str_tok.ttype) {                case StreamTokenizer.TT_EOL:                    s = ""; // ignore this                    break;                case StreamTokenizer.TT_WORD:                    s = str_tok.sval;                    break;                case StreamTokenizer.TT_NUMBER:                    s = ""; // ignore this                    break;                default:                    s = String.valueOf((char) str_tok.ttype);            }            if (s.startsWith("$")) continue;            if (s.indexOf("-") > -1) continue;            s = s.toLowerCase();            s = s.replace('"', ' ').replace('%', ' ').replace('(', ' ');            s = s.replace(')', ' ').replace('\'', ' ');            s = s.trim();            if (s.indexOf(" ") != -1) continue;            if (s.endsWith(".")) {                s = s.substring(0, s.length() - 1);            } else if (s.endsWith(",")) {                s = s.substring(0, s.length() - 1);            } else if (s.endsWith(";")) {                s = s.substring(0, s.length() - 1);            } else if (s.endsWith(":")) {                s = s.substring(0, s.length() - 1);            }            if (s.length() < 2) continue;            if (s.indexOf(".") > -1) continue;            if (s.indexOf("0") > -1) continue;            if (s.indexOf("1") > -1) continue;            if (s.indexOf("2") > -1) continue;            if (s.indexOf("3") > -1) continue;            if (s.indexOf("4") > -1) continue;            if (s.indexOf("5") > -1) continue;            if (s.indexOf("6") > -1) continue;            if (s.indexOf("7") > -1) continue;            if (s.indexOf("8") > -1) continue;            if (s.indexOf("9") > -1) continue;            words.add(s.toLowerCase());        }        return words;    }}

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -