⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 frenchstemmer.java

📁 一个很不错的词频统计程序,目前只支持英文,中文的本人正在修改中.改好后上传给大家分享
💻 JAVA
📖 第 1 页 / 共 4 页
字号:
// This file was generated automatically by the Snowball to Java compiler

package org.tartarus.snowball.ext;
import org.tartarus.snowball.SnowballProgram;
import org.tartarus.snowball.Among;

/**
 * Generated class implementing code defined by a snowball script.
 */
public class frenchStemmer extends SnowballProgram {

        private Among a_0[] = {
            new Among ( "col", -1, -1, "", this),
            new Among ( "par", -1, -1, "", this),
            new Among ( "tap", -1, -1, "", this)
        };

        private Among a_1[] = {
            new Among ( "", -1, 4, "", this),
            new Among ( "I", 0, 1, "", this),
            new Among ( "U", 0, 2, "", this),
            new Among ( "Y", 0, 3, "", this)
        };

        private Among a_2[] = {
            new Among ( "iqU", -1, 3, "", this),
            new Among ( "abl", -1, 3, "", this),
            new Among ( "I\u00E8r", -1, 4, "", this),
            new Among ( "i\u00E8r", -1, 4, "", this),
            new Among ( "eus", -1, 2, "", this),
            new Among ( "iv", -1, 1, "", this)
        };

        private Among a_3[] = {
            new Among ( "ic", -1, 2, "", this),
            new Among ( "abil", -1, 1, "", this),
            new Among ( "iv", -1, 3, "", this)
        };

        private Among a_4[] = {
            new Among ( "iqUe", -1, 1, "", this),
            new Among ( "atrice", -1, 2, "", this),
            new Among ( "ance", -1, 1, "", this),
            new Among ( "ence", -1, 5, "", this),
            new Among ( "logie", -1, 3, "", this),
            new Among ( "able", -1, 1, "", this),
            new Among ( "isme", -1, 1, "", this),
            new Among ( "euse", -1, 11, "", this),
            new Among ( "iste", -1, 1, "", this),
            new Among ( "ive", -1, 8, "", this),
            new Among ( "if", -1, 8, "", this),
            new Among ( "usion", -1, 4, "", this),
            new Among ( "ation", -1, 2, "", this),
            new Among ( "ution", -1, 4, "", this),
            new Among ( "ateur", -1, 2, "", this),
            new Among ( "iqUes", -1, 1, "", this),
            new Among ( "atrices", -1, 2, "", this),
            new Among ( "ances", -1, 1, "", this),
            new Among ( "ences", -1, 5, "", this),
            new Among ( "logies", -1, 3, "", this),
            new Among ( "ables", -1, 1, "", this),
            new Among ( "ismes", -1, 1, "", this),
            new Among ( "euses", -1, 11, "", this),
            new Among ( "istes", -1, 1, "", this),
            new Among ( "ives", -1, 8, "", this),
            new Among ( "ifs", -1, 8, "", this),
            new Among ( "usions", -1, 4, "", this),
            new Among ( "ations", -1, 2, "", this),
            new Among ( "utions", -1, 4, "", this),
            new Among ( "ateurs", -1, 2, "", this),
            new Among ( "ments", -1, 15, "", this),
            new Among ( "ements", 30, 6, "", this),
            new Among ( "issements", 31, 12, "", this),
            new Among ( "it\u00E9s", -1, 7, "", this),
            new Among ( "ment", -1, 15, "", this),
            new Among ( "ement", 34, 6, "", this),
            new Among ( "issement", 35, 12, "", this),
            new Among ( "amment", 34, 13, "", this),
            new Among ( "emment", 34, 14, "", this),
            new Among ( "aux", -1, 10, "", this),
            new Among ( "eaux", 39, 9, "", this),
            new Among ( "eux", -1, 1, "", this),
            new Among ( "it\u00E9", -1, 7, "", this)
        };

        private Among a_5[] = {
            new Among ( "ira", -1, 1, "", this),
            new Among ( "ie", -1, 1, "", this),
            new Among ( "isse", -1, 1, "", this),
            new Among ( "issante", -1, 1, "", this),
            new Among ( "i", -1, 1, "", this),
            new Among ( "irai", 4, 1, "", this),
            new Among ( "ir", -1, 1, "", this),
            new Among ( "iras", -1, 1, "", this),
            new Among ( "ies", -1, 1, "", this),
            new Among ( "\u00EEmes", -1, 1, "", this),
            new Among ( "isses", -1, 1, "", this),
            new Among ( "issantes", -1, 1, "", this),
            new Among ( "\u00EEtes", -1, 1, "", this),
            new Among ( "is", -1, 1, "", this),
            new Among ( "irais", 13, 1, "", this),
            new Among ( "issais", 13, 1, "", this),
            new Among ( "irions", -1, 1, "", this),
            new Among ( "issions", -1, 1, "", this),
            new Among ( "irons", -1, 1, "", this),
            new Among ( "issons", -1, 1, "", this),
            new Among ( "issants", -1, 1, "", this),
            new Among ( "it", -1, 1, "", this),
            new Among ( "irait", 21, 1, "", this),
            new Among ( "issait", 21, 1, "", this),
            new Among ( "issant", -1, 1, "", this),
            new Among ( "iraIent", -1, 1, "", this),
            new Among ( "issaIent", -1, 1, "", this),
            new Among ( "irent", -1, 1, "", this),
            new Among ( "issent", -1, 1, "", this),
            new Among ( "iront", -1, 1, "", this),
            new Among ( "\u00EEt", -1, 1, "", this),
            new Among ( "iriez", -1, 1, "", this),
            new Among ( "issiez", -1, 1, "", this),
            new Among ( "irez", -1, 1, "", this),
            new Among ( "issez", -1, 1, "", this)
        };

        private Among a_6[] = {
            new Among ( "a", -1, 3, "", this),
            new Among ( "era", 0, 2, "", this),
            new Among ( "asse", -1, 3, "", this),
            new Among ( "ante", -1, 3, "", this),
            new Among ( "\u00E9e", -1, 2, "", this),
            new Among ( "ai", -1, 3, "", this),
            new Among ( "erai", 5, 2, "", this),
            new Among ( "er", -1, 2, "", this),
            new Among ( "as", -1, 3, "", this),
            new Among ( "eras", 8, 2, "", this),
            new Among ( "\u00E2mes", -1, 3, "", this),
            new Among ( "asses", -1, 3, "", this),
            new Among ( "antes", -1, 3, "", this),
            new Among ( "\u00E2tes", -1, 3, "", this),
            new Among ( "\u00E9es", -1, 2, "", this),
            new Among ( "ais", -1, 3, "", this),
            new Among ( "erais", 15, 2, "", this),
            new Among ( "ions", -1, 1, "", this),
            new Among ( "erions", 17, 2, "", this),
            new Among ( "assions", 17, 3, "", this),
            new Among ( "erons", -1, 2, "", this),
            new Among ( "ants", -1, 3, "", this),
            new Among ( "\u00E9s", -1, 2, "", this),
            new Among ( "ait", -1, 3, "", this),
            new Among ( "erait", 23, 2, "", this),
            new Among ( "ant", -1, 3, "", this),
            new Among ( "aIent", -1, 3, "", this),
            new Among ( "eraIent", 26, 2, "", this),
            new Among ( "\u00E8rent", -1, 2, "", this),
            new Among ( "assent", -1, 3, "", this),
            new Among ( "eront", -1, 2, "", this),
            new Among ( "\u00E2t", -1, 3, "", this),
            new Among ( "ez", -1, 2, "", this),
            new Among ( "iez", 32, 2, "", this),
            new Among ( "eriez", 33, 2, "", this),
            new Among ( "assiez", 33, 3, "", this),
            new Among ( "erez", 32, 2, "", this),
            new Among ( "\u00E9", -1, 2, "", this)
        };

        private Among a_7[] = {
            new Among ( "e", -1, 3, "", this),
            new Among ( "I\u00E8re", 0, 2, "", this),
            new Among ( "i\u00E8re", 0, 2, "", this),
            new Among ( "ion", -1, 1, "", this),
            new Among ( "Ier", -1, 2, "", this),
            new Among ( "ier", -1, 2, "", this),
            new Among ( "\u00EB", -1, 4, "", this)
        };

        private Among a_8[] = {
            new Among ( "ell", -1, -1, "", this),
            new Among ( "eill", -1, -1, "", this),
            new Among ( "enn", -1, -1, "", this),
            new Among ( "onn", -1, -1, "", this),
            new Among ( "ett", -1, -1, "", this)
        };

        private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128, 130, 103, 8, 5 };

        private static final char g_keep_with_s[] = {1, 65, 20, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128 };

        private int I_p2;
        private int I_p1;
        private int I_pV;

        private void copy_from(frenchStemmer other) {
            I_p2 = other.I_p2;
            I_p1 = other.I_p1;
            I_pV = other.I_pV;
            super.copy_from(other);
        }

        private boolean r_prelude() {
            int v_1;
            int v_2;
            int v_3;
            int v_4;
            // repeat, line 38
            replab0: while(true)
            {
                v_1 = cursor;
                lab1: do {
                    // goto, line 38
                    golab2: while(true)
                    {
                        v_2 = cursor;
                        lab3: do {
                            // (, line 38
                            // or, line 44
                            lab4: do {
                                v_3 = cursor;
                                lab5: do {
                                    // (, line 40
                                    if (!(in_grouping(g_v, 97, 251)))
                                    {
                                        break lab5;
                                    }
                                    // [, line 40
                                    bra = cursor;
                                    // or, line 40
                                    lab6: do {
                                        v_4 = cursor;
                                        lab7: do {
                                            // (, line 40
                                            // literal, line 40
                                            if (!(eq_s(1, "u")))
                                            {
                                                break lab7;
                                            }
                                            // ], line 40
                                            ket = cursor;
                                            if (!(in_grouping(g_v, 97, 251)))
                                            {
                                                break lab7;
                                            }
                                            // <-, line 40
                                            slice_from("U");
                                            break lab6;
                                        } while (false);
                                        cursor = v_4;
                                        lab8: do {
                                            // (, line 41
                                            // literal, line 41
                                            if (!(eq_s(1, "i")))
                                            {
                                                break lab8;
                                            }
                                            // ], line 41
                                            ket = cursor;
                                            if (!(in_grouping(g_v, 97, 251)))
                                            {
                                                break lab8;
                                            }
                                            // <-, line 41
                                            slice_from("I");
                                            break lab6;
                                        } while (false);
                                        cursor = v_4;
                                        // (, line 42
                                        // literal, line 42
                                        if (!(eq_s(1, "y")))
                                        {
                                            break lab5;
                                        }
                                        // ], line 42
                                        ket = cursor;
                                        // <-, line 42
                                        slice_from("Y");
                                    } while (false);
                                    break lab4;
                                } while (false);
                                cursor = v_3;
                                lab9: do {
                                    // (, line 45
                                    // [, line 45
                                    bra = cursor;
                                    // literal, line 45
                                    if (!(eq_s(1, "y")))
                                    {
                                        break lab9;
                                    }
                                    // ], line 45
                                    ket = cursor;
                                    if (!(in_grouping(g_v, 97, 251)))
                                    {
                                        break lab9;
                                    }
                                    // <-, line 45
                                    slice_from("Y");
                                    break lab4;
                                } while (false);
                                cursor = v_3;
                                // (, line 47
                                // literal, line 47
                                if (!(eq_s(1, "q")))
                                {
                                    break lab3;
                                }
                                // [, line 47
                                bra = cursor;
                                // literal, line 47
                                if (!(eq_s(1, "u")))
                                {
                                    break lab3;
                                }
                                // ], line 47
                                ket = cursor;
                                // <-, line 47
                                slice_from("U");
                            } while (false);
                            cursor = v_2;
                            break golab2;
                        } while (false);
                        cursor = v_2;
                        if (cursor >= limit)
                        {
                            break lab1;
                        }
                        cursor++;
                    }
                    continue replab0;
                } while (false);
                cursor = v_1;
                break replab0;
            }
            return true;
        }

        private boolean r_mark_regions() {
            int v_1;
            int v_2;
            int v_4;
            // (, line 50
            I_pV = limit;
            I_p1 = limit;
            I_p2 = limit;
            // do, line 56
            v_1 = cursor;
            lab0: do {
                // (, line 56
                // or, line 58
                lab1: do {
                    v_2 = cursor;
                    lab2: do {
                        // (, line 57
                        if (!(in_grouping(g_v, 97, 251)))
                        {
                            break lab2;
                        }
                        if (!(in_grouping(g_v, 97, 251)))
                        {
                            break lab2;
                        }
                        // next, line 57
                        if (cursor >= limit)
                        {
                            break lab2;
                        }
                        cursor++;
                        break lab1;
                    } while (false);
                    cursor = v_2;
                    lab3: do {
                        // among, line 59
                        if (find_among(a_0, 3) == 0)
                        {
                            break lab3;
                        }
                        break lab1;
                    } while (false);
                    cursor = v_2;

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -