⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 turkishstemmer.java

📁 一个很不错的词频统计程序,目前只支持英文,中文的本人正在修改中.改好后上传给大家分享
💻 JAVA
📖 第 1 页 / 共 5 页
字号:
// This file was generated automatically by the Snowball to Java compiler

package org.tartarus.snowball.ext;
import org.tartarus.snowball.SnowballProgram;
import org.tartarus.snowball.Among;

/**
 * Generated class implementing code defined by a snowball script.
 */
public class turkishStemmer extends SnowballProgram {

        // Among table a_0 (10 entries): "m", "n", and m/n followed by "iz", "uz",
        // U+00FC + "z" (u-umlaut) or U+0131 + "z" (dotless i). Every entry passes -1, -1, "", this.
        // NOTE(review): presumably the possessive endings (mark_possessives in the Snowball
        // Turkish script); the code that searches this table is outside this view - confirm.
        private Among a_0[] = {
            new Among ( "m", -1, -1, "", this),
            new Among ( "n", -1, -1, "", this),
            new Among ( "miz", -1, -1, "", this),
            new Among ( "niz", -1, -1, "", this),
            new Among ( "muz", -1, -1, "", this),
            new Among ( "nuz", -1, -1, "", this),
            new Among ( "m\u00FCz", -1, -1, "", this),
            new Among ( "n\u00FCz", -1, -1, "", this),
            new Among ( "m\u0131z", -1, -1, "", this),
            new Among ( "n\u0131z", -1, -1, "", this)
        };

        // Among table a_1: "leri" and "lar" + U+0131 (dotless i). Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_lArI of the Snowball Turkish script - confirm.
        private Among a_1[] = {
            new Among ( "leri", -1, -1, "", this),
            new Among ( "lar\u0131", -1, -1, "", this)
        };

        // Among table a_2: "n" followed by i, u, U+00FC (u-umlaut) or U+0131 (dotless i).
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_nU of the Snowball Turkish script - confirm.
        private Among a_2[] = {
            new Among ( "ni", -1, -1, "", this),
            new Among ( "nu", -1, -1, "", this),
            new Among ( "n\u00FC", -1, -1, "", this),
            new Among ( "n\u0131", -1, -1, "", this)
        };

        // Among table a_3: i, u, U+00FC (u-umlaut) or U+0131 (dotless i) followed by "n".
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_nUn of the Snowball Turkish script - confirm.
        private Among a_3[] = {
            new Among ( "in", -1, -1, "", this),
            new Among ( "un", -1, -1, "", this),
            new Among ( "\u00FCn", -1, -1, "", this),
            new Among ( "\u0131n", -1, -1, "", this)
        };

        // Among table a_4: the single letters "a" and "e". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_yA of the Snowball Turkish script - confirm.
        private Among a_4[] = {
            new Among ( "a", -1, -1, "", this),
            new Among ( "e", -1, -1, "", this)
        };

        // Among table a_5: "na" and "ne". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_nA of the Snowball Turkish script - confirm.
        private Among a_5[] = {
            new Among ( "na", -1, -1, "", this),
            new Among ( "ne", -1, -1, "", this)
        };

        // Among table a_6: d/t followed by a/e ("da", "ta", "de", "te").
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_DA of the Snowball Turkish script - confirm.
        private Among a_6[] = {
            new Among ( "da", -1, -1, "", this),
            new Among ( "ta", -1, -1, "", this),
            new Among ( "de", -1, -1, "", this),
            new Among ( "te", -1, -1, "", this)
        };

        // Among table a_7: "nda" and "nde". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_ndA of the Snowball Turkish script - confirm.
        private Among a_7[] = {
            new Among ( "nda", -1, -1, "", this),
            new Among ( "nde", -1, -1, "", this)
        };

        // Among table a_8: d/t followed by "an"/"en" ("dan", "tan", "den", "ten").
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_DAn of the Snowball Turkish script - confirm.
        private Among a_8[] = {
            new Among ( "dan", -1, -1, "", this),
            new Among ( "tan", -1, -1, "", this),
            new Among ( "den", -1, -1, "", this),
            new Among ( "ten", -1, -1, "", this)
        };

        // Among table a_9: "ndan" and "nden". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_ndAn of the Snowball Turkish script - confirm.
        private Among a_9[] = {
            new Among ( "ndan", -1, -1, "", this),
            new Among ( "nden", -1, -1, "", this)
        };

        // Among table a_10: "la" and "le". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_ylA of the Snowball Turkish script - confirm.
        private Among a_10[] = {
            new Among ( "la", -1, -1, "", this),
            new Among ( "le", -1, -1, "", this)
        };

        // Among table a_11: "ca" and "ce". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_ncA of the Snowball Turkish script - confirm.
        private Among a_11[] = {
            new Among ( "ca", -1, -1, "", this),
            new Among ( "ce", -1, -1, "", this)
        };

        // Among table a_12: i, u, U+00FC (u-umlaut) or U+0131 (dotless i) followed by "m".
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_yUm of the Snowball Turkish script - confirm.
        private Among a_12[] = {
            new Among ( "im", -1, -1, "", this),
            new Among ( "um", -1, -1, "", this),
            new Among ( "\u00FCm", -1, -1, "", this),
            new Among ( "\u0131m", -1, -1, "", this)
        };

        // Among table a_13: "s" + (i, u, U+00FC u-umlaut, U+0131 dotless i) + "n".
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_sUn of the Snowball Turkish script - confirm.
        private Among a_13[] = {
            new Among ( "sin", -1, -1, "", this),
            new Among ( "sun", -1, -1, "", this),
            new Among ( "s\u00FCn", -1, -1, "", this),
            new Among ( "s\u0131n", -1, -1, "", this)
        };

        // Among table a_14: i, u, U+00FC (u-umlaut) or U+0131 (dotless i) followed by "z".
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_yUz of the Snowball Turkish script - confirm.
        private Among a_14[] = {
            new Among ( "iz", -1, -1, "", this),
            new Among ( "uz", -1, -1, "", this),
            new Among ( "\u00FCz", -1, -1, "", this),
            new Among ( "\u0131z", -1, -1, "", this)
        };

        // Among table a_15: "siniz", "sunuz" and the same pattern spelled with U+00FC
        // (u-umlaut) or U+0131 (dotless i) in both vowel positions.
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_sUnUz of the Snowball Turkish script - confirm.
        private Among a_15[] = {
            new Among ( "siniz", -1, -1, "", this),
            new Among ( "sunuz", -1, -1, "", this),
            new Among ( "s\u00FCn\u00FCz", -1, -1, "", this),
            new Among ( "s\u0131n\u0131z", -1, -1, "", this)
        };

        // Among table a_16: "lar" and "ler". Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_lAr of the Snowball Turkish script - confirm.
        private Among a_16[] = {
            new Among ( "lar", -1, -1, "", this),
            new Among ( "ler", -1, -1, "", this)
        };

        // Among table a_17: "n" + (i, u, U+00FC u-umlaut, U+0131 dotless i) + "z".
        // The same four strings also appear in a_0. Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_nUz of the Snowball Turkish script - confirm.
        private Among a_17[] = {
            new Among ( "niz", -1, -1, "", this),
            new Among ( "nuz", -1, -1, "", this),
            new Among ( "n\u00FCz", -1, -1, "", this),
            new Among ( "n\u0131z", -1, -1, "", this)
        };

        // Among table a_18 (8 entries): d/t + (i, u, U+00FC u-umlaut, U+0131 dotless i) + "r".
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_DUr of the Snowball Turkish script - confirm.
        private Among a_18[] = {
            new Among ( "dir", -1, -1, "", this),
            new Among ( "tir", -1, -1, "", this),
            new Among ( "dur", -1, -1, "", this),
            new Among ( "tur", -1, -1, "", this),
            new Among ( "d\u00FCr", -1, -1, "", this),
            new Among ( "t\u00FCr", -1, -1, "", this),
            new Among ( "d\u0131r", -1, -1, "", this),
            new Among ( "t\u0131r", -1, -1, "", this)
        };

        // Among table a_19: "cas" + U+0131 (dotless i) + "na", and "cesine".
        // Both entries pass -1, -1, "", this.
        // NOTE(review): presumably used by mark_cAsInA of the Snowball Turkish script - confirm.
        private Among a_19[] = {
            new Among ( "cas\u0131na", -1, -1, "", this),
            new Among ( "cesine", -1, -1, "", this)
        };

        // Among table a_20 (32 entries): d/t + (i, u, U+00FC u-umlaut, U+0131 dotless i),
        // either bare or followed by "k", "m" or "n". Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_yDU of the Snowball Turkish script - confirm.
        private Among a_20[] = {
            new Among ( "di", -1, -1, "", this),
            new Among ( "ti", -1, -1, "", this),
            new Among ( "dik", -1, -1, "", this),
            new Among ( "tik", -1, -1, "", this),
            new Among ( "duk", -1, -1, "", this),
            new Among ( "tuk", -1, -1, "", this),
            new Among ( "d\u00FCk", -1, -1, "", this),
            new Among ( "t\u00FCk", -1, -1, "", this),
            new Among ( "d\u0131k", -1, -1, "", this),
            new Among ( "t\u0131k", -1, -1, "", this),
            new Among ( "dim", -1, -1, "", this),
            new Among ( "tim", -1, -1, "", this),
            new Among ( "dum", -1, -1, "", this),
            new Among ( "tum", -1, -1, "", this),
            new Among ( "d\u00FCm", -1, -1, "", this),
            new Among ( "t\u00FCm", -1, -1, "", this),
            new Among ( "d\u0131m", -1, -1, "", this),
            new Among ( "t\u0131m", -1, -1, "", this),
            new Among ( "din", -1, -1, "", this),
            new Among ( "tin", -1, -1, "", this),
            new Among ( "dun", -1, -1, "", this),
            new Among ( "tun", -1, -1, "", this),
            new Among ( "d\u00FCn", -1, -1, "", this),
            new Among ( "t\u00FCn", -1, -1, "", this),
            new Among ( "d\u0131n", -1, -1, "", this),
            new Among ( "t\u0131n", -1, -1, "", this),
            new Among ( "du", -1, -1, "", this),
            new Among ( "tu", -1, -1, "", this),
            new Among ( "d\u00FC", -1, -1, "", this),
            new Among ( "t\u00FC", -1, -1, "", this),
            new Among ( "d\u0131", -1, -1, "", this),
            new Among ( "t\u0131", -1, -1, "", this)
        };

        // Among table a_21 (8 entries): "sa"/"se", either bare or followed by "k", "m" or "n".
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_ysA of the Snowball Turkish script - confirm.
        private Among a_21[] = {
            new Among ( "sa", -1, -1, "", this),
            new Among ( "se", -1, -1, "", this),
            new Among ( "sak", -1, -1, "", this),
            new Among ( "sek", -1, -1, "", this),
            new Among ( "sam", -1, -1, "", this),
            new Among ( "sem", -1, -1, "", this),
            new Among ( "san", -1, -1, "", this),
            new Among ( "sen", -1, -1, "", this)
        };

        // Among table a_22: "m" + (i, u, U+00FC u-umlaut, U+0131 dotless i) + U+015F (s-cedilla).
        // Every entry passes -1, -1, "", this.
        // NOTE(review): presumably used by mark_ymUs_ of the Snowball Turkish script - confirm.
        private Among a_22[] = {
            new Among ( "mi\u015F", -1, -1, "", this),
            new Among ( "mu\u015F", -1, -1, "", this),
            new Among ( "m\u00FC\u015F", -1, -1, "", this),
            new Among ( "m\u0131\u015F", -1, -1, "", this)
        };

        // Among table a_23: the single consonants "b", "c", "d" and U+011F (g-breve).
        // Unlike the other tables in this file, the third constructor argument is distinct
        // per entry (1, 2, 3, 4) instead of -1.
        // NOTE(review): presumably the value returned by the among lookup to select a
        // per-consonant action (post_process_last_consonants in the Snowball Turkish script);
        // the consuming code is outside this view - confirm.
        private Among a_23[] = {
            new Among ( "b", -1, 1, "", this),
            new Among ( "c", -1, 2, "", this),
            new Among ( "d", -1, 3, "", this),
            new Among ( "\u011F", -1, 4, "", this)
        };

        // Character-group tables. The visible callers pass them to in_grouping_b together with
        // a (min, max) code-point range.
        // NOTE(review): presumably Snowball bitmaps - one bit per character counted from the
        // range minimum, eight characters per array element; confirm against
        // SnowballProgram.in_grouping_b, which is not visible here. The letter sets listed
        // below are derived under that assumption.

        // Used by r_check_vowel_harmony with range 97..305.
        // Presumed set: a, e, i, o, u, U+00F6 (o-umlaut), U+00FC (u-umlaut), U+0131 (dotless i).
        private static final char g_vowel[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 32, 8, 0, 0, 0, 0, 0, 0, 1 };

        // Not referenced in the visible part of the file, so its range is unknown here.
        private static final char g_U[] = {1, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 0, 0, 0, 0, 0, 1 };

        // Used by r_check_vowel_harmony with range 97..305 after the literal "a" matched.
        // Presumed set: a, o, u, U+0131 (dotless i).
        private static final char g_vowel1[] = {1, 64, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1 };

        // Used by r_check_vowel_harmony with range 101..252 after the literal "e" matched.
        // Presumed set: e, i, U+00F6 (o-umlaut), U+00FC (u-umlaut).
        private static final char g_vowel2[] = {17, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 130 };

        // Used by r_check_vowel_harmony with range 97..305 after the literal U+0131 matched.
        // Presumed set: a, U+0131 (dotless i).
        private static final char g_vowel3[] = {1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1 };

        // Used by r_check_vowel_harmony with range 101..105 after the literal "i" matched.
        // Presumed set: e, i.
        private static final char g_vowel4[] = {17 };

        // Not referenced in the visible part of the file, so its range is unknown here.
        private static final char g_vowel5[] = {65 };

        // Same contents as g_vowel5; not referenced in the visible part of the file.
        private static final char g_vowel6[] = {65 };

        // Per-instance stemmer state. The only use visible in this part of the file is
        // copy_from, which copies both values from another turkishStemmer.
        // NOTE(review): the names suggest a "keep stemming noun suffixes" flag and a string
        // length counter; the code that sets and reads them is outside this view - confirm.
        private boolean B_continue_stemming_noun_suffixes;
        private int I_strlen;

        /**
         * Makes this stemmer mirror {@code other}: first the two fields declared by this
         * class are copied, then the inherited {@code copy_from} is invoked for the state
         * held by the superclass.
         *
         * @param other the stemmer whose state is copied into this instance
         */
        private void copy_from(turkishStemmer other) {
            this.I_strlen = other.I_strlen;
            this.B_continue_stemming_noun_suffixes = other.B_continue_stemming_noun_suffixes;
            // Superclass state is delegated last, exactly as before.
            super.copy_from(other);
        }

        private boolean r_check_vowel_harmony() {
            int v_1;
            int v_2;
            int v_3;
            int v_4;
            int v_5;
            int v_6;
            int v_7;
            int v_8;
            int v_9;
            int v_10;
            int v_11;
            // (, line 111
            // test, line 112
            v_1 = limit - cursor;
            // (, line 113
            // (, line 114
            // goto, line 114
            golab0: while(true)
            {
                v_2 = limit - cursor;
                lab1: do {
                    if (!(in_grouping_b(g_vowel, 97, 305)))
                    {
                        break lab1;
                    }
                    cursor = limit - v_2;
                    break golab0;
                } while (false);
                cursor = limit - v_2;
                if (cursor <= limit_backward)
                {
                    return false;
                }
                cursor--;
            }
            // (, line 115
            // or, line 116
            lab2: do {
                v_3 = limit - cursor;
                lab3: do {
                    // (, line 116
                    // literal, line 116
                    if (!(eq_s_b(1, "a")))
                    {
                        break lab3;
                    }
                    // goto, line 116
                    golab4: while(true)
                    {
                        v_4 = limit - cursor;
                        lab5: do {
                            if (!(in_grouping_b(g_vowel1, 97, 305)))
                            {
                                break lab5;
                            }
                            cursor = limit - v_4;
                            break golab4;
                        } while (false);
                        cursor = limit - v_4;
                        if (cursor <= limit_backward)
                        {
                            break lab3;
                        }
                        cursor--;
                    }
                    break lab2;
                } while (false);
                cursor = limit - v_3;
                lab6: do {
                    // (, line 117
                    // literal, line 117
                    if (!(eq_s_b(1, "e")))
                    {
                        break lab6;
                    }
                    // goto, line 117
                    golab7: while(true)
                    {
                        v_5 = limit - cursor;
                        lab8: do {
                            if (!(in_grouping_b(g_vowel2, 101, 252)))
                            {
                                break lab8;
                            }
                            cursor = limit - v_5;
                            break golab7;
                        } while (false);
                        cursor = limit - v_5;
                        if (cursor <= limit_backward)
                        {
                            break lab6;
                        }
                        cursor--;
                    }
                    break lab2;
                } while (false);
                cursor = limit - v_3;
                lab9: do {
                    // (, line 118
                    // literal, line 118
                    if (!(eq_s_b(1, "\u0131")))
                    {
                        break lab9;
                    }
                    // goto, line 118
                    golab10: while(true)
                    {
                        v_6 = limit - cursor;
                        lab11: do {
                            if (!(in_grouping_b(g_vowel3, 97, 305)))
                            {
                                break lab11;
                            }
                            cursor = limit - v_6;
                            break golab10;
                        } while (false);
                        cursor = limit - v_6;
                        if (cursor <= limit_backward)
                        {
                            break lab9;
                        }
                        cursor--;
                    }
                    break lab2;
                } while (false);
                cursor = limit - v_3;
                lab12: do {
                    // (, line 119
                    // literal, line 119
                    if (!(eq_s_b(1, "i")))
                    {
                        break lab12;
                    }
                    // goto, line 119
                    golab13: while(true)
                    {
                        v_7 = limit - cursor;
                        lab14: do {
                            if (!(in_grouping_b(g_vowel4, 101, 105)))
                            {

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -