arabicligaturizer.java

来自「源码包含生成 PDF 和 HTML 的类库」· Java 代码 · 共 775 行 · 第 1/3 页

JAVA
775
字号
/*
 * Copyright 2003 by Paulo Soares.
 *
 * The contents of this file are subject to the Mozilla Public License Version 1.1
 * (the "License"); you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at http://www.mozilla.org/MPL/
 *
 * Software distributed under the License is distributed on an "AS IS" basis,
 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
 * for the specific language governing rights and limitations under the License.
 *
 * The Original Code is 'iText, a free JAVA-PDF library'.
 *
 * The Initial Developer of the Original Code is Bruno Lowagie. Portions created by
 * the Initial Developer are Copyright (C) 1999, 2000, 2001, 2002 by Bruno Lowagie.
 * All Rights Reserved.
 * Co-Developer of the code is Paulo Soares. Portions created by the Co-Developer
 * are Copyright (C) 2000, 2001, 2002 by Paulo Soares. All Rights Reserved.
 *
 * Contributor(s): all the names of the contributors are added in the source code
 * where applicable.
 *
 * Alternatively, the contents of this file may be used under the terms of the
 * LGPL license (the "GNU LIBRARY GENERAL PUBLIC LICENSE"), in which case the
 * provisions of LGPL are applicable instead of those above.  If you wish to
 * allow use of your version of this file only under the terms of the LGPL
 * License and not to allow others to use your version of this file under
 * the MPL, indicate your decision by deleting the provisions above and
 * replace them with the notice and other provisions required by the LGPL.
 * If you do not delete the provisions above, a recipient may use your version
 * of this file under either the MPL or the GNU LIBRARY GENERAL PUBLIC LICENSE.
 *
 * This library is free software; you can redistribute it and/or modify it
 * under the terms of the MPL as stated above or under the terms of the GNU
 * Library General Public License as published by the Free Software Foundation;
 * either version 2 of the License, or any later version.
 *
 * This library is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 * FOR A PARTICULAR PURPOSE. See the GNU Library general Public License for more
 * details.
 *
 * If you didn't download this code from the following link, you should check if
 * you aren't using an obsolete version:
 * http://www.lowagie.com/iText/
 */
package com.lowagie.text.pdf;

/**
 * Shape arabic characters. This code was inspired by an LGPL'ed C library:
 * Pango ( see http://www.pango.com/ ). Note that the code of this is the
 * original work of Paulo Soares. Hence it is perfectly justifiable to distribute
 * it under the MPL.
 *
 * @author Paulo Soares (psoares@consiste.pt)
 */
public class ArabicLigaturizer {

    /**
     * Tells whether a character is treated as a vowel mark by the shaper.
     *
     * @param s the character to test
     * @return <CODE>true</CODE> when <CODE>s</CODE> lies in U+064B..U+0655
     *         or equals U+0670
     */
    static boolean isVowel(char s) {
        return ((s >= 0x064B) && (s <= 0x0655)) || (s == 0x0670);
    }

    /**
     * Binary-searches <CODE>chartable</CODE> for the row whose first element
     * equals <CODE>s</CODE>. Shared by {@link #charshape(char, int)} and
     * {@link #shapecount(char)}.
     * <P>
     * NOTE(review): the search assumes the rows of <CODE>chartable</CODE>
     * (declared outside this excerpt) are sorted ascending by their first
     * element - confirm against the table definition.
     *
     * @param s the character to look up
     * @return the index of the matching row, or -1 when there is none
     */
    private static int findChartableRow(char s) {
        int low = 0;
        int high = chartable.length - 1;
        while (low <= high) {
            // Unsigned shift keeps the midpoint correct even if low + high overflows.
            int mid = (low + high) >>> 1;
            if (s == chartable[mid][0]) {
                return mid;
            }
            if (s < chartable[mid][0]) {
                high = mid - 1;
            }
            else {
                low = mid + 1;
            }
        }
        return -1;
    }

    /**
     * Returns the requested contextual shape of a character.
     * <P>
     * Characters in U+0621..U+06D3 are looked up in <CODE>chartable</CODE>;
     * characters in U+FEF5..U+FEFB are offset by <CODE>which</CODE>. Anything
     * else, or a character missing from the table, is returned unchanged.
     *
     * @param s the character to shape
     * @param which 0=isolated 1=final 2=initial 3=medial
     * @return the shaped character, or <CODE>s</CODE> itself when no shape applies
     */
    static char charshape(char s, int which) {
        if ((s >= 0x0621) && (s <= 0x06D3)) {
            int row = findChartableRow(s);
            if (row >= 0) {
                // Column 0 holds the base character, the shapes start at column 1.
                return chartable[row][which + 1];
            }
        }
        else if (s >= 0xfef5 && s <= 0xfefb) {
            return (char)(s + which);
        }
        return s;
    }

    /**
     * Returns the number of shapes available for a character.
     *
     * @param s the character to inspect
     * @return the number of shape columns of the matching <CODE>chartable</CODE>
     *         row for a non-vowel character in U+0621..U+06D3, 4 for
     *         <CODE>ZWJ</CODE>, and 1 in every other case
     */
    static int shapecount(char s) {
        if ((s >= 0x0621) && (s <= 0x06D3) && !isVowel(s)) {
            int row = findChartableRow(s);
            if (row >= 0) {
                return chartable[row].length - 1;
            }
        }
        else if (s == ZWJ) {
            return 4;
        }
        return 1;
    }

    /**
     * Tries to merge <CODE>newchar</CODE> into the character being built in
     * <CODE>oldchar</CODE>. On success <CODE>oldchar</CODE> is modified in place
     * (its <CODE>basechar</CODE>, <CODE>mark1</CODE>, <CODE>vowel</CODE>,
     * <CODE>lignum</CODE> and/or <CODE>numshapes</CODE> fields).
     *
     * @param newchar the character that follows <CODE>oldchar</CODE>
     * @param oldchar the character structure to merge into
     * @return 0 == no ligature possible; 1 == vowel; 2 == two chars; 3 == Lam+Alef
     */
    static int ligature(char newchar, charstruct oldchar) {
        int retval = 0;

        // Nothing to attach to yet.
        if (oldchar.basechar == 0)
            return 0;

        if (isVowel(newchar)) {
            retval = 1;
            if ((oldchar.vowel != 0) && (newchar != SHADDA)) {
                retval = 2;           /* we eliminate the old vowel .. */
            }
            switch (newchar) {
                case SHADDA:
                    if (oldchar.mark1 == 0) {
                        oldchar.mark1 = SHADDA;
                    }
                    else {
                        return 0;         /* no ligature possible */
                    }
                    break;
                case HAMZABELOW:
                    switch (oldchar.basechar) {
                        case ALEF:
                            oldchar.basechar = ALEFHAMZABELOW;
                            retval = 2;
                            break;
                        case LAM_ALEF:
                            oldchar.basechar = LAM_ALEFHAMZABELOW;
                            retval = 2;
                            break;
                        default:
                            oldchar.mark1 = HAMZABELOW;
                            break;
                    }
                    break;
                case HAMZAABOVE:
                    switch (oldchar.basechar) {
                        case ALEF:
                            oldchar.basechar = ALEFHAMZA;
                            retval = 2;
                            break;
                        case LAM_ALEF:
                            oldchar.basechar = LAM_ALEFHAMZA;
                            retval = 2;
                            break;
                        case WAW:
                            oldchar.basechar = WAWHAMZA;
                            retval = 2;
                            break;
                        case YEH:
                        case ALEFMAKSURA:
                        case FARSIYEH:
                            oldchar.basechar = YEHHAMZA;
                            retval = 2;
                            break;
                        default:           /* whatever sense this may make .. */
                            oldchar.mark1 = HAMZAABOVE;
                            break;
                    }
                    break;
                case MADDA:
                    // Only Alef combines with a Madda; on any other base the mark is dropped.
                    switch (oldchar.basechar) {
                        case ALEF:
                            oldchar.basechar = ALEFMADDA;
                            retval = 2;
                            break;
                    }
                    break;
                default:
                    oldchar.vowel = newchar;
                    break;
            }
            // A mark that was added (rather than fused or substituted) occupies one more slot.
            if (retval == 1) {
                oldchar.lignum++;
            }
            return retval;
        }

        if (oldchar.vowel != 0) {  /* if we already joined a vowel, we can't join a Hamza */
            return 0;
        }

        // basechar is known to be non-zero here (see the guard at the top),
        // so Lam is the only base that can still form a ligature.
        if (oldchar.basechar == LAM) {
            switch (newchar) {
                case ALEF:
                    oldchar.basechar = LAM_ALEF;
                    oldchar.numshapes = 2;
                    retval = 3;
                    break;
                case ALEFHAMZA:
                    oldchar.basechar = LAM_ALEFHAMZA;
                    oldchar.numshapes = 2;
                    retval = 3;
                    break;
                case ALEFHAMZABELOW:
                    oldchar.basechar = LAM_ALEFHAMZABELOW;
                    oldchar.numshapes = 2;
                    retval = 3;
                    break;
                case ALEFMADDA:
                    oldchar.basechar = LAM_ALEFMADDA;
                    oldchar.numshapes = 2;
                    retval = 3;
                    break;
            }
        }
        return retval;
    }

    /**
     * Appends a shaped character structure to the output buffer.
     * <P>
     * The base character is always written. <CODE>mark1</CODE> and
     * <CODE>vowel</CODE> are written only when the <CODE>ar_novowel</CODE> bit is
     * not set in <CODE>level</CODE>. <CODE>s.lignum</CODE> is decremented once
     * for the base character and once for each of <CODE>mark1</CODE> and
     * <CODE>vowel</CODE> that is present, whether or not it was written. Any
     * count left in <CODE>s.lignum</CODE> afterwards is not consumed here.
     * Nothing happens when <CODE>s.basechar</CODE> is 0.
     *
     * @param string the buffer to append to
     * @param s a shaped charstruct; its <CODE>lignum</CODE> field is modified
     * @param level option bits; only <CODE>ar_novowel</CODE> is examined
     */
    static void copycstostring(StringBuffer string, charstruct s, int level) {
        if (s.basechar == 0)
            return;

        string.append(s.basechar);
        s.lignum--;

        boolean keepMarks = (level & ar_novowel) == 0;
        if (s.mark1 != 0) {
            if (keepMarks) {
                string.append(s.mark1);
            }
            s.lignum--;
        }
        if (s.vowel != 0) {
            if (keepMarks) {
                string.append(s.vowel);
            }
            s.lignum--;                   /* also counted on vowel elimination */
        }
    }

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?