unicoderange.cpp

来自「linux下开源浏览器WebKit的源码,市面上的很多商用浏览器都是移植自Web」· C++ 代码 · 共 463 行 · 第 1/2 页

CPP

463 行

/* * Copyright (C) 2007 Apple Computer, Inc. * * Portions are Copyright (C) 1998 Netscape Communications Corporation. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA * * Alternatively, the contents of this file may be used under the terms * of either the Mozilla Public License Version 1.1, found at * http://www.mozilla.org/MPL/ (the "MPL") or the GNU General Public * License Version 2.0, found at http://www.fsf.org/copyleft/gpl.html * (the "GPL"), in which case the provisions of the MPL or the GPL are * applicable instead of those above.  If you wish to allow use of your * version of this file only under the terms of one of those two * licenses (the MPL or the GPL) and not to allow others to use your * version of this file under the LGPL, indicate your decision by * deletingthe provisions above and replace them with the notice and * other provisions required by the MPL or the GPL, as the case may be. * If you do not delete the provisions above, a recipient may use your * version of this file under any of the LGPL, the MPL or the GPL. */#include "config.h"#include "UnicodeRange.h"namespace WebCore {// This table depends on unicode range definitions. // Each item's index must correspond to a unicode range value// eg. x-cyrillic = LangGroupTable[cRangeCyrillic]static const char* gUnicodeRangeToLangGroupTable[] = {  "x-cyrillic",  "el",  "tr",  "he",  "ar",  "x-baltic",  "th",  "ko",  "ja",  "zh-CN",  "zh-TW",  "x-devanagari",  "x-tamil",  "x-armn",  "x-beng",  "x-cans",  "x-ethi",  "x-geor",  "x-gujr",  "x-guru",  "x-khmr",  "x-mlym"};/********************************************************************** * Unicode subranges as defined in unicode 3.0 * x-western, x-central-euro, tr, x-baltic  -> latin  *  0000 - 036f  *  1e00 - 1eff *  2000 - 206f  (general punctuation) *  20a0 - 20cf  (currency symbols) *  2100 - 214f  (letterlike symbols) *  2150 - 218f  (Number Forms) * el         -> greek *  0370 - 03ff *  1f00 - 1fff * x-cyrillic -> cyrillic *  0400 - 04ff * he         -> hebrew *  0590 - 05ff * ar         -> arabic *  0600 - 06ff *  fb50 - fdff (arabic presentation forms) *  fe70 - feff (arabic presentation forms b) * th - thai *  0e00 - 0e7f * ko        -> korean *  ac00 - d7af  (hangul Syllables) *  1100 - 11ff    (jamo) *  3130 - 318f (hangul compatibility jamo) * ja *  3040 - 309f (hiragana) *  30a0 - 30ff (katakana) * zh-CN * zh-TW * * CJK *  3100 - 312f (bopomofo) *  31a0 - 31bf (bopomofo extended) *  3000 - 303f (CJK Symbols and Punctuation)  *  2e80 - 2eff (CJK radicals supplement) *  2f00 - 2fdf (Kangxi Radicals) *  2ff0 - 2fff (Ideographic Description Characters) *  3190 - 319f (kanbun) *  3200 - 32ff (Enclosed CJK letters and Months) *  3300 - 33ff (CJK compatibility) *  3400 - 4dbf (CJK Unified Ideographs Extension A) *  4e00 - 9faf (CJK Unified Ideographs) *  f900 - fa5f (CJK Compatibility Ideographs) *  fe30 - fe4f (CJK compatibility Forms) *  ff00 - ffef (halfwidth and fullwidth forms) * * Armenian *  0530 - 058f  * Sriac  *  0700 - 074f * Thaana *  0780 - 07bf * Devanagari *  0900 - 097f * Bengali *  0980 - 09ff * Gurmukhi *  0a00 - 0a7f * Gujarati *  0a80 - 0aff * Oriya *  0b00 - 0b7f * Tamil *  0b80 - 0bff * Telugu *  0c00 - 0c7f * Kannada *  0c80 - 0cff * Malayalam *  0d00 - 0d7f * Sinhala *  0d80 - 0def * Lao *  0e80 - 0eff * Tibetan *  0f00 - 0fbf * Myanmar *  1000 - 109f * Georgian *  10a0 - 10ff * Ethiopic *  1200 - 137f * Cherokee *  13a0 - 13ff * Canadian Aboriginal Syllabics *  1400 - 167f * Ogham *  1680 - 169f * Runic  *  16a0 - 16ff * Khmer *  1780 - 17ff * Mongolian *  1800 - 18af * Misc - superscripts and subscripts *  2070 - 209f * Misc - Combining Diacritical Marks for Symbols *  20d0 - 20ff * Misc - Arrows *  2190 - 21ff * Misc - Mathematical Operators *  2200 - 22ff * Misc - Miscellaneous Technical *  2300 - 23ff * Misc - Control picture *  2400 - 243f * Misc - Optical character recognition *  2440 - 2450 * Misc - Enclose Alphanumerics *  2460 - 24ff * Misc - Box Drawing  *  2500 - 257f * Misc - Block Elements *  2580 - 259f * Misc - Geometric Shapes *  25a0 - 25ff * Misc - Miscellaneous Symbols *  2600 - 267f * Misc - Dingbats *  2700 - 27bf * Misc - Braille Patterns *  2800 - 28ff * Yi Syllables *  a000 - a48f * Yi radicals *  a490 - a4cf * Alphabetic Presentation Forms *  fb00 - fb4f * Misc - Combining half Marks *  fe20 - fe2f * Misc - small form variants *  fe50 - fe6f * Misc - Specials *  fff0 - ffff *********************************************************************/static const unsigned cNumSubTables = 9;static const unsigned cSubTableSize = 16;static const unsigned char gUnicodeSubrangeTable[cNumSubTables][cSubTableSize] = {   { // table for X---    cRangeTableBase+1,  //u0xxx    cRangeTableBase+2,  //u1xxx    cRangeTableBase+3,  //u2xxx    cRangeSetCJK,       //u3xxx    cRangeSetCJK,       //u4xxx    cRangeSetCJK,       //u5xxx    cRangeSetCJK,       //u6xxx    cRangeSetCJK,       //u7xxx    cRangeSetCJK,       //u8xxx    cRangeSetCJK,       //u9xxx    cRangeTableBase+4,  //uaxxx    cRangeKorean,       //ubxxx    cRangeKorean,       //ucxxx    cRangeTableBase+5,  //udxxx    cRangePrivate,      //uexxx    cRangeTableBase+6   //ufxxx  },  { //table for 0X--    cRangeSetLatin,          //u00xx    cRangeSetLatin,          //u01xx

unicoderange.cpp - 源码说明

本页面展示了「linux下开源浏览器WebKit的源码,市面上的很多商用浏览器都是移植自WebKit」中的 unicoderange.cpp 源码文件，采用 C++ 编程语言编写，共 463 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。

虫虫下载站收录了大量与WebKit相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。

⌨️ 快捷键说明

复制代码Ctrl + C

搜索代码Ctrl + F

全屏模式F11

增大字号Ctrl + =

减小字号Ctrl + -

显示快捷键?