📄 gen_wctype.c
字号:
/* widtht[c/4] |= (wcwidth(c) << ((c & 3) << 1)); */ if (c & 1) { /* Use the high nibble for odd numbered wchars. */ d <<= 4; } wct[c/2] |= d; l = (long)(int) towlower(c) - c; u = (long)(int) towupper(c) - c; ult[c] = 0; if (l || u) { if ((l != (short)l) || (u != (short)u)) { printf("range assumption error! %x %ld %ld\n", c, l, u); return EXIT_FAILURE; } for (i=0 ; i < ul_count ; i++) { if ((l == uldiff[i].l) && (u == uldiff[i].u)) { goto found; } } uldiff[ul_count].l = l; uldiff[ul_count].u = u; ++ul_count; if (ul_count > MAXTO) { printf("too many touppers/tolowers!\n"); return EXIT_FAILURE; } found: ult[c] = i; } } for (i = 0 ; i < 16 ; i++) { printf("typecount[%2d] = %8ld %s\n", i, typecount[i], typename[i]); } printf("optimizing is* table..\n"); n = -1; smallest = SIZE_MAX; cttable.ii = NULL; for (i=0 ; i < 14 ; i++) { t = newopt(wct, (RANGE/2)+1, i, &cttable); if (smallest >= t) { n = i; smallest = t;/* } else { *//* break; */ } } printf("smallest = %zu\n", smallest); if (!(cttable.ii = malloc(smallest))) { printf("couldn't allocate space!\n"); return EXIT_FAILURE; } smallest = SIZE_MAX; newopt(wct, (RANGE/2)+1, n, &cttable); ++cttable.ti_shift; /* correct for nibble mode */ printf("optimizing u/l-to table..\n"); smallest = SIZE_MAX; ultable.ii = NULL; for (i=0 ; i < 14 ; i++) { t = newopt(ult, RANGE+1, i, &ultable); if (smallest >= t) { n = i; smallest = t;/* } else { *//* break; */ } } printf("%zu (smallest) + %zu (u/l diffs) = %zu\n", smallest, 4 * ul_count, smallest + 4 * ul_count); printf("smallest = %zu\n", smallest); if (!(ultable.ii = malloc(smallest))) { printf("couldn't allocate space!\n"); return EXIT_FAILURE; } smallest = SIZE_MAX; newopt(ult, RANGE+1, n, &ultable);#if 0 printf("optimizing comb table..\n"); smallest = SIZE_MAX; combtable.ii = NULL; for (i=0 ; i < 14 ; i++) { t = newopt(combt, sizeof(combt), i, &combtable); if (smallest >= t) { n = i; smallest = t;/* } else { *//* break; */ } } printf("smallest = %zu\n", smallest); if 
(!(combtable.ii = malloc(smallest))) { printf("couldn't allocate space!\n"); return EXIT_FAILURE; } smallest = SIZE_MAX; newopt(combt, sizeof(combt), n, &combtable); combtable.ti_shift += 4; /* correct for 4 entries per */#endif#if 0 printf("optimizing width table..\n"); smallest = SIZE_MAX; widthtable.ii = NULL; for (i=0 ; i < 14 ; i++) { t = newopt(widtht, sizeof(widtht), i, &widthtable); if (smallest >= t) { n = i; smallest = t;/* } else { *//* break; */ } } printf("smallest = %zu\n", smallest); if (!(widthtable.ii = malloc(smallest))) { printf("couldn't allocate space!\n"); return EXIT_FAILURE; } smallest = SIZE_MAX; newopt(widtht, sizeof(widtht), n, &widthtable); widthtable.ti_shift += 4; /* correct for 4 entries per */#endif#if 0 printf("optimizing comb3 table..\n"); smallest = SIZE_MAX; comb3table.ii = NULL; for (i=0 ; i < 14 ; i++) { t = newopt(comb3t, sizeof(comb3t), i, &comb3table); if (smallest >= t) { n = i; smallest = t;/* } else { *//* break; */ } } printf("smallest = %zu\n", smallest); if (!(comb3table.ii = malloc(smallest))) { printf("couldn't allocate space!\n"); return EXIT_FAILURE; } smallest = SIZE_MAX; newopt(comb3t, sizeof(comb3t), n, &comb3table); comb3table.ti_shift += 8; /* correct for 4 entries per */#endif dump_table_data(&cttable); dump_table_data(&ultable); dump_table_data(&combtable); } printf("verifying for %s...\n", *argv);#if RANGE == 0xffffU for (c=0 ; c <= 0xffffUL ; c++)#else for (c=0 ; c <= 0x10ffffUL ; c++)#endif { unsigned int glibc; unsigned int mine; unsigned int upper, lower;#if 0#if RANGE < 0x10000UL if (c == 0x10000UL) { c = 0x30000UL; /* skip 1st and 2nd sup planes */ }#elif RANGE < 0x20000UL if (c == 0x20000UL) { c = 0x30000UL; /* skip 2nd sup planes */ }#endif#endif glibc = 0; if (iswalnum(c)) ++glibc; glibc <<= 1; if (iswalpha(c)) ++glibc; glibc <<= 1; if (iswblank(c)) ++glibc; glibc <<= 1; if (iswcntrl(c)) ++glibc; glibc <<= 1; if (iswdigit(c)) ++glibc; glibc <<= 1; if (iswgraph(c)) ++glibc; glibc <<= 1; if 
(iswlower(c)) ++glibc; glibc <<= 1; if (iswprint(c)) ++glibc; glibc <<= 1; if (iswpunct(c)) ++glibc; glibc <<= 1; if (iswspace(c)) ++glibc; glibc <<= 1; if (iswupper(c)) ++glibc; glibc <<= 1; if (iswxdigit(c)) ++glibc; { unsigned int u; int n, sc; int i0, i1; u = c; if (u <= RANGE) { sc = u & ((1 << cttable.ti_shift) - 1); u >>= cttable.ti_shift; n = u & ((1 << cttable.ii_shift) - 1); u >>= cttable.ii_shift; i0 = cttable.ii[u]; i0 <<= cttable.ii_shift; i1 = cttable.ti[i0 + n]; i1 <<= (cttable.ti_shift-1); d = cttable.ut[i1 + (sc >> 1)]; if (sc & 1) { d >>= 4; } d &= 0x0f; } else if ((((unsigned int)(c - 0xe0020UL)) <= 0x5f) || (c == 0xe0001UL)){ d = __CTYPE_punct; } else if (((unsigned int)(c - 0xf0000UL)) < 0x20000UL) { if ((c & 0xffffU) <= 0xfffdU) { d = __CTYPE_punct; } else { d = __CTYPE_unclassified; } } else { d = __CTYPE_unclassified; } mine = 0; if (mywalnum(c)) ++mine; mine <<= 1; if (mywalpha(c)) ++mine; mine <<= 1; if (mywblank(c)) ++mine; mine <<= 1; if (mywcntrl(c)) ++mine; mine <<= 1; if (mywdigit(c)) ++mine; mine <<= 1; if (mywgraph(c)) ++mine; mine <<= 1; if (mywlower(c)) ++mine; mine <<= 1; if (mywprint(c)) ++mine; mine <<= 1; if (mywpunct(c)) ++mine; mine <<= 1; if (mywspace(c)) ++mine; mine <<= 1; if (mywupper(c)) ++mine; mine <<= 1; if (mywxdigit(c)) ++mine; if (glibc != mine) { printf("%#8x : glibc %#4x != %#4x mine %d\n", c, glibc, mine, d); if (c < 0x30000UL) { printf("sc=%#x u=%#x n=%#x i0=%#x i1=%#x\n", sc, u, n, i0, i1); } } upper = lower = u = c; if (u <= RANGE) { sc = u & ((1 << ultable.ti_shift) - 1); u >>= ultable.ti_shift; n = u & ((1 << ultable.ii_shift) - 1); u >>= ultable.ii_shift; i0 = ultable.ii[u]; i0 <<= ultable.ii_shift; i1 = ultable.ti[i0 + n]; i1 <<= (ultable.ti_shift); i1 += sc; i0 = ultable.ut[i1]; upper = c + uldiff[i0].u; lower = c + uldiff[i0].l; } if (towupper(c) != upper) { printf("%#8x : towupper glibc %#4x != %#4x mine\n", c, towupper(c), upper); } if (towlower(c) != lower) { printf("%#8x : towlower glibc %#4x != 
%#4x mine i0 = %d\n", c, towlower(c), lower, i0); } if (totitle && ((tt = towctrans(c, totitle)) != upper)) { printf("%#8x : totitle glibc %#4lx != %#4x mine i0 = %d\n", c, tt, upper, i0); } } if ((c & 0xfff) == 0xfff) printf("."); } printf("done\n"); } if (1) { FILE *fp; if (!(fp = fopen("wctables.h", "w"))) { printf("couldn't open wctables.h!\n"); return EXIT_FAILURE; } fprintf(fp, "#define __LOCALE_DATA_WC_TABLE_DOMAIN_MAX %#8lx\n\n", (unsigned long) RANGE); output_table(fp, "ctype", &cttable); output_table(fp, "uplow", &ultable); #warning fix the upper bound on the upper/lower tables... save 200 bytes or so fprintf(fp, "#define __LOCALE_DATA_WCuplow_diffs %7u\n", ul_count); fprintf(fp, "\n#ifdef WANT_WCuplow_diff_data\n\n"); fprintf(fp, "\nstatic const short __LOCALE_DATA_WCuplow_diff_data[%zu] = {", 2 * (size_t) ul_count); for (i=0 ; i < ul_count ; i++) { if (i % 4 == 0) { fprintf(fp, "\n"); } fprintf(fp, " %6d, %6d,", uldiff[i].u, uldiff[i].l); } fprintf(fp, "\n};\n\n"); fprintf(fp, "#endif /* WANT_WCuplow_diff_data */\n\n");/* output_table(fp, "comb", &combtable); *//* output_table(fp, "width", &widthtable); */ fclose(fp); } return EXIT_SUCCESS;}

/*
 * newopt - size, and optionally emit, a block-deduplicated lookup table.
 *
 * The input table `ut` (usize bytes) is cut into blocks of (1 << shift)
 * bytes.  Identical blocks are stored once, and an index of one byte per
 * block records which unique block each original block maps to.  On the
 * outermost call the index itself is compressed the same way by a single
 * recursive call, giving the three arrays ii -> ti -> ut held in `tbl`.
 *
 * Parameters:
 *   ut     table to compress.
 *   usize  number of bytes in `ut`; a trailing partial block is ignored
 *          (numblocks = usize >> shift).
 *   shift  log2 of the block size to try.
 *   tbl    output descriptor.  While tbl->ii is NULL the call only
 *          computes sizes.  When tbl->ii is non-NULL the arrays are written
 *          back to back starting at tbl->ii, so the buffer has to hold at
 *          least the size returned by a previous sizing call with the same
 *          arguments.
 *
 * Returns the total byte count of the smallest layout found for this
 * `shift`, or SIZE_MAX when the blocks cannot be indexed by one byte
 * (more than 255 distinct blocks).
 *
 * Not reentrant: uses the static `recurse` flag and the file-level `nu_val`.
 * NOTE(review): `ti` and `uit` are RANGE+1 element automatic arrays and the
 * function recurses once, so stack usage is considerable.
 */
size_t newopt(unsigned char *ut, size_t usize, int shift, table_data *tbl)
{
	static int recurse = 0;		/* non-zero while inside the index-level call */
	unsigned char *ti[RANGE+1];	/* pointers to the blocks of ut, sorted by content */
	unsigned char uit[RANGE+1];	/* per original block: id of its unique block */
	int uniqblock[256];		/* per unique id: position in ti[] of its first block */
	unsigned char *ii_save = NULL;
	size_t blocksize = (size_t)1 << shift;
	size_t numblocks = usize >> shift;
	size_t uniq;
	size_t smallest, t;
	size_t i, j;
	int shift2 = -1;		/* best index-level shift found, -1 if none */

	/* Point ti[] at consecutive blocks of ut. */
	for (i = j = 0 ; i < numblocks ; i++) {
		ti[i] = ut + j;
		j += blocksize;
	}

	/*
	 * Sort the block pointers by block content.  nu_memcmp is defined
	 * elsewhere in this file; presumably it compares nu_val bytes.
	 */
	nu_val = blocksize;
	qsort(ti, numblocks, sizeof(unsigned char *), nu_memcmp);

	/*
	 * Walk the sorted blocks, numbering distinct contents from 0.
	 * The first sorted block is unique id 0; record it explicitly so that
	 * uniqblock[0] is defined when the unique blocks are copied out below.
	 */
	uniq = 1;
	uniqblock[0] = 0;
	uit[(ti[0]-ut)/blocksize] = 0;
	for (i = 1 ; i < numblocks ; i++) {
		int cmp = memcmp(ti[i-1], ti[i], blocksize);

		if (cmp < 0) {
			if (++uniq > 255) {
				break;		/* ids must fit in an unsigned char */
			}
			uniqblock[uniq - 1] = i;
		} else if (cmp > 0) {
			/* Sanity check: the sort order disagrees with memcmp. */
			printf("bad sort %zu!\n", i);
			abort();
		}
		uit[(ti[i]-ut)/blocksize] = uniq - 1;
	}

	if (uniq > 255) {
		return SIZE_MAX;
	}

	/* Cost with an uncompressed index: one byte per block + unique data. */
	smallest = numblocks + uniq * blocksize;

	if (!recurse) {
		/*
		 * Outermost level: try compressing the index (uit) as well, for
		 * every shift that still leaves at least two index blocks.
		 */
		++recurse;
		for (j = 1 ; j < 14 ; j++) {
			if ((numblocks >> j) < 2) {
				break;
			}
			/* Hide the output buffer so the trial call only sizes. */
			if (tbl) {
				ii_save = tbl->ii;
				tbl->ii = NULL;
			}
			if ((t = newopt(uit, numblocks, (int)j, tbl)) < SIZE_MAX) {
				t += uniq * blocksize;
			}
			if (tbl) {
				tbl->ii = ii_save;
			}
			if (smallest >= t) {	/* ties go to the larger index shift */
				shift2 = (int)j;
				smallest = t;
				if (!tbl || !tbl->ii) {
					printf("ishift %d tshift %d size %zu\n",
					       shift2, shift, t);
				}
			}
		}
		--recurse;
	}

	if (tbl && tbl->ii) {
		if (recurse) {
			/* Index level: write ii (block ids) followed by ti. */
			tbl->ii_shift = shift;
			tbl->ii_len = numblocks;
			memcpy(tbl->ii, uit, numblocks);
			tbl->ti = tbl->ii + tbl->ii_len;
			tbl->ti_len = uniq * blocksize;
			for (i = 0 ; i < uniq ; i++) {
				memcpy(tbl->ti + i * blocksize, ti[uniqblock[i]], blocksize);
			}
		} else {
			/*
			 * Data level: let the recursive call emit ii/ti from uit,
			 * then append the unique data blocks as ut.
			 */
			if (shift2 < 0) {
				/* No index split was selected; 1 << -1 would be undefined. */
				printf("no usable index shift for tshift %d!\n", shift);
				abort();
			}
			++recurse;
			printf("setting ishift %d tshift %d\n", shift2, shift);
			newopt(uit, numblocks, shift2, tbl);
			--recurse;
			tbl->ti_shift = shift;
			tbl->ut_len = uniq * blocksize;
			tbl->ut = tbl->ti + tbl->ti_len;
			for (i = 0 ; i < uniq ; i++) {
				memcpy(tbl->ut + i * blocksize, ti[uniqblock[i]], blocksize);
			}
		}
	}

	return smallest;
}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -