123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254 |
- // © 2016 and later: Unicode, Inc. and others.
- // License & terms of use: http://www.unicode.org/copyright.html
- /*
- *******************************************************************************
- *
- * Copyright (C) 2004-2014, International Business Machines
- * Corporation and others. All Rights Reserved.
- *
- *******************************************************************************
- * file name: ubidi_props.c
- * encoding: UTF-8
- * tab size: 8 (not used)
- * indentation:4
- *
- * created on: 2004dec30
- * created by: Markus W. Scherer
- *
- * Low-level Unicode bidi/shaping properties access.
- */
- #include "unicode/utypes.h"
- #include "unicode/uset.h"
- #include "unicode/udata.h" /* UDataInfo */
- #include "ucmndata.h" /* DataHeader */
- #include "udatamem.h"
- #include "uassert.h"
- #include "cmemory.h"
- #include "utrie2.h"
- #include "ubidi_props.h"
- #include "ucln_cmn.h"
- struct UBiDiProps {
- UDataMemory *mem;
- const int32_t *indexes;
- const uint32_t *mirrors;
- const uint8_t *jgArray;
- const uint8_t *jgArray2;
- UTrie2 trie;
- uint8_t formatVersion[4];
- };
- /* ubidi_props_data.h is machine-generated by genbidi --csource */
- #define INCLUDED_FROM_UBIDI_PROPS_C
- #include "ubidi_props_data.h"
- /* set of property starts for UnicodeSet ------------------------------------ */
- static UBool U_CALLCONV
- _enumPropertyStartsRange(const void *context, UChar32 start, UChar32 end, uint32_t value) {
- (void)end;
- (void)value;
- /* add the start code point to the USet */
- const USetAdder *sa=(const USetAdder *)context;
- sa->add(sa->set, start);
- return true;
- }
- U_CFUNC void
- ubidi_addPropertyStarts(const USetAdder *sa, UErrorCode *pErrorCode) {
- int32_t i, length;
- UChar32 c, start, limit;
- const uint8_t *jgArray;
- uint8_t prev, jg;
- if(U_FAILURE(*pErrorCode)) {
- return;
- }
- /* add the start code point of each same-value range of the trie */
- utrie2_enum(&ubidi_props_singleton.trie, nullptr, _enumPropertyStartsRange, sa);
- /* add the code points from the bidi mirroring table */
- length=ubidi_props_singleton.indexes[UBIDI_IX_MIRROR_LENGTH];
- for(i=0; i<length; ++i) {
- c=UBIDI_GET_MIRROR_CODE_POINT(ubidi_props_singleton.mirrors[i]);
- sa->addRange(sa->set, c, c+1);
- }
- /* add the code points from the Joining_Group array where the value changes */
- start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START];
- limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT];
- jgArray=ubidi_props_singleton.jgArray;
- for(;;) {
- prev=0;
- while(start<limit) {
- jg=*jgArray++;
- if(jg!=prev) {
- sa->add(sa->set, start);
- prev=jg;
- }
- ++start;
- }
- if(prev!=0) {
- /* add the limit code point if the last value was not 0 (it is now start==limit) */
- sa->add(sa->set, limit);
- }
- if(limit==ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT]) {
- /* switch to the second Joining_Group range */
- start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START2];
- limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT2];
- jgArray=ubidi_props_singleton.jgArray2;
- } else {
- break;
- }
- }
- /* add code points with hardcoded properties, plus the ones following them */
- /* (none right now) */
- }
- /* property access functions ------------------------------------------------ */
- U_CFUNC int32_t
- ubidi_getMaxValue(UProperty which) {
- int32_t max=ubidi_props_singleton.indexes[UBIDI_MAX_VALUES_INDEX];
- switch(which) {
- case UCHAR_BIDI_CLASS:
- return (max&UBIDI_CLASS_MASK);
- case UCHAR_JOINING_GROUP:
- return (max&UBIDI_MAX_JG_MASK)>>UBIDI_MAX_JG_SHIFT;
- case UCHAR_JOINING_TYPE:
- return (max&UBIDI_JT_MASK)>>UBIDI_JT_SHIFT;
- case UCHAR_BIDI_PAIRED_BRACKET_TYPE:
- return (max&UBIDI_BPT_MASK)>>UBIDI_BPT_SHIFT;
- default:
- return -1; /* undefined */
- }
- }
- U_CAPI UCharDirection
- ubidi_getClass(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return (UCharDirection)UBIDI_GET_CLASS(props);
- }
- U_CFUNC UBool
- ubidi_isMirrored(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return (UBool)UBIDI_GET_FLAG(props, UBIDI_IS_MIRRORED_SHIFT);
- }
- static UChar32
- getMirror(UChar32 c, uint16_t props) {
- int32_t delta=UBIDI_GET_MIRROR_DELTA(props);
- if(delta!=UBIDI_ESC_MIRROR_DELTA) {
- return c+delta;
- } else {
- /* look for mirror code point in the mirrors[] table */
- const uint32_t *mirrors;
- uint32_t m;
- int32_t i, length;
- UChar32 c2;
- mirrors=ubidi_props_singleton.mirrors;
- length=ubidi_props_singleton.indexes[UBIDI_IX_MIRROR_LENGTH];
- /* linear search */
- for(i=0; i<length; ++i) {
- m=mirrors[i];
- c2=UBIDI_GET_MIRROR_CODE_POINT(m);
- if(c==c2) {
- /* found c, return its mirror code point using the index in m */
- return UBIDI_GET_MIRROR_CODE_POINT(mirrors[UBIDI_GET_MIRROR_INDEX(m)]);
- } else if(c<c2) {
- break;
- }
- }
- /* c not found, return it itself */
- return c;
- }
- }
- U_CFUNC UChar32
- ubidi_getMirror(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return getMirror(c, props);
- }
- U_CFUNC UBool
- ubidi_isBidiControl(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return (UBool)UBIDI_GET_FLAG(props, UBIDI_BIDI_CONTROL_SHIFT);
- }
- U_CFUNC UBool
- ubidi_isJoinControl(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return (UBool)UBIDI_GET_FLAG(props, UBIDI_JOIN_CONTROL_SHIFT);
- }
- U_CFUNC UJoiningType
- ubidi_getJoiningType(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return (UJoiningType)((props&UBIDI_JT_MASK)>>UBIDI_JT_SHIFT);
- }
- U_CFUNC UJoiningGroup
- ubidi_getJoiningGroup(UChar32 c) {
- UChar32 start, limit;
- start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START];
- limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT];
- if(start<=c && c<limit) {
- return (UJoiningGroup)ubidi_props_singleton.jgArray[c-start];
- }
- start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START2];
- limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT2];
- if(start<=c && c<limit) {
- return (UJoiningGroup)ubidi_props_singleton.jgArray2[c-start];
- }
- return U_JG_NO_JOINING_GROUP;
- }
- U_CFUNC UBidiPairedBracketType
- ubidi_getPairedBracketType(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- return (UBidiPairedBracketType)((props&UBIDI_BPT_MASK)>>UBIDI_BPT_SHIFT);
- }
- U_CFUNC UChar32
- ubidi_getPairedBracket(UChar32 c) {
- uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
- if((props&UBIDI_BPT_MASK)==0) {
- return c;
- } else {
- return getMirror(c, props);
- }
- }
- /* public API (see uchar.h) ------------------------------------------------- */
- U_CFUNC UCharDirection
- u_charDirection(UChar32 c) {
- return ubidi_getClass(c);
- }
- U_CFUNC UBool
- u_isMirrored(UChar32 c) {
- return ubidi_isMirrored(c);
- }
- U_CFUNC UChar32
- u_charMirror(UChar32 c) {
- return ubidi_getMirror(c);
- }
- U_CAPI UChar32 U_EXPORT2
- u_getBidiPairedBracket(UChar32 c) {
- return ubidi_getPairedBracket(c);
- }
|