blob: 3ba58f7af99cc77a8b6bb2f2ab3389818e900eee [file] [log] [blame]
Jungshik Shin87232d82017-05-13 21:10:13 -07001// © 2016 and later: Unicode, Inc. and others.
Jungshik Shin5feb9ad2016-10-21 12:52:48 -07002// License & terms of use: http://www.unicode.org/copyright.html
jshin@chromium.org6f31ac32014-03-26 22:15:14 +00003/*
4*******************************************************************************
5*
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -08006* Copyright (C) 2004-2014, International Business Machines
jshin@chromium.org6f31ac32014-03-26 22:15:14 +00007* Corporation and others. All Rights Reserved.
8*
9*******************************************************************************
10* file name: ubidi_props.c
Jungshik Shin87232d82017-05-13 21:10:13 -070011* encoding: UTF-8
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000012* tab size: 8 (not used)
13* indentation:4
14*
15* created on: 2004dec30
16* created by: Markus W. Scherer
17*
18* Low-level Unicode bidi/shaping properties access.
19*/
20
21#include "unicode/utypes.h"
22#include "unicode/uset.h"
23#include "unicode/udata.h" /* UDataInfo */
24#include "ucmndata.h" /* DataHeader */
25#include "udatamem.h"
26#include "uassert.h"
27#include "cmemory.h"
28#include "utrie2.h"
29#include "ubidi_props.h"
30#include "ucln_cmn.h"
31
32struct UBiDiProps {
33 UDataMemory *mem;
34 const int32_t *indexes;
35 const uint32_t *mirrors;
36 const uint8_t *jgArray;
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -080037 const uint8_t *jgArray2;
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000038
39 UTrie2 trie;
40 uint8_t formatVersion[4];
41};
42
43/* ubidi_props_data.h is machine-generated by genbidi --csource */
44#define INCLUDED_FROM_UBIDI_PROPS_C
45#include "ubidi_props_data.h"
46
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000047/* set of property starts for UnicodeSet ------------------------------------ */
48
49static UBool U_CALLCONV
50_enumPropertyStartsRange(const void *context, UChar32 start, UChar32 end, uint32_t value) {
Jungshik Shin87232d82017-05-13 21:10:13 -070051 (void)end;
52 (void)value;
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000053 /* add the start code point to the USet */
54 const USetAdder *sa=(const USetAdder *)context;
55 sa->add(sa->set, start);
Frank Tang1f164ee2022-11-08 12:31:27 -080056 return true;
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000057}
58
59U_CFUNC void
Jungshik Shinf61e46d2018-05-04 13:00:45 -070060ubidi_addPropertyStarts(const USetAdder *sa, UErrorCode *pErrorCode) {
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000061 int32_t i, length;
62 UChar32 c, start, limit;
63
64 const uint8_t *jgArray;
65 uint8_t prev, jg;
66
67 if(U_FAILURE(*pErrorCode)) {
68 return;
69 }
70
71 /* add the start code point of each same-value range of the trie */
Jungshik Shinf61e46d2018-05-04 13:00:45 -070072 utrie2_enum(&ubidi_props_singleton.trie, NULL, _enumPropertyStartsRange, sa);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000073
74 /* add the code points from the bidi mirroring table */
Jungshik Shinf61e46d2018-05-04 13:00:45 -070075 length=ubidi_props_singleton.indexes[UBIDI_IX_MIRROR_LENGTH];
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000076 for(i=0; i<length; ++i) {
Jungshik Shinf61e46d2018-05-04 13:00:45 -070077 c=UBIDI_GET_MIRROR_CODE_POINT(ubidi_props_singleton.mirrors[i]);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000078 sa->addRange(sa->set, c, c+1);
79 }
80
81 /* add the code points from the Joining_Group array where the value changes */
Jungshik Shinf61e46d2018-05-04 13:00:45 -070082 start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START];
83 limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT];
84 jgArray=ubidi_props_singleton.jgArray;
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -080085 for(;;) {
86 prev=0;
87 while(start<limit) {
88 jg=*jgArray++;
89 if(jg!=prev) {
90 sa->add(sa->set, start);
91 prev=jg;
92 }
93 ++start;
jshin@chromium.org6f31ac32014-03-26 22:15:14 +000094 }
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -080095 if(prev!=0) {
96 /* add the limit code point if the last value was not 0 (it is now start==limit) */
97 sa->add(sa->set, limit);
98 }
Jungshik Shinf61e46d2018-05-04 13:00:45 -070099 if(limit==ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT]) {
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -0800100 /* switch to the second Joining_Group range */
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700101 start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START2];
102 limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT2];
103 jgArray=ubidi_props_singleton.jgArray2;
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -0800104 } else {
105 break;
106 }
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000107 }
108
109 /* add code points with hardcoded properties, plus the ones following them */
110
111 /* (none right now) */
112}
113
114/* property access functions ------------------------------------------------ */
115
116U_CFUNC int32_t
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700117ubidi_getMaxValue(UProperty which) {
118 int32_t max=ubidi_props_singleton.indexes[UBIDI_MAX_VALUES_INDEX];
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000119 switch(which) {
120 case UCHAR_BIDI_CLASS:
121 return (max&UBIDI_CLASS_MASK);
122 case UCHAR_JOINING_GROUP:
123 return (max&UBIDI_MAX_JG_MASK)>>UBIDI_MAX_JG_SHIFT;
124 case UCHAR_JOINING_TYPE:
125 return (max&UBIDI_JT_MASK)>>UBIDI_JT_SHIFT;
126 case UCHAR_BIDI_PAIRED_BRACKET_TYPE:
127 return (max&UBIDI_BPT_MASK)>>UBIDI_BPT_SHIFT;
128 default:
129 return -1; /* undefined */
130 }
131}
132
133U_CAPI UCharDirection
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700134ubidi_getClass(UChar32 c) {
135 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000136 return (UCharDirection)UBIDI_GET_CLASS(props);
137}
138
139U_CFUNC UBool
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700140ubidi_isMirrored(UChar32 c) {
141 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000142 return (UBool)UBIDI_GET_FLAG(props, UBIDI_IS_MIRRORED_SHIFT);
143}
144
145static UChar32
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700146getMirror(UChar32 c, uint16_t props) {
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000147 int32_t delta=UBIDI_GET_MIRROR_DELTA(props);
148 if(delta!=UBIDI_ESC_MIRROR_DELTA) {
149 return c+delta;
150 } else {
151 /* look for mirror code point in the mirrors[] table */
152 const uint32_t *mirrors;
153 uint32_t m;
154 int32_t i, length;
155 UChar32 c2;
156
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700157 mirrors=ubidi_props_singleton.mirrors;
158 length=ubidi_props_singleton.indexes[UBIDI_IX_MIRROR_LENGTH];
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000159
160 /* linear search */
161 for(i=0; i<length; ++i) {
162 m=mirrors[i];
163 c2=UBIDI_GET_MIRROR_CODE_POINT(m);
164 if(c==c2) {
165 /* found c, return its mirror code point using the index in m */
166 return UBIDI_GET_MIRROR_CODE_POINT(mirrors[UBIDI_GET_MIRROR_INDEX(m)]);
167 } else if(c<c2) {
168 break;
169 }
170 }
171
172 /* c not found, return it itself */
173 return c;
174 }
175}
176
177U_CFUNC UChar32
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700178ubidi_getMirror(UChar32 c) {
179 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
180 return getMirror(c, props);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000181}
182
183U_CFUNC UBool
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700184ubidi_isBidiControl(UChar32 c) {
185 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000186 return (UBool)UBIDI_GET_FLAG(props, UBIDI_BIDI_CONTROL_SHIFT);
187}
188
189U_CFUNC UBool
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700190ubidi_isJoinControl(UChar32 c) {
191 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000192 return (UBool)UBIDI_GET_FLAG(props, UBIDI_JOIN_CONTROL_SHIFT);
193}
194
195U_CFUNC UJoiningType
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700196ubidi_getJoiningType(UChar32 c) {
197 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000198 return (UJoiningType)((props&UBIDI_JT_MASK)>>UBIDI_JT_SHIFT);
199}
200
201U_CFUNC UJoiningGroup
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700202ubidi_getJoiningGroup(UChar32 c) {
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000203 UChar32 start, limit;
204
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700205 start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START];
206 limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT];
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000207 if(start<=c && c<limit) {
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700208 return (UJoiningGroup)ubidi_props_singleton.jgArray[c-start];
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000209 }
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700210 start=ubidi_props_singleton.indexes[UBIDI_IX_JG_START2];
211 limit=ubidi_props_singleton.indexes[UBIDI_IX_JG_LIMIT2];
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -0800212 if(start<=c && c<limit) {
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700213 return (UJoiningGroup)ubidi_props_singleton.jgArray2[c-start];
Jungshik Shin (jungshik at google)0f8746a2015-01-08 15:46:45 -0800214 }
215 return U_JG_NO_JOINING_GROUP;
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000216}
217
218U_CFUNC UBidiPairedBracketType
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700219ubidi_getPairedBracketType(UChar32 c) {
220 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000221 return (UBidiPairedBracketType)((props&UBIDI_BPT_MASK)>>UBIDI_BPT_SHIFT);
222}
223
224U_CFUNC UChar32
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700225ubidi_getPairedBracket(UChar32 c) {
226 uint16_t props=UTRIE2_GET16(&ubidi_props_singleton.trie, c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000227 if((props&UBIDI_BPT_MASK)==0) {
228 return c;
229 } else {
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700230 return getMirror(c, props);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000231 }
232}
233
234/* public API (see uchar.h) ------------------------------------------------- */
235
236U_CFUNC UCharDirection
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700237u_charDirection(UChar32 c) {
238 return ubidi_getClass(c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000239}
240
241U_CFUNC UBool
242u_isMirrored(UChar32 c) {
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700243 return ubidi_isMirrored(c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000244}
245
246U_CFUNC UChar32
247u_charMirror(UChar32 c) {
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700248 return ubidi_getMirror(c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000249}
250
Frank Tangf90543d2020-10-30 19:02:04 -0700251U_CAPI UChar32 U_EXPORT2
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000252u_getBidiPairedBracket(UChar32 c) {
Jungshik Shinf61e46d2018-05-04 13:00:45 -0700253 return ubidi_getPairedBracket(c);
jshin@chromium.org6f31ac32014-03-26 22:15:14 +0000254}