Nigel Tao | a4f2bbb | 2020-07-28 14:15:24 +1000 | [diff] [blame] | 1 | // After editing this file, run "go generate" in the ../data directory. |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 2 | |
| 3 | // Copyright 2020 The Wuffs Authors. |
| 4 | // |
| 5 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 6 | // you may not use this file except in compliance with the License. |
| 7 | // You may obtain a copy of the License at |
| 8 | // |
| 9 | // https://www.apache.org/licenses/LICENSE-2.0 |
| 10 | // |
| 11 | // Unless required by applicable law or agreed to in writing, software |
| 12 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 13 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 14 | // See the License for the specific language governing permissions and |
| 15 | // limitations under the License. |
| 16 | |
| 17 | // ---------------- Tokens |
| 18 | |
Nigel Tao | 478d1b8 | 2020-04-08 23:03:51 +1000 | [diff] [blame] | 19 | // wuffs_base__token is an element of a byte stream's tokenization. |
| 20 | // |
Nigel Tao | 2f2bbc6 | 2021-01-25 11:30:15 +1100 | [diff] [blame^] | 21 | // See https://github.com/google/wuffs/blob/main/doc/note/tokens.md |
typedef struct wuffs_base__token__struct {
  // The packed 64-bit representation. The wuffs_base__token__etc accessor
  // functions extract individual bit-fields from it.
  uint64_t repr;

#ifdef __cplusplus
  // C++ convenience methods. Each one forwards this token to the C function
  // whose name is wuffs_base__token__ followed by the method name.
  inline int64_t value() const;
  inline int64_t value_extension() const;
  inline int64_t value_major() const;
  inline int64_t value_base_category() const;
  inline uint64_t value_minor() const;
  inline uint64_t value_base_detail() const;
  inline int64_t value_base_detail__sign_extended() const;
  inline bool continued() const;
  inline uint64_t length() const;
#endif  // __cplusplus

} wuffs_base__token;
| 38 | |
| 39 | static inline wuffs_base__token // |
| 40 | wuffs_base__make_token(uint64_t repr) { |
| 41 | wuffs_base__token ret; |
| 42 | ret.repr = repr; |
| 43 | return ret; |
| 44 | } |
| 45 | |
Nigel Tao | f45f01f | 2020-06-05 14:06:56 +1000 | [diff] [blame] | 46 | // -------- |
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 47 | |
// WUFFS_BASE__TOKEN__LENGTH__MAX_INCL is the inclusive maximum of a token's
// length: the largest value that survives the 0xFFFF mask applied by
// wuffs_base__token__length.
#define WUFFS_BASE__TOKEN__LENGTH__MAX_INCL 0xFFFF

// Each FOO__SHIFT is the bit position, within the 64-bit repr, of the least
// significant bit of the FOO field. Most of the wuffs_base__token__foo
// accessors right-shift repr by the corresponding amount.
#define WUFFS_BASE__TOKEN__VALUE__SHIFT 17
#define WUFFS_BASE__TOKEN__VALUE_EXTENSION__SHIFT 17
#define WUFFS_BASE__TOKEN__VALUE_MAJOR__SHIFT 42
#define WUFFS_BASE__TOKEN__VALUE_MINOR__SHIFT 17
#define WUFFS_BASE__TOKEN__VALUE_BASE_CATEGORY__SHIFT 38
#define WUFFS_BASE__TOKEN__VALUE_BASE_DETAIL__SHIFT 17
#define WUFFS_BASE__TOKEN__CONTINUED__SHIFT 16
#define WUFFS_BASE__TOKEN__LENGTH__SHIFT 0

// NOTE(review): presumably the bit width of the value_extension field -
// confirm against doc/note/tokens.md. None of the accessors visible in this
// part of the file read it.
#define WUFFS_BASE__TOKEN__VALUE_EXTENSION__NUM_BITS 46
| 60 | |
Nigel Tao | f45f01f | 2020-06-05 14:06:56 +1000 | [diff] [blame] | 61 | // -------- |
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 62 | |
// The VBC (value base category) constants.
//
// NOTE(review): presumably these are the values that
// wuffs_base__token__value_base_category returns for a simple token - confirm
// against doc/note/tokens.md.
#define WUFFS_BASE__TOKEN__VBC__FILLER 0
#define WUFFS_BASE__TOKEN__VBC__STRUCTURE 1
#define WUFFS_BASE__TOKEN__VBC__STRING 2
#define WUFFS_BASE__TOKEN__VBC__UNICODE_CODE_POINT 3
#define WUFFS_BASE__TOKEN__VBC__LITERAL 4
#define WUFFS_BASE__TOKEN__VBC__NUMBER 5
#define WUFFS_BASE__TOKEN__VBC__INLINE_INTEGER_SIGNED 6
#define WUFFS_BASE__TOKEN__VBC__INLINE_INTEGER_UNSIGNED 7
Nigel Tao | a9d1488 | 2020-02-25 12:12:31 +1100 | [diff] [blame] | 71 | |
Nigel Tao | f45f01f | 2020-06-05 14:06:56 +1000 | [diff] [blame] | 72 | // -------- |
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 73 | |
// VBD (value base detail) bits for the FILLER category. Each of the first
// three constants is a single, distinct bit.
#define WUFFS_BASE__TOKEN__VBD__FILLER__PUNCTUATION 0x00001
#define WUFFS_BASE__TOKEN__VBD__FILLER__COMMENT_BLOCK 0x00002
#define WUFFS_BASE__TOKEN__VBD__FILLER__COMMENT_LINE 0x00004

// COMMENT_ANY is a bit-wise or of COMMENT_BLOCK and COMMENT_LINE.
#define WUFFS_BASE__TOKEN__VBD__FILLER__COMMENT_ANY 0x00006
| 80 | |
Nigel Tao | f45f01f | 2020-06-05 14:06:56 +1000 | [diff] [blame] | 81 | // -------- |
Nigel Tao | 85fba7f | 2020-02-29 16:28:06 +1100 | [diff] [blame] | 82 | |
// VBD (value base detail) bits for the STRUCTURE category. Every constant is
// a single, distinct bit, grouped by hex digit: PUSH/POP in the lowest digit,
// the FROM_ETC bits in the next digit and the TO_ETC bits in the fourth digit.
//
// NOTE(review): presumably FROM_ETC and TO_ETC name the container kind being
// left and entered - confirm against doc/note/tokens.md.
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__PUSH 0x00001
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__POP 0x00002
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__FROM_NONE 0x00010
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__FROM_LIST 0x00020
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__FROM_DICT 0x00040
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__TO_NONE 0x01000
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__TO_LIST 0x02000
#define WUFFS_BASE__TOKEN__VBD__STRUCTURE__TO_DICT 0x04000
| 91 | |
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 92 | // -------- |
| 93 | |
// DEFINITELY_FOO means that the destination bytes (and also the source bytes,
// for 1_DST_1_SRC_COPY) are in the FOO format. Definitely means that the lack
// of the bit means "maybe FOO". It does not necessarily mean "not FOO".
//
// CHAIN_ETC means that decoding the entire token chain forms a UTF-8 or ASCII
// string, not just this current token. CHAIN_ETC_UTF_8 therefore distinguishes
// Unicode (UTF-8) strings from byte strings. MUST means that the token
// producer (e.g. parser) must verify this. SHOULD means that the token
// consumer (e.g. renderer) should verify this.
//
// When a CHAIN_ETC_UTF_8 bit is set, the parser must ensure that non-ASCII
// code points (with multi-byte UTF-8 encodings) do not straddle token
// boundaries. Checking UTF-8 validity can inspect each token separately.
//
// The lack of any particular bit is conservative: it is valid for all-ASCII
// strings, in a single- or multi-token chain, to have none of these bits set.
#define WUFFS_BASE__TOKEN__VBD__STRING__DEFINITELY_UTF_8 0x00001
#define WUFFS_BASE__TOKEN__VBD__STRING__CHAIN_MUST_BE_UTF_8 0x00002
#define WUFFS_BASE__TOKEN__VBD__STRING__CHAIN_SHOULD_BE_UTF_8 0x00004
#define WUFFS_BASE__TOKEN__VBD__STRING__DEFINITELY_ASCII 0x00010
#define WUFFS_BASE__TOKEN__VBD__STRING__CHAIN_MUST_BE_ASCII 0x00020
#define WUFFS_BASE__TOKEN__VBD__STRING__CHAIN_SHOULD_BE_ASCII 0x00040

// CONVERT_D_DST_S_SRC means that multiples of S source bytes (possibly padded)
// produce multiples of D destination bytes. For example,
// CONVERT_1_DST_4_SRC_BACKSLASH_X means a source like "\\x23\\x67\\xAB", where
// 12 src bytes encode 3 dst bytes.
//
// Post-processing may further transform those D destination bytes (e.g. treat
// "\\xFF" as the Unicode code point U+00FF instead of the byte 0xFF), but that
// is out of scope of this VBD's semantics.
//
// When src is the empty string, multiple conversion algorithms are applicable
// (so these bits are not necessarily mutually exclusive), all producing the
// same empty dst string.
//
// The highest of these bits, 0x10000, still fits within the 21-bit 0x1FFFFF
// mask that wuffs_base__token__value_base_detail applies.
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_0_DST_1_SRC_DROP 0x00100
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_1_DST_1_SRC_COPY 0x00200
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_1_DST_2_SRC_HEXADECIMAL 0x00400
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_1_DST_4_SRC_BACKSLASH_X 0x00800
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_3_DST_4_SRC_BASE_64_STD 0x01000
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_3_DST_4_SRC_BASE_64_URL 0x02000
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_4_DST_5_SRC_ASCII_85 0x04000
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_5_DST_8_SRC_BASE_32_HEX 0x08000
#define WUFFS_BASE__TOKEN__VBD__STRING__CONVERT_5_DST_8_SRC_BASE_32_STD 0x10000
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 138 | |
Nigel Tao | f45f01f | 2020-06-05 14:06:56 +1000 | [diff] [blame] | 139 | // -------- |
Nigel Tao | a9d1488 | 2020-02-25 12:12:31 +1100 | [diff] [blame] | 140 | |
// VBD (value base detail) bits for the LITERAL category. Each constant is a
// single, distinct bit.
#define WUFFS_BASE__TOKEN__VBD__LITERAL__UNDEFINED 0x00001
#define WUFFS_BASE__TOKEN__VBD__LITERAL__NULL 0x00002
#define WUFFS_BASE__TOKEN__VBD__LITERAL__FALSE 0x00004
#define WUFFS_BASE__TOKEN__VBD__LITERAL__TRUE 0x00008
| 145 | |
Nigel Tao | f45f01f | 2020-06-05 14:06:56 +1000 | [diff] [blame] | 146 | // -------- |
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 147 | |
// For a source string of "123" or "0x9A", it is valid for a tokenizer to
// return any combination of:
//  - WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_FLOATING_POINT.
//  - WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_INTEGER_SIGNED.
//  - WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_INTEGER_UNSIGNED.
//
// For a source string of "+123" or "-0x9A", only the first two are valid.
//
// For a source string of "123.", only the first one is valid.
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_FLOATING_POINT 0x00001
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_INTEGER_SIGNED 0x00002
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_INTEGER_UNSIGNED 0x00004

// NOTE(review): presumably these flag tokens whose content is a negative or
// positive infinity or NaN - confirm against doc/note/tokens.md.
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_NEG_INF 0x00010
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_POS_INF 0x00020
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_NEG_NAN 0x00040
#define WUFFS_BASE__TOKEN__VBD__NUMBER__CONTENT_POS_NAN 0x00080

// The number 300 might be represented as "\x01\x2C", "\x2C\x01\x00\x00" or
// "300", which are big-endian, little-endian or text. For binary formats, the
// token length (after adjusting for FORMAT_IGNORE_ETC) discriminates
// e.g. u16 little-endian vs u32 little-endian.
#define WUFFS_BASE__TOKEN__VBD__NUMBER__FORMAT_BINARY_BIG_ENDIAN 0x00100
#define WUFFS_BASE__TOKEN__VBD__NUMBER__FORMAT_BINARY_LITTLE_ENDIAN 0x00200
#define WUFFS_BASE__TOKEN__VBD__NUMBER__FORMAT_TEXT 0x00400

// The only FORMAT_IGNORE_ETC bit defined here.
#define WUFFS_BASE__TOKEN__VBD__NUMBER__FORMAT_IGNORE_FIRST_BYTE 0x01000
| 175 | |
Nigel Tao | 9d4eeb7 | 2020-02-26 11:36:30 +1100 | [diff] [blame] | 176 | // -------- |
Nigel Tao | a9d1488 | 2020-02-25 12:12:31 +1100 | [diff] [blame] | 177 | |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 178 | // wuffs_base__token__value returns the token's high 46 bits, sign-extended. A |
| 179 | // negative value means an extended token, non-negative means a simple token. |
| 180 | static inline int64_t // |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 181 | wuffs_base__token__value(const wuffs_base__token* t) { |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 182 | return ((int64_t)(t->repr)) >> WUFFS_BASE__TOKEN__VALUE__SHIFT; |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 183 | } |
| 184 | |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 185 | // wuffs_base__token__value_extension returns a negative value if the token was |
| 186 | // not an extended token. |
| 187 | static inline int64_t // |
| 188 | wuffs_base__token__value_extension(const wuffs_base__token* t) { |
| 189 | return (~(int64_t)(t->repr)) >> WUFFS_BASE__TOKEN__VALUE_EXTENSION__SHIFT; |
| 190 | } |
| 191 | |
| 192 | // wuffs_base__token__value_major returns a negative value if the token was not |
| 193 | // a simple token. |
| 194 | static inline int64_t // |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 195 | wuffs_base__token__value_major(const wuffs_base__token* t) { |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 196 | return ((int64_t)(t->repr)) >> WUFFS_BASE__TOKEN__VALUE_MAJOR__SHIFT; |
| 197 | } |
| 198 | |
| 199 | // wuffs_base__token__value_base_category returns a negative value if the token |
| 200 | // was not a simple token. |
| 201 | static inline int64_t // |
| 202 | wuffs_base__token__value_base_category(const wuffs_base__token* t) { |
| 203 | return ((int64_t)(t->repr)) >> WUFFS_BASE__TOKEN__VALUE_BASE_CATEGORY__SHIFT; |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 204 | } |
| 205 | |
| 206 | static inline uint64_t // |
| 207 | wuffs_base__token__value_minor(const wuffs_base__token* t) { |
Nigel Tao | 496e88b | 2020-04-09 22:10:08 +1000 | [diff] [blame] | 208 | return (t->repr >> WUFFS_BASE__TOKEN__VALUE_MINOR__SHIFT) & 0x1FFFFFF; |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 209 | } |
| 210 | |
| 211 | static inline uint64_t // |
| 212 | wuffs_base__token__value_base_detail(const wuffs_base__token* t) { |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 213 | return (t->repr >> WUFFS_BASE__TOKEN__VALUE_BASE_DETAIL__SHIFT) & 0x1FFFFF; |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 214 | } |
| 215 | |
Nigel Tao | c9d4e34 | 2020-07-21 15:20:34 +1000 | [diff] [blame] | 216 | static inline int64_t // |
| 217 | wuffs_base__token__value_base_detail__sign_extended( |
| 218 | const wuffs_base__token* t) { |
| 219 | // The VBD is 21 bits in the middle of t->repr. Left shift the high (64 - 21 |
| 220 | // - ETC__SHIFT) bits off, then right shift (sign-extending) back down. |
| 221 | uint64_t u = t->repr << (43 - WUFFS_BASE__TOKEN__VALUE_BASE_DETAIL__SHIFT); |
| 222 | return ((int64_t)u) >> 43; |
| 223 | } |
| 224 | |
Nigel Tao | d1c928a | 2020-02-28 12:43:53 +1100 | [diff] [blame] | 225 | static inline bool // |
Nigel Tao | 496e88b | 2020-04-09 22:10:08 +1000 | [diff] [blame] | 226 | wuffs_base__token__continued(const wuffs_base__token* t) { |
| 227 | return t->repr & 0x10000; |
Nigel Tao | d1c928a | 2020-02-28 12:43:53 +1100 | [diff] [blame] | 228 | } |
| 229 | |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 230 | static inline uint64_t // |
| 231 | wuffs_base__token__length(const wuffs_base__token* t) { |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 232 | return (t->repr >> WUFFS_BASE__TOKEN__LENGTH__SHIFT) & 0xFFFF; |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 233 | } |
| 234 | |
| 235 | #ifdef __cplusplus |
| 236 | |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 237 | inline int64_t // |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 238 | wuffs_base__token::value() const { |
| 239 | return wuffs_base__token__value(this); |
| 240 | } |
| 241 | |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 242 | inline int64_t // |
| 243 | wuffs_base__token::value_extension() const { |
| 244 | return wuffs_base__token__value_extension(this); |
| 245 | } |
| 246 | |
| 247 | inline int64_t // |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 248 | wuffs_base__token::value_major() const { |
| 249 | return wuffs_base__token__value_major(this); |
| 250 | } |
| 251 | |
Nigel Tao | 462f866 | 2020-04-01 23:01:51 +1100 | [diff] [blame] | 252 | inline int64_t // |
| 253 | wuffs_base__token::value_base_category() const { |
| 254 | return wuffs_base__token__value_base_category(this); |
| 255 | } |
| 256 | |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 257 | inline uint64_t // |
| 258 | wuffs_base__token::value_minor() const { |
| 259 | return wuffs_base__token__value_minor(this); |
| 260 | } |
| 261 | |
| 262 | inline uint64_t // |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 263 | wuffs_base__token::value_base_detail() const { |
| 264 | return wuffs_base__token__value_base_detail(this); |
| 265 | } |
| 266 | |
Nigel Tao | c9d4e34 | 2020-07-21 15:20:34 +1000 | [diff] [blame] | 267 | inline int64_t // |
| 268 | wuffs_base__token::value_base_detail__sign_extended() const { |
| 269 | return wuffs_base__token__value_base_detail__sign_extended(this); |
| 270 | } |
| 271 | |
Nigel Tao | d1c928a | 2020-02-28 12:43:53 +1100 | [diff] [blame] | 272 | inline bool // |
Nigel Tao | 496e88b | 2020-04-09 22:10:08 +1000 | [diff] [blame] | 273 | wuffs_base__token::continued() const { |
| 274 | return wuffs_base__token__continued(this); |
Nigel Tao | d1c928a | 2020-02-28 12:43:53 +1100 | [diff] [blame] | 275 | } |
| 276 | |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 277 | inline uint64_t // |
| 278 | wuffs_base__token::length() const { |
| 279 | return wuffs_base__token__length(this); |
| 280 | } |
| 281 | |
| 282 | #endif // __cplusplus |
| 283 | |
| 284 | // -------- |
| 285 | |
// wuffs_base__slice_token is the WUFFS_BASE__SLICE instantiation for
// wuffs_base__token elements. The code in this file reads and writes its ptr
// and len fields.
typedef WUFFS_BASE__SLICE(wuffs_base__token) wuffs_base__slice_token;
| 287 | |
| 288 | static inline wuffs_base__slice_token // |
| 289 | wuffs_base__make_slice_token(wuffs_base__token* ptr, size_t len) { |
| 290 | wuffs_base__slice_token ret; |
| 291 | ret.ptr = ptr; |
| 292 | ret.len = len; |
| 293 | return ret; |
| 294 | } |
| 295 | |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 296 | static inline wuffs_base__slice_token // |
| 297 | wuffs_base__empty_slice_token() { |
| 298 | wuffs_base__slice_token ret; |
| 299 | ret.ptr = NULL; |
| 300 | ret.len = 0; |
| 301 | return ret; |
| 302 | } |
| 303 | |
Nigel Tao | 3685798 | 2020-02-12 11:33:13 +1100 | [diff] [blame] | 304 | // -------- |
| 305 | |
// wuffs_base__token_buffer_meta holds the bookkeeping fields (indexes, stream
// position and closed-ness) that accompany a wuffs_base__token_buffer's data
// slice.
typedef struct wuffs_base__token_buffer_meta__struct {
  // Write index. Invariant: wi <= len.
  size_t wi;
  // Read index. Invariant: ri <= wi.
  size_t ri;
  // Position of the buffer start relative to the stream start.
  uint64_t pos;
  // No further writes are expected.
  bool closed;
} wuffs_base__token_buffer_meta;
| 314 | |
| 315 | // wuffs_base__token_buffer is a 1-dimensional buffer (a pointer and length) |
| 316 | // plus additional metadata. |
| 317 | // |
| 318 | // A value with all fields zero is a valid, empty buffer. |
Nigel Tao | 4f1d24c | 2020-09-23 22:02:53 +1000 | [diff] [blame] | 319 | typedef struct wuffs_base__token_buffer__struct { |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 320 | wuffs_base__slice_token data; |
| 321 | wuffs_base__token_buffer_meta meta; |
| 322 | |
| 323 | #ifdef __cplusplus |
Nigel Tao | 9fd96e8 | 2020-03-16 21:46:21 +1100 | [diff] [blame] | 324 | inline bool is_valid() const; |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 325 | inline void compact(); |
Nigel Tao | 82a96cb | 2020-08-06 23:41:36 +1000 | [diff] [blame] | 326 | inline uint64_t reader_length() const; |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 327 | inline wuffs_base__token* reader_pointer() const; |
| 328 | inline wuffs_base__slice_token reader_slice() const; |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 329 | inline uint64_t reader_token_position() const; |
Nigel Tao | 82a96cb | 2020-08-06 23:41:36 +1000 | [diff] [blame] | 330 | inline uint64_t writer_length() const; |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 331 | inline uint64_t writer_token_position() const; |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 332 | inline wuffs_base__token* writer_pointer() const; |
| 333 | inline wuffs_base__slice_token writer_slice() const; |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 334 | #endif // __cplusplus |
| 335 | |
| 336 | } wuffs_base__token_buffer; |
| 337 | |
| 338 | static inline wuffs_base__token_buffer // |
| 339 | wuffs_base__make_token_buffer(wuffs_base__slice_token data, |
| 340 | wuffs_base__token_buffer_meta meta) { |
| 341 | wuffs_base__token_buffer ret; |
| 342 | ret.data = data; |
| 343 | ret.meta = meta; |
| 344 | return ret; |
| 345 | } |
| 346 | |
| 347 | static inline wuffs_base__token_buffer_meta // |
| 348 | wuffs_base__make_token_buffer_meta(size_t wi, |
| 349 | size_t ri, |
| 350 | uint64_t pos, |
| 351 | bool closed) { |
| 352 | wuffs_base__token_buffer_meta ret; |
| 353 | ret.wi = wi; |
| 354 | ret.ri = ri; |
| 355 | ret.pos = pos; |
| 356 | ret.closed = closed; |
| 357 | return ret; |
| 358 | } |
| 359 | |
| 360 | static inline wuffs_base__token_buffer // |
Nigel Tao | 64dbd00 | 2020-04-02 22:11:42 +1100 | [diff] [blame] | 361 | wuffs_base__slice_token__reader(wuffs_base__slice_token s, bool closed) { |
Nigel Tao | 9fd96e8 | 2020-03-16 21:46:21 +1100 | [diff] [blame] | 362 | wuffs_base__token_buffer ret; |
| 363 | ret.data.ptr = s.ptr; |
| 364 | ret.data.len = s.len; |
| 365 | ret.meta.wi = s.len; |
| 366 | ret.meta.ri = 0; |
| 367 | ret.meta.pos = 0; |
| 368 | ret.meta.closed = closed; |
| 369 | return ret; |
| 370 | } |
| 371 | |
| 372 | static inline wuffs_base__token_buffer // |
Nigel Tao | 64dbd00 | 2020-04-02 22:11:42 +1100 | [diff] [blame] | 373 | wuffs_base__slice_token__writer(wuffs_base__slice_token s) { |
Nigel Tao | 9fd96e8 | 2020-03-16 21:46:21 +1100 | [diff] [blame] | 374 | wuffs_base__token_buffer ret; |
| 375 | ret.data.ptr = s.ptr; |
| 376 | ret.data.len = s.len; |
| 377 | ret.meta.wi = 0; |
| 378 | ret.meta.ri = 0; |
| 379 | ret.meta.pos = 0; |
| 380 | ret.meta.closed = false; |
| 381 | return ret; |
| 382 | } |
| 383 | |
| 384 | static inline wuffs_base__token_buffer // |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 385 | wuffs_base__empty_token_buffer() { |
| 386 | wuffs_base__token_buffer ret; |
| 387 | ret.data.ptr = NULL; |
| 388 | ret.data.len = 0; |
| 389 | ret.meta.wi = 0; |
| 390 | ret.meta.ri = 0; |
| 391 | ret.meta.pos = 0; |
| 392 | ret.meta.closed = false; |
| 393 | return ret; |
| 394 | } |
| 395 | |
| 396 | static inline wuffs_base__token_buffer_meta // |
| 397 | wuffs_base__empty_token_buffer_meta() { |
| 398 | wuffs_base__token_buffer_meta ret; |
| 399 | ret.wi = 0; |
| 400 | ret.ri = 0; |
| 401 | ret.pos = 0; |
| 402 | ret.closed = false; |
| 403 | return ret; |
| 404 | } |
| 405 | |
Nigel Tao | 9fd96e8 | 2020-03-16 21:46:21 +1100 | [diff] [blame] | 406 | static inline bool // |
| 407 | wuffs_base__token_buffer__is_valid(const wuffs_base__token_buffer* buf) { |
| 408 | if (buf) { |
| 409 | if (buf->data.ptr) { |
| 410 | return (buf->meta.ri <= buf->meta.wi) && (buf->meta.wi <= buf->data.len); |
| 411 | } else { |
| 412 | return (buf->meta.ri == 0) && (buf->meta.wi == 0) && (buf->data.len == 0); |
| 413 | } |
| 414 | } |
| 415 | return false; |
| 416 | } |
| 417 | |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 418 | // wuffs_base__token_buffer__compact moves any written but unread tokens to the |
| 419 | // start of the buffer. |
| 420 | static inline void // |
| 421 | wuffs_base__token_buffer__compact(wuffs_base__token_buffer* buf) { |
| 422 | if (!buf || (buf->meta.ri == 0)) { |
| 423 | return; |
| 424 | } |
| 425 | buf->meta.pos = wuffs_base__u64__sat_add(buf->meta.pos, buf->meta.ri); |
| 426 | size_t n = buf->meta.wi - buf->meta.ri; |
| 427 | if (n != 0) { |
| 428 | memmove(buf->data.ptr, buf->data.ptr + buf->meta.ri, |
| 429 | n * sizeof(wuffs_base__token)); |
| 430 | } |
| 431 | buf->meta.wi = n; |
| 432 | buf->meta.ri = 0; |
| 433 | } |
| 434 | |
| 435 | static inline uint64_t // |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 436 | wuffs_base__token_buffer__reader_length(const wuffs_base__token_buffer* buf) { |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 437 | return buf ? buf->meta.wi - buf->meta.ri : 0; |
| 438 | } |
| 439 | |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 440 | static inline wuffs_base__token* // |
| 441 | wuffs_base__token_buffer__reader_pointer(const wuffs_base__token_buffer* buf) { |
| 442 | return buf ? (buf->data.ptr + buf->meta.ri) : NULL; |
| 443 | } |
| 444 | |
| 445 | static inline wuffs_base__slice_token // |
| 446 | wuffs_base__token_buffer__reader_slice(const wuffs_base__token_buffer* buf) { |
| 447 | return buf ? wuffs_base__make_slice_token(buf->data.ptr + buf->meta.ri, |
| 448 | buf->meta.wi - buf->meta.ri) |
| 449 | : wuffs_base__empty_slice_token(); |
| 450 | } |
| 451 | |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 452 | static inline uint64_t // |
| 453 | wuffs_base__token_buffer__reader_token_position( |
| 454 | const wuffs_base__token_buffer* buf) { |
| 455 | return buf ? wuffs_base__u64__sat_add(buf->meta.pos, buf->meta.ri) : 0; |
| 456 | } |
| 457 | |
| 458 | static inline uint64_t // |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 459 | wuffs_base__token_buffer__writer_length(const wuffs_base__token_buffer* buf) { |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 460 | return buf ? buf->data.len - buf->meta.wi : 0; |
| 461 | } |
| 462 | |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 463 | static inline wuffs_base__token* // |
| 464 | wuffs_base__token_buffer__writer_pointer(const wuffs_base__token_buffer* buf) { |
| 465 | return buf ? (buf->data.ptr + buf->meta.wi) : NULL; |
| 466 | } |
| 467 | |
| 468 | static inline wuffs_base__slice_token // |
| 469 | wuffs_base__token_buffer__writer_slice(const wuffs_base__token_buffer* buf) { |
| 470 | return buf ? wuffs_base__make_slice_token(buf->data.ptr + buf->meta.wi, |
| 471 | buf->data.len - buf->meta.wi) |
| 472 | : wuffs_base__empty_slice_token(); |
| 473 | } |
| 474 | |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 475 | static inline uint64_t // |
| 476 | wuffs_base__token_buffer__writer_token_position( |
| 477 | const wuffs_base__token_buffer* buf) { |
| 478 | return buf ? wuffs_base__u64__sat_add(buf->meta.pos, buf->meta.wi) : 0; |
| 479 | } |
| 480 | |
| 481 | #ifdef __cplusplus |
| 482 | |
Nigel Tao | 9fd96e8 | 2020-03-16 21:46:21 +1100 | [diff] [blame] | 483 | inline bool // |
| 484 | wuffs_base__token_buffer::is_valid() const { |
| 485 | return wuffs_base__token_buffer__is_valid(this); |
| 486 | } |
| 487 | |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 488 | inline void // |
| 489 | wuffs_base__token_buffer::compact() { |
| 490 | wuffs_base__token_buffer__compact(this); |
| 491 | } |
| 492 | |
| 493 | inline uint64_t // |
Nigel Tao | 82a96cb | 2020-08-06 23:41:36 +1000 | [diff] [blame] | 494 | wuffs_base__token_buffer::reader_length() const { |
| 495 | return wuffs_base__token_buffer__reader_length(this); |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 496 | } |
| 497 | |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 498 | inline wuffs_base__token* // |
| 499 | wuffs_base__token_buffer::reader_pointer() const { |
| 500 | return wuffs_base__token_buffer__reader_pointer(this); |
| 501 | } |
| 502 | |
| 503 | inline wuffs_base__slice_token // |
| 504 | wuffs_base__token_buffer::reader_slice() const { |
| 505 | return wuffs_base__token_buffer__reader_slice(this); |
| 506 | } |
| 507 | |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 508 | inline uint64_t // |
| 509 | wuffs_base__token_buffer::reader_token_position() const { |
| 510 | return wuffs_base__token_buffer__reader_token_position(this); |
| 511 | } |
| 512 | |
| 513 | inline uint64_t // |
Nigel Tao | 82a96cb | 2020-08-06 23:41:36 +1000 | [diff] [blame] | 514 | wuffs_base__token_buffer::writer_length() const { |
| 515 | return wuffs_base__token_buffer__writer_length(this); |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 516 | } |
| 517 | |
Nigel Tao | 934136b | 2020-08-06 23:51:13 +1000 | [diff] [blame] | 518 | inline wuffs_base__token* // |
| 519 | wuffs_base__token_buffer::writer_pointer() const { |
| 520 | return wuffs_base__token_buffer__writer_pointer(this); |
| 521 | } |
| 522 | |
| 523 | inline wuffs_base__slice_token // |
| 524 | wuffs_base__token_buffer::writer_slice() const { |
| 525 | return wuffs_base__token_buffer__writer_slice(this); |
| 526 | } |
| 527 | |
Nigel Tao | 737e31f | 2020-02-11 11:23:17 +1100 | [diff] [blame] | 528 | inline uint64_t // |
| 529 | wuffs_base__token_buffer::writer_token_position() const { |
| 530 | return wuffs_base__token_buffer__writer_token_position(this); |
| 531 | } |
| 532 | |
| 533 | #endif // __cplusplus |