| 1 | #![allow ( |
| 2 | dead_code, |
| 3 | non_upper_case_globals, |
| 4 | unused_assignments, |
| 5 | unused_parens, |
| 6 | while_true, |
| 7 | clippy::assign_op_pattern, |
| 8 | clippy::collapsible_if, |
| 9 | clippy::comparison_chain, |
| 10 | clippy::double_parens, |
| 11 | clippy::unnecessary_cast, |
| 12 | clippy::single_match, |
| 13 | clippy::never_loop |
| 14 | )] |
| 15 | |
| 16 | use super::buffer::{hb_buffer_t, HB_BUFFER_SCRATCH_FLAG_HAS_BROKEN_SYLLABLE}; |
| 17 | |
| 18 | static _khmer_syllable_machine_actions: [i8; 29] = [ |
| 19 | 0, 1, 0, 1, 1, 1, 2, 1, 5, 1, 6, 1, 7, 1, 8, 1, 9, 1, 10, 1, 11, 2, 2, 3, 2, 2, 4, 0, 0, |
| 20 | ]; |
| 21 | static _khmer_syllable_machine_key_offsets: [i16; 45] = [ |
| 22 | 0, 5, 8, 11, 15, 18, 21, 25, 28, 32, 35, 40, 45, 48, 51, 55, 58, 61, 65, 68, 72, 75, 90, 100, |
| 23 | 103, 113, 122, 123, 129, 134, 141, 149, 158, 168, 171, 181, 190, 191, 197, 202, 209, 217, 226, |
| 24 | 0, 0, |
| 25 | ]; |
| 26 | static _khmer_syllable_machine_trans_keys: [u8; 232] = [ |
| 27 | 20, 25, 26, 5, 6, 26, 5, 6, 15, 1, 2, 20, 26, 5, 6, 26, 5, 6, 26, 5, 6, 20, 26, 5, 6, 26, 5, 6, |
| 28 | 20, 26, 5, 6, 26, 5, 6, 20, 25, 26, 5, 6, 20, 25, 26, 5, 6, 26, 5, 6, 15, 1, 2, 20, 26, 5, 6, |
| 29 | 26, 5, 6, 26, 5, 6, 20, 26, 5, 6, 26, 5, 6, 20, 26, 5, 6, 26, 5, 6, 4, 15, 20, 21, 22, 23, 25, |
| 30 | 26, 27, 1, 2, 5, 6, 10, 11, 4, 20, 21, 22, 23, 25, 26, 27, 5, 6, 15, 1, 2, 4, 20, 21, 22, 23, |
| 31 | 25, 26, 27, 5, 6, 4, 20, 21, 22, 23, 26, 27, 5, 6, 27, 4, 23, 26, 27, 5, 6, 4, 26, 27, 5, 6, 4, |
| 32 | 20, 23, 26, 27, 5, 6, 4, 20, 21, 23, 26, 27, 5, 6, 4, 20, 21, 22, 23, 26, 27, 5, 6, 4, 20, 21, |
| 33 | 22, 23, 25, 26, 27, 5, 6, 15, 1, 2, 4, 20, 21, 22, 23, 25, 26, 27, 5, 6, 4, 20, 21, 22, 23, 26, |
| 34 | 27, 5, 6, 27, 4, 23, 26, 27, 5, 6, 4, 26, 27, 5, 6, 4, 20, 23, 26, 27, 5, 6, 4, 20, 21, 23, 26, |
| 35 | 27, 5, 6, 4, 20, 21, 22, 23, 26, 27, 5, 6, 20, 26, 5, 6, 0, 0, |
| 36 | ]; |
| 37 | static _khmer_syllable_machine_single_lengths: [i8; 45] = [ |
| 38 | 3, 1, 1, 2, 1, 1, 2, 1, 2, 1, 3, 3, 1, 1, 2, 1, 1, 2, 1, 2, 1, 9, 8, 1, 8, 7, 1, 4, 3, 5, 6, 7, |
| 39 | 8, 1, 8, 7, 1, 4, 3, 5, 6, 7, 2, 0, 0, |
| 40 | ]; |
| 41 | static _khmer_syllable_machine_range_lengths: [i8; 45] = [ |
| 42 | 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, |
| 43 | 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, |
| 44 | ]; |
| 45 | static _khmer_syllable_machine_index_offsets: [i16; 45] = [ |
| 46 | 0, 5, 8, 11, 15, 18, 21, 25, 28, 32, 35, 40, 45, 48, 51, 55, 58, 61, 65, 68, 72, 75, 88, 98, |
| 47 | 101, 111, 120, 122, 128, 133, 140, 148, 157, 167, 170, 180, 189, 191, 197, 202, 209, 217, 226, |
| 48 | 0, 0, |
| 49 | ]; |
| 50 | static _khmer_syllable_machine_cond_targs: [i8; 275] = [ |
| 51 | 27, 31, 25, 1, 21, 25, 1, 21, 26, 26, 21, 27, 25, 1, 21, 27, 4, 21, 28, 5, 21, 27, 29, 7, 21, |
| 52 | 29, 7, 21, 27, 30, 9, 21, 30, 9, 21, 27, 32, 25, 1, 21, 37, 41, 35, 12, 21, 35, 12, 21, 36, 36, |
| 53 | 21, 37, 35, 12, 21, 37, 15, 21, 38, 16, 21, 37, 39, 18, 21, 39, 18, 21, 37, 40, 20, 21, 40, 20, |
| 54 | 21, 33, 22, 37, 39, 40, 38, 41, 35, 36, 22, 42, 32, 21, 23, 27, 29, 30, 28, 32, 25, 26, 10, 21, |
| 55 | 24, 24, 21, 23, 27, 29, 30, 28, 31, 25, 26, 0, 21, 2, 27, 29, 30, 28, 25, 26, 3, 21, 26, 21, 2, |
| 56 | 28, 27, 26, 4, 21, 2, 28, 26, 5, 21, 2, 27, 28, 29, 26, 6, 21, 2, 27, 29, 28, 30, 26, 8, 21, |
| 57 | 23, 27, 29, 30, 28, 25, 26, 3, 21, 23, 27, 29, 30, 28, 31, 25, 26, 3, 21, 34, 34, 21, 33, 37, |
| 58 | 39, 40, 38, 41, 35, 36, 11, 21, 13, 37, 39, 40, 38, 35, 36, 14, 21, 36, 21, 13, 38, 37, 36, 15, |
| 59 | 21, 13, 38, 36, 16, 21, 13, 37, 38, 39, 36, 17, 21, 13, 37, 39, 38, 40, 36, 19, 21, 33, 37, 39, |
| 60 | 40, 38, 35, 36, 14, 21, 37, 35, 12, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, |
| 61 | 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, 21, |
| 62 | 21, 21, 21, 21, 21, 0, 0, |
| 63 | ]; |
| 64 | static _khmer_syllable_machine_cond_actions: [i8; 275] = [ |
| 65 | 5, 5, 5, 0, 15, 5, 0, 15, 0, 0, 15, 5, 5, 0, 15, 5, 0, 15, 5, 0, 15, 5, 5, 0, 15, 5, 0, 15, 5, |
| 66 | 5, 0, 15, 5, 0, 15, 5, 5, 5, 0, 15, 5, 21, 21, 0, 17, 21, 0, 19, 0, 0, 17, 5, 21, 0, 17, 5, 0, |
| 67 | 17, 5, 0, 17, 5, 5, 0, 17, 5, 0, 17, 5, 5, 0, 17, 5, 0, 17, 0, 5, 5, 5, 5, 5, 21, 21, 0, 5, 24, |
| 68 | 5, 7, 0, 5, 5, 5, 5, 5, 5, 0, 0, 9, 5, 5, 9, 0, 5, 5, 5, 5, 5, 5, 0, 0, 9, 0, 5, 5, 5, 5, 5, 0, |
| 69 | 0, 9, 0, 9, 0, 5, 5, 0, 0, 9, 0, 5, 0, 0, 9, 0, 5, 5, 5, 0, 0, 9, 0, 5, 5, 5, 5, 0, 0, 9, 0, 5, |
| 70 | 5, 5, 5, 5, 0, 0, 9, 0, 5, 5, 5, 5, 5, 5, 0, 0, 9, 21, 21, 11, 0, 5, 5, 5, 5, 21, 21, 0, 0, 11, |
| 71 | 0, 5, 5, 5, 5, 21, 0, 0, 11, 0, 11, 0, 5, 5, 0, 0, 11, 0, 5, 0, 0, 11, 0, 5, 5, 5, 0, 0, 11, 0, |
| 72 | 5, 5, 5, 5, 0, 0, 11, 0, 5, 5, 5, 5, 21, 0, 0, 11, 5, 21, 0, 13, 15, 15, 15, 15, 15, 15, 15, |
| 73 | 15, 15, 15, 15, 17, 19, 17, 17, 17, 17, 17, 17, 17, 17, 0, 9, 9, 9, 9, 9, 9, 9, 9, 9, 9, 9, 11, |
| 74 | 11, 11, 11, 11, 11, 11, 11, 11, 13, 0, 0, |
| 75 | ]; |
| 76 | static _khmer_syllable_machine_to_state_actions: [i8; 45] = [ |
| 77 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, |
| 78 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, |
| 79 | ]; |
| 80 | static _khmer_syllable_machine_from_state_actions: [i8; 45] = [ |
| 81 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, |
| 82 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, |
| 83 | ]; |
| 84 | static _khmer_syllable_machine_eof_trans: [i16; 45] = [ |
| 85 | 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, |
| 86 | 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, |
| 87 | 269, 270, 271, 272, 273, 0, 0, |
| 88 | ]; |
| 89 | static khmer_syllable_machine_start: i32 = 21; |
| 90 | static khmer_syllable_machine_first_final: i32 = 21; |
| 91 | static khmer_syllable_machine_error: i32 = -1; |
| 92 | static khmer_syllable_machine_en_main: i32 = 21; |
| 93 | #[derive (Clone, Copy)] |
| 94 | pub enum SyllableType { |
| 95 | ConsonantSyllable = 0, |
| 96 | BrokenCluster, |
| 97 | NonKhmerCluster, |
| 98 | } |
| 99 | |
| 100 | pub fn find_syllables_khmer(buffer: &mut hb_buffer_t) { |
| 101 | let mut cs = 0; |
| 102 | let mut ts = 0; |
| 103 | let mut te = 0; |
| 104 | let mut act = 0; |
| 105 | let mut p = 0; |
| 106 | let pe = buffer.len; |
| 107 | let eof = buffer.len; |
| 108 | let mut syllable_serial = 1u8; |
| 109 | |
| 110 | macro_rules! found_syllable { |
| 111 | ($kind:expr) => {{ |
| 112 | found_syllable(ts, te, &mut syllable_serial, $kind, buffer); |
| 113 | }}; |
| 114 | } |
| 115 | |
| 116 | { |
| 117 | cs = (khmer_syllable_machine_start) as i32; |
| 118 | ts = 0; |
| 119 | te = 0; |
| 120 | act = 0; |
| 121 | } |
| 122 | |
| 123 | { |
| 124 | let mut _klen = 0; |
| 125 | let mut _trans = 0; |
| 126 | let mut _keys: i32 = 0; |
| 127 | let mut _acts: i32 = 0; |
| 128 | let mut _nacts = 0; |
| 129 | let mut __have = 0; |
| 130 | '_resume: while (p != pe || p == eof) { |
| 131 | '_again: while (true) { |
| 132 | _acts = (_khmer_syllable_machine_from_state_actions[(cs) as usize]) as i32; |
| 133 | _nacts = (_khmer_syllable_machine_actions[(_acts) as usize]) as u32; |
| 134 | _acts += 1; |
| 135 | while (_nacts > 0) { |
| 136 | match (_khmer_syllable_machine_actions[(_acts) as usize]) { |
| 137 | 1 => { |
| 138 | ts = p; |
| 139 | } |
| 140 | |
| 141 | _ => {} |
| 142 | } |
| 143 | _nacts -= 1; |
| 144 | _acts += 1; |
| 145 | } |
| 146 | if (p == eof) { |
| 147 | { |
| 148 | if (_khmer_syllable_machine_eof_trans[(cs) as usize] > 0) { |
| 149 | { |
| 150 | _trans = |
| 151 | (_khmer_syllable_machine_eof_trans[(cs) as usize]) as u32 - 1; |
| 152 | } |
| 153 | } |
| 154 | } |
| 155 | } else { |
| 156 | { |
| 157 | _keys = (_khmer_syllable_machine_key_offsets[(cs) as usize]) as i32; |
| 158 | _trans = (_khmer_syllable_machine_index_offsets[(cs) as usize]) as u32; |
| 159 | _klen = (_khmer_syllable_machine_single_lengths[(cs) as usize]) as i32; |
| 160 | __have = 0; |
| 161 | if (_klen > 0) { |
| 162 | { |
| 163 | let mut _lower: i32 = _keys; |
| 164 | let mut _upper: i32 = _keys + _klen - 1; |
| 165 | let mut _mid: i32 = 0; |
| 166 | while (true) { |
| 167 | if (_upper < _lower) { |
| 168 | { |
| 169 | _keys += _klen; |
| 170 | _trans += (_klen) as u32; |
| 171 | break; |
| 172 | } |
| 173 | } |
| 174 | _mid = _lower + ((_upper - _lower) >> 1); |
| 175 | if ((buffer.info[p].khmer_category() as u8) |
| 176 | < _khmer_syllable_machine_trans_keys[(_mid) as usize]) |
| 177 | { |
| 178 | _upper = _mid - 1; |
| 179 | } else if ((buffer.info[p].khmer_category() as u8) |
| 180 | > _khmer_syllable_machine_trans_keys[(_mid) as usize]) |
| 181 | { |
| 182 | _lower = _mid + 1; |
| 183 | } else { |
| 184 | { |
| 185 | __have = 1; |
| 186 | _trans += (_mid - _keys) as u32; |
| 187 | break; |
| 188 | } |
| 189 | } |
| 190 | } |
| 191 | } |
| 192 | } |
| 193 | _klen = (_khmer_syllable_machine_range_lengths[(cs) as usize]) as i32; |
| 194 | if (__have == 0 && _klen > 0) { |
| 195 | { |
| 196 | let mut _lower: i32 = _keys; |
| 197 | let mut _upper: i32 = _keys + (_klen << 1) - 2; |
| 198 | let mut _mid: i32 = 0; |
| 199 | while (true) { |
| 200 | if (_upper < _lower) { |
| 201 | { |
| 202 | _trans += (_klen) as u32; |
| 203 | break; |
| 204 | } |
| 205 | } |
| 206 | _mid = _lower + (((_upper - _lower) >> 1) & !1); |
| 207 | if ((buffer.info[p].khmer_category() as u8) |
| 208 | < _khmer_syllable_machine_trans_keys[(_mid) as usize]) |
| 209 | { |
| 210 | _upper = _mid - 2; |
| 211 | } else if ((buffer.info[p].khmer_category() as u8) |
| 212 | > _khmer_syllable_machine_trans_keys[(_mid + 1) as usize]) |
| 213 | { |
| 214 | _lower = _mid + 2; |
| 215 | } else { |
| 216 | { |
| 217 | _trans += ((_mid - _keys) >> 1) as u32; |
| 218 | break; |
| 219 | } |
| 220 | } |
| 221 | } |
| 222 | } |
| 223 | } |
| 224 | } |
| 225 | } |
| 226 | cs = (_khmer_syllable_machine_cond_targs[(_trans) as usize]) as i32; |
| 227 | if (_khmer_syllable_machine_cond_actions[(_trans) as usize] != 0) { |
| 228 | { |
| 229 | _acts = (_khmer_syllable_machine_cond_actions[(_trans) as usize]) as i32; |
| 230 | _nacts = (_khmer_syllable_machine_actions[(_acts) as usize]) as u32; |
| 231 | _acts += 1; |
| 232 | while (_nacts > 0) { |
| 233 | match (_khmer_syllable_machine_actions[(_acts) as usize]) { |
| 234 | 2 => { |
| 235 | te = p + 1; |
| 236 | } |
| 237 | 3 => { |
| 238 | act = 2; |
| 239 | } |
| 240 | 4 => { |
| 241 | act = 3; |
| 242 | } |
| 243 | 5 => { |
| 244 | te = p + 1; |
| 245 | { |
| 246 | found_syllable!(SyllableType::NonKhmerCluster); |
| 247 | } |
| 248 | } |
| 249 | 6 => { |
| 250 | te = p; |
| 251 | p = p - 1; |
| 252 | { |
| 253 | found_syllable!(SyllableType::ConsonantSyllable); |
| 254 | } |
| 255 | } |
| 256 | 7 => { |
| 257 | te = p; |
| 258 | p = p - 1; |
| 259 | { |
| 260 | found_syllable!(SyllableType::BrokenCluster); |
| 261 | buffer.scratch_flags |= |
| 262 | HB_BUFFER_SCRATCH_FLAG_HAS_BROKEN_SYLLABLE; |
| 263 | } |
| 264 | } |
| 265 | 8 => { |
| 266 | te = p; |
| 267 | p = p - 1; |
| 268 | { |
| 269 | found_syllable!(SyllableType::NonKhmerCluster); |
| 270 | } |
| 271 | } |
| 272 | 9 => { |
| 273 | p = (te) - 1; |
| 274 | { |
| 275 | found_syllable!(SyllableType::ConsonantSyllable); |
| 276 | } |
| 277 | } |
| 278 | 10 => { |
| 279 | p = (te) - 1; |
| 280 | { |
| 281 | found_syllable!(SyllableType::BrokenCluster); |
| 282 | buffer.scratch_flags |= |
| 283 | HB_BUFFER_SCRATCH_FLAG_HAS_BROKEN_SYLLABLE; |
| 284 | } |
| 285 | } |
| 286 | 11 => match (act) { |
| 287 | 2 => { |
| 288 | p = (te) - 1; |
| 289 | { |
| 290 | found_syllable!(SyllableType::BrokenCluster); |
| 291 | buffer.scratch_flags |= |
| 292 | HB_BUFFER_SCRATCH_FLAG_HAS_BROKEN_SYLLABLE; |
| 293 | } |
| 294 | } |
| 295 | 3 => { |
| 296 | p = (te) - 1; |
| 297 | { |
| 298 | found_syllable!(SyllableType::NonKhmerCluster); |
| 299 | } |
| 300 | } |
| 301 | |
| 302 | _ => {} |
| 303 | }, |
| 304 | |
| 305 | _ => {} |
| 306 | } |
| 307 | _nacts -= 1; |
| 308 | _acts += 1; |
| 309 | } |
| 310 | } |
| 311 | } |
| 312 | break '_again; |
| 313 | } |
| 314 | if (p == eof) { |
| 315 | { |
| 316 | if (cs >= 21) { |
| 317 | break '_resume; |
| 318 | } |
| 319 | } |
| 320 | } else { |
| 321 | { |
| 322 | _acts = (_khmer_syllable_machine_to_state_actions[(cs) as usize]) as i32; |
| 323 | _nacts = (_khmer_syllable_machine_actions[(_acts) as usize]) as u32; |
| 324 | _acts += 1; |
| 325 | while (_nacts > 0) { |
| 326 | match (_khmer_syllable_machine_actions[(_acts) as usize]) { |
| 327 | 0 => { |
| 328 | ts = 0; |
| 329 | } |
| 330 | |
| 331 | _ => {} |
| 332 | } |
| 333 | _nacts -= 1; |
| 334 | _acts += 1; |
| 335 | } |
| 336 | p += 1; |
| 337 | continue '_resume; |
| 338 | } |
| 339 | } |
| 340 | break '_resume; |
| 341 | } |
| 342 | } |
| 343 | } |
| 344 | |
| 345 | #[inline ] |
| 346 | fn found_syllable( |
| 347 | start: usize, |
| 348 | end: usize, |
| 349 | syllable_serial: &mut u8, |
| 350 | kind: SyllableType, |
| 351 | buffer: &mut hb_buffer_t, |
| 352 | ) { |
| 353 | for i: usize in start..end { |
| 354 | buffer.info[i].set_syllable((*syllable_serial << 4) | kind as u8); |
| 355 | } |
| 356 | |
| 357 | *syllable_serial += 1; |
| 358 | |
| 359 | if *syllable_serial == 16 { |
| 360 | *syllable_serial = 1; |
| 361 | } |
| 362 | } |
| 363 | |