|
1 | 1 | ///! This file is generated by `./x run src/tools/unicode-table-generator`; do not edit manually!
|
2 | 2 | // Alphabetic : 1723 bytes, 142707 codepoints in 755 ranges (U+0000AA - U+0323B0) using skiplist
|
3 | 3 | // Case_Ignorable : 1043 bytes, 2744 codepoints in 447 ranges (U+0000A8 - U+0E01F0) using skiplist
|
4 |
| -// Cased : 403 bytes, 4526 codepoints in 157 ranges (U+0000AA - U+01F18A) using skiplist |
5 | 4 | // Cc : 7 bytes, 32 codepoints in 1 ranges (U+000080 - U+0000A0) using skiplist
|
6 | 5 | // Grapheme_Extend : 887 bytes, 2193 codepoints in 375 ranges (U+000300 - U+0E01F0) using skiplist
|
7 | 6 | // Lowercase : 933 bytes, 2543 codepoints in 674 ranges (U+0000AA - U+01E944) using bitset
|
| 7 | +// Lt : 33 bytes, 31 codepoints in 10 ranges (U+0001C5 - U+001FFD) using skiplist |
8 | 8 | // N : 455 bytes, 1901 codepoints in 143 ranges (U+0000B2 - U+01FBFA) using skiplist
|
9 | 9 | // Uppercase : 797 bytes, 1952 codepoints in 655 ranges (U+0000C0 - U+01F18A) using bitset
|
10 | 10 | // White_Space : 256 bytes, 19 codepoints in 8 ranges (U+000085 - U+003001) using cascading
|
11 | 11 | // to_lower : 11484 bytes
|
12 | 12 | // to_upper : 13432 bytes
|
13 |
| -// Total : 31420 bytes |
| 13 | +// Total : 31050 bytes |
14 | 14 |
|
15 | 15 | #[inline(always)]
|
16 | 16 | const fn bitset_search<
|
@@ -338,59 +338,6 @@ pub mod case_ignorable {
|
338 | 338 | }
|
339 | 339 | }
|
340 | 340 |
|
341 |
| -#[rustfmt::skip] |
342 |
| -pub mod cased { |
343 |
| - use super::ShortOffsetRunHeader; |
344 |
| - |
345 |
| - static SHORT_OFFSET_RUNS: [ShortOffsetRunHeader; 22] = [ |
346 |
| - ShortOffsetRunHeader::new(0, 4256), ShortOffsetRunHeader::new(51, 5024), |
347 |
| - ShortOffsetRunHeader::new(61, 7296), ShortOffsetRunHeader::new(65, 7958), |
348 |
| - ShortOffsetRunHeader::new(74, 9398), ShortOffsetRunHeader::new(149, 11264), |
349 |
| - ShortOffsetRunHeader::new(151, 42560), ShortOffsetRunHeader::new(163, 43824), |
350 |
| - ShortOffsetRunHeader::new(183, 64256), ShortOffsetRunHeader::new(189, 65313), |
351 |
| - ShortOffsetRunHeader::new(193, 66560), ShortOffsetRunHeader::new(197, 67456), |
352 |
| - ShortOffsetRunHeader::new(219, 68736), ShortOffsetRunHeader::new(227, 71840), |
353 |
| - ShortOffsetRunHeader::new(235, 93760), ShortOffsetRunHeader::new(237, 119808), |
354 |
| - ShortOffsetRunHeader::new(239, 120486), ShortOffsetRunHeader::new(276, 122624), |
355 |
| - ShortOffsetRunHeader::new(299, 122928), ShortOffsetRunHeader::new(305, 125184), |
356 |
| - ShortOffsetRunHeader::new(307, 127280), ShortOffsetRunHeader::new(309, 1241482), |
357 |
| - ]; |
358 |
| - static OFFSETS: [u8; 315] = [ |
359 |
| - 170, 1, 10, 1, 4, 1, 5, 23, 1, 31, 1, 195, 1, 4, 4, 208, 1, 36, 7, 2, 30, 5, 96, 1, 42, 4, |
360 |
| - 2, 2, 2, 4, 1, 1, 6, 1, 1, 3, 1, 1, 1, 20, 1, 83, 1, 139, 8, 166, 1, 38, 9, 41, 0, 38, 1, 1, |
361 |
| - 5, 1, 2, 43, 1, 4, 0, 86, 2, 6, 0, 11, 5, 43, 2, 3, 64, 192, 64, 0, 2, 6, 2, 38, 2, 6, 2, 8, |
362 |
| - 1, 1, 1, 1, 1, 1, 1, 31, 2, 53, 1, 7, 1, 1, 3, 3, 1, 7, 3, 4, 2, 6, 4, 13, 5, 3, 1, 7, 116, |
363 |
| - 1, 13, 1, 16, 13, 101, 1, 4, 1, 2, 10, 1, 1, 3, 5, 6, 1, 1, 1, 1, 1, 1, 4, 1, 6, 4, 1, 2, 4, |
364 |
| - 5, 5, 4, 1, 17, 32, 3, 2, 0, 52, 0, 229, 6, 4, 3, 2, 12, 38, 1, 1, 5, 1, 0, 46, 18, 30, 132, |
365 |
| - 102, 3, 4, 1, 62, 2, 2, 1, 1, 1, 8, 21, 5, 1, 3, 0, 43, 1, 14, 6, 80, 0, 7, 12, 5, 0, 26, 6, |
366 |
| - 26, 0, 80, 96, 36, 4, 36, 116, 11, 1, 15, 1, 7, 1, 2, 1, 11, 1, 15, 1, 7, 1, 2, 0, 1, 2, 3, |
367 |
| - 1, 42, 1, 9, 0, 51, 13, 51, 93, 22, 10, 22, 0, 64, 0, 64, 0, 85, 1, 71, 1, 2, 2, 1, 2, 2, 2, |
368 |
| - 4, 1, 12, 1, 1, 1, 7, 1, 65, 1, 4, 2, 8, 1, 7, 1, 28, 1, 4, 1, 5, 1, 1, 3, 7, 1, 0, 2, 25, |
369 |
| - 1, 25, 1, 31, 1, 25, 1, 31, 1, 25, 1, 31, 1, 25, 1, 31, 1, 25, 1, 8, 0, 10, 1, 20, 6, 6, 0, |
370 |
| - 62, 0, 68, 0, 26, 6, 26, 6, 26, 0, |
371 |
| - ]; |
372 |
| - #[inline] |
373 |
| - pub fn lookup(c: char) -> bool { |
374 |
| - debug_assert!(!c.is_ascii()); |
375 |
| - (c as u32) >= 0xaa && lookup_slow(c) |
376 |
| - } |
377 |
| - |
378 |
| - #[inline(never)] |
379 |
| - fn lookup_slow(c: char) -> bool { |
380 |
| - const { |
381 |
| - assert!(SHORT_OFFSET_RUNS.last().unwrap().0 > char::MAX as u32); |
382 |
| - let mut i = 0; |
383 |
| - while i < SHORT_OFFSET_RUNS.len() { |
384 |
| - assert!(SHORT_OFFSET_RUNS[i].start_index() < OFFSETS.len()); |
385 |
| - i += 1; |
386 |
| - } |
387 |
| - } |
388 |
| - // SAFETY: We just ensured the last element of `SHORT_OFFSET_RUNS` is greater than `std::char::MAX` |
389 |
| - // and the start indices of all elements in `SHORT_OFFSET_RUNS` are smaller than `OFFSETS.len()`. |
390 |
| - unsafe { super::skip_search(c, &SHORT_OFFSET_RUNS, &OFFSETS) } |
391 |
| - } |
392 |
| -} |
393 |
| - |
394 | 341 | #[rustfmt::skip]
|
395 | 342 | pub mod cc {
|
396 | 343 | use super::ShortOffsetRunHeader;
|
@@ -605,6 +552,39 @@ pub mod lowercase {
|
605 | 552 | }
|
606 | 553 | }
|
607 | 554 |
|
| 555 | +#[rustfmt::skip] |
| 556 | +pub mod lt { |
| 557 | + use super::ShortOffsetRunHeader; |
| 558 | + |
| 559 | + static SHORT_OFFSET_RUNS: [ShortOffsetRunHeader; 3] = [ |
| 560 | + ShortOffsetRunHeader::new(0, 453), ShortOffsetRunHeader::new(1, 8072), |
| 561 | + ShortOffsetRunHeader::new(9, 1122301), |
| 562 | + ]; |
| 563 | + static OFFSETS: [u8; 21] = [ |
| 564 | + 0, 1, 2, 1, 2, 1, 38, 1, 0, 8, 8, 8, 8, 8, 12, 1, 15, 1, 47, 1, 0, |
| 565 | + ]; |
| 566 | + #[inline] |
| 567 | + pub fn lookup(c: char) -> bool { |
| 568 | + debug_assert!(!c.is_ascii()); |
| 569 | + (c as u32) >= 0x1c5 && lookup_slow(c) |
| 570 | + } |
| 571 | + |
| 572 | + #[inline(never)] |
| 573 | + fn lookup_slow(c: char) -> bool { |
| 574 | + const { |
| 575 | + assert!(SHORT_OFFSET_RUNS.last().unwrap().0 > char::MAX as u32); |
| 576 | + let mut i = 0; |
| 577 | + while i < SHORT_OFFSET_RUNS.len() { |
| 578 | + assert!(SHORT_OFFSET_RUNS[i].start_index() < OFFSETS.len()); |
| 579 | + i += 1; |
| 580 | + } |
| 581 | + } |
| 582 | + // SAFETY: We just ensured the last element of `SHORT_OFFSET_RUNS` is greater than `std::char::MAX` |
| 583 | + // and the start indices of all elements in `SHORT_OFFSET_RUNS` are smaller than `OFFSETS.len()`. |
| 584 | + unsafe { super::skip_search(c, &SHORT_OFFSET_RUNS, &OFFSETS) } |
| 585 | + } |
| 586 | +} |
| 587 | + |
608 | 588 | #[rustfmt::skip]
|
609 | 589 | pub mod n {
|
610 | 590 | use super::ShortOffsetRunHeader;
|
|
0 commit comments