/src/cpython/Objects/stringlib/find_max_char.h
Line | Count | Source |
1 | | /* Finding the optimal width of unicode characters in a buffer */ |
2 | | |
3 | | /* find_max_char for one-byte will work for bytes objects as well. */ |
4 | | #if !STRINGLIB_IS_UNICODE && STRINGLIB_SIZEOF_CHAR > 1 |
5 | | # error "find_max_char.h is specific to Unicode" |
6 | | #endif |
7 | | |
8 | | /* Mask to quickly check whether a C 'size_t' contains a |
9 | | non-ASCII, UTF8-encoded char. */ |
10 | | #if (SIZEOF_SIZE_T == 8) |
11 | 192M | # define UCS1_ASCII_CHAR_MASK 0x8080808080808080ULL |
12 | | #elif (SIZEOF_SIZE_T == 4) |
13 | | # define UCS1_ASCII_CHAR_MASK 0x80808080U |
14 | | #else |
15 | | # error C 'size_t' size should be either 4 or 8! |
16 | | #endif |
17 | | |
18 | | #if STRINGLIB_SIZEOF_CHAR == 1 |
19 | | |
20 | | Py_LOCAL_INLINE(Py_UCS4) |
21 | | STRINGLIB(find_max_char)(const STRINGLIB_CHAR *begin, const STRINGLIB_CHAR *end) |
22 | 45.9M | { |
23 | 45.9M | const unsigned char *p = (const unsigned char *) begin; |
24 | 45.9M | const unsigned char *_end = (const unsigned char *)end; |
25 | | |
26 | 302M | while (p < _end) { |
27 | 271M | if (_Py_IS_ALIGNED(p, ALIGNOF_SIZE_T)) { |
28 | | /* Help register allocation */ |
29 | 39.2M | const unsigned char *_p = p; |
30 | 226M | while (_p + SIZEOF_SIZE_T <= _end) { |
31 | 192M | size_t value = *(const size_t *) _p; |
32 | 192M | if (value & UCS1_ASCII_CHAR_MASK) |
33 | 5.41M | return 255; |
34 | 187M | _p += SIZEOF_SIZE_T; |
35 | 187M | } |
36 | 33.8M | p = _p; |
37 | 33.8M | if (p == _end) |
38 | 5.30M | break; |
39 | 33.8M | } |
40 | 260M | if (*p++ & 0x80) |
41 | 4.00M | return 255; |
42 | 260M | } |
43 | 36.4M | return 127; |
44 | 45.9M | } Unexecuted instantiation: unicode_writer.c:ucs1lib_find_max_char unicodeobject.c:ucs1lib_find_max_char Line | Count | Source | 22 | 45.9M | { | 23 | 45.9M | const unsigned char *p = (const unsigned char *) begin; | 24 | 45.9M | const unsigned char *_end = (const unsigned char *)end; | 25 | | | 26 | 302M | while (p < _end) { | 27 | 271M | if (_Py_IS_ALIGNED(p, ALIGNOF_SIZE_T)) { | 28 | | /* Help register allocation */ | 29 | 39.2M | const unsigned char *_p = p; | 30 | 226M | while (_p + SIZEOF_SIZE_T <= _end) { | 31 | 192M | size_t value = *(const size_t *) _p; | 32 | 192M | if (value & UCS1_ASCII_CHAR_MASK) | 33 | 5.41M | return 255; | 34 | 187M | _p += SIZEOF_SIZE_T; | 35 | 187M | } | 36 | 33.8M | p = _p; | 37 | 33.8M | if (p == _end) | 38 | 5.30M | break; | 39 | 33.8M | } | 40 | 260M | if (*p++ & 0x80) | 41 | 4.00M | return 255; | 42 | 260M | } | 43 | 36.4M | return 127; | 44 | 45.9M | } |
Unexecuted instantiation: unicodeobject.c:asciilib_find_max_char Unexecuted instantiation: bytes_methods.c:stringlib_find_max_char |
45 | | |
46 | | #undef ASCII_CHAR_MASK |
47 | | |
48 | | #else /* STRINGLIB_SIZEOF_CHAR == 1 */ |
49 | | |
50 | 84.4M | #define MASK_ASCII 0xFFFFFF80 |
51 | 56.2M | #define MASK_UCS1 0xFFFFFF00 |
52 | 28.2M | #define MASK_UCS2 0xFFFF0000 |
53 | | |
54 | 53.8M | #define MAX_CHAR_ASCII 0x7f |
55 | 24.9M | #define MAX_CHAR_UCS1 0xff |
56 | 37.0M | #define MAX_CHAR_UCS2 0xffff |
57 | 22.5M | #define MAX_CHAR_UCS4 0x10ffff |
58 | | |
59 | | Py_LOCAL_INLINE(Py_UCS4) |
60 | | STRINGLIB(find_max_char)(const STRINGLIB_CHAR *begin, const STRINGLIB_CHAR *end) |
61 | 53.8M | { |
62 | | #if STRINGLIB_SIZEOF_CHAR == 2 |
63 | 31.2M | const Py_UCS4 mask_limit = MASK_UCS1; |
64 | 31.2M | const Py_UCS4 max_char_limit = MAX_CHAR_UCS2; |
65 | | #elif STRINGLIB_SIZEOF_CHAR == 4 |
66 | 22.5M | const Py_UCS4 mask_limit = MASK_UCS2; |
67 | 22.5M | const Py_UCS4 max_char_limit = MAX_CHAR_UCS4; |
68 | | #else |
69 | | #error Invalid STRINGLIB_SIZEOF_CHAR (must be 1, 2 or 4) |
70 | | #endif |
71 | 53.8M | Py_UCS4 mask; |
72 | 53.8M | Py_ssize_t n = end - begin; |
73 | 53.8M | const STRINGLIB_CHAR *p = begin; |
74 | 53.8M | const STRINGLIB_CHAR *unrolled_end = begin + _Py_SIZE_ROUND_DOWN(n, 4); |
75 | 53.8M | Py_UCS4 max_char; |
76 | | |
77 | 53.8M | max_char = MAX_CHAR_ASCII; |
78 | 53.8M | mask = MASK_ASCII; |
79 | 1.58G | while (p < unrolled_end) { |
80 | 1.54G | STRINGLIB_CHAR bits = p[0] | p[1] | p[2] | p[3]; |
81 | 1.54G | if (bits & mask) { |
82 | 45.3M | if (mask == mask_limit) { |
83 | | /* Limit reached */ |
84 | 18.1M | return max_char_limit; |
85 | 18.1M | } |
86 | 27.2M | if (mask == MASK_ASCII) { |
87 | 22.5M | max_char = MAX_CHAR_UCS1; |
88 | 22.5M | mask = MASK_UCS1; |
89 | 22.5M | } |
90 | 4.62M | else { |
91 | | /* mask can't be MASK_UCS2 because of mask_limit above */ |
92 | 4.62M | assert(mask == MASK_UCS1); |
93 | 4.62M | max_char = MAX_CHAR_UCS2; |
94 | 4.62M | mask = MASK_UCS2; |
95 | 4.62M | } |
96 | | /* We check the new mask on the same chars in the next iteration */ |
97 | 27.2M | continue; |
98 | 45.3M | } |
99 | 1.50G | p += 4; |
100 | 1.50G | } |
101 | 106M | while (p < end) { |
102 | 72.2M | if (p[0] & mask) { |
103 | 4.62M | if (mask == mask_limit) { |
104 | | /* Limit reached */ |
105 | 1.21M | return max_char_limit; |
106 | 1.21M | } |
107 | 3.41M | if (mask == MASK_ASCII) { |
108 | 2.33M | max_char = MAX_CHAR_UCS1; |
109 | 2.33M | mask = MASK_UCS1; |
110 | 2.33M | } |
111 | 1.07M | else { |
112 | | /* mask can't be MASK_UCS2 because of mask_limit above */ |
113 | 1.07M | assert(mask == MASK_UCS1); |
114 | 1.07M | max_char = MAX_CHAR_UCS2; |
115 | 1.07M | mask = MASK_UCS2; |
116 | 1.07M | } |
117 | | /* We check the new mask on the same chars in the next iteration */ |
118 | 3.41M | continue; |
119 | 4.62M | } |
120 | 67.6M | p++; |
121 | 67.6M | } |
122 | 34.5M | return max_char; |
123 | 35.7M | } unicodeobject.c:ucs4lib_find_max_char Line | Count | Source | 61 | 22.5M | { | 62 | | #if STRINGLIB_SIZEOF_CHAR == 2 | 63 | | const Py_UCS4 mask_limit = MASK_UCS1; | 64 | | const Py_UCS4 max_char_limit = MAX_CHAR_UCS2; | 65 | | #elif STRINGLIB_SIZEOF_CHAR == 4 | 66 | 22.5M | const Py_UCS4 mask_limit = MASK_UCS2; | 67 | 22.5M | const Py_UCS4 max_char_limit = MAX_CHAR_UCS4; | 68 | | #else | 69 | | #error Invalid STRINGLIB_SIZEOF_CHAR (must be 1, 2 or 4) | 70 | | #endif | 71 | 22.5M | Py_UCS4 mask; | 72 | 22.5M | Py_ssize_t n = end - begin; | 73 | 22.5M | const STRINGLIB_CHAR *p = begin; | 74 | 22.5M | const STRINGLIB_CHAR *unrolled_end = begin + _Py_SIZE_ROUND_DOWN(n, 4); | 75 | 22.5M | Py_UCS4 max_char; | 76 | | | 77 | 22.5M | max_char = MAX_CHAR_ASCII; | 78 | 22.5M | mask = MASK_ASCII; | 79 | 535M | while (p < unrolled_end) { | 80 | 514M | STRINGLIB_CHAR bits = p[0] | p[1] | p[2] | p[3]; | 81 | 514M | if (bits & mask) { | 82 | 11.5M | if (mask == mask_limit) { | 83 | | /* Limit reached */ | 84 | 1.28M | return max_char_limit; | 85 | 1.28M | } | 86 | 10.3M | if (mask == MASK_ASCII) { | 87 | 5.68M | max_char = MAX_CHAR_UCS1; | 88 | 5.68M | mask = MASK_UCS1; | 89 | 5.68M | } | 90 | 4.62M | else { | 91 | | /* mask can't be MASK_UCS2 because of mask_limit above */ | 92 | 4.62M | assert(mask == MASK_UCS1); | 93 | 4.62M | max_char = MAX_CHAR_UCS2; | 94 | 4.62M | mask = MASK_UCS2; | 95 | 4.62M | } | 96 | | /* We check the new mask on the same chars in the next iteration */ | 97 | 10.3M | continue; | 98 | 11.5M | } | 99 | 502M | p += 4; | 100 | 502M | } | 101 | 65.5M | while (p < end) { | 102 | 44.3M | if (p[0] & mask) { | 103 | 2.33M | if (mask == mask_limit) { | 104 | | /* Limit reached */ | 105 | 91.4k | return max_char_limit; | 106 | 91.4k | } | 107 | 2.23M | if (mask == MASK_ASCII) { | 108 | 1.16M | max_char = MAX_CHAR_UCS1; | 109 | 1.16M | mask = MASK_UCS1; | 110 | 1.16M | } | 111 | 1.07M | else { | 112 | | /* mask can't be MASK_UCS2 because of mask_limit above */ | 113 | 1.07M | assert(mask == MASK_UCS1); | 114 | 1.07M | max_char = MAX_CHAR_UCS2; | 115 | 1.07M | mask = MASK_UCS2; | 116 | 1.07M | } | 117 | | /* We check the new mask on the same chars in the next iteration */ | 118 | 2.23M | continue; | 119 | 2.33M | } | 120 | 42.0M | p++; | 121 | 42.0M | } | 122 | 21.2M | return max_char; | 123 | 21.3M | } |
unicodeobject.c:ucs2lib_find_max_char Line | Count | Source | 61 | 31.2M | { | 62 | 31.2M | #if STRINGLIB_SIZEOF_CHAR == 2 | 63 | 31.2M | const Py_UCS4 mask_limit = MASK_UCS1; | 64 | 31.2M | const Py_UCS4 max_char_limit = MAX_CHAR_UCS2; | 65 | | #elif STRINGLIB_SIZEOF_CHAR == 4 | 66 | | const Py_UCS4 mask_limit = MASK_UCS2; | 67 | | const Py_UCS4 max_char_limit = MAX_CHAR_UCS4; | 68 | | #else | 69 | | #error Invalid STRINGLIB_SIZEOF_CHAR (must be 1, 2 or 4) | 70 | | #endif | 71 | 31.2M | Py_UCS4 mask; | 72 | 31.2M | Py_ssize_t n = end - begin; | 73 | 31.2M | const STRINGLIB_CHAR *p = begin; | 74 | 31.2M | const STRINGLIB_CHAR *unrolled_end = begin + _Py_SIZE_ROUND_DOWN(n, 4); | 75 | 31.2M | Py_UCS4 max_char; | 76 | | | 77 | 31.2M | max_char = MAX_CHAR_ASCII; | 78 | 31.2M | mask = MASK_ASCII; | 79 | 1.04G | while (p < unrolled_end) { | 80 | 1.03G | STRINGLIB_CHAR bits = p[0] | p[1] | p[2] | p[3]; | 81 | 1.03G | if (bits & mask) { | 82 | 33.7M | if (mask == mask_limit) { | 83 | | /* Limit reached */ | 84 | 16.8M | return max_char_limit; | 85 | 16.8M | } | 86 | 16.8M | if (mask == MASK_ASCII) { | 87 | 16.8M | max_char = MAX_CHAR_UCS1; | 88 | 16.8M | mask = MASK_UCS1; | 89 | 16.8M | } | 90 | 0 | else { | 91 | | /* mask can't be MASK_UCS2 because of mask_limit above */ | 92 | 0 | assert(mask == MASK_UCS1); | 93 | 0 | max_char = MAX_CHAR_UCS2; | 94 | 0 | mask = MASK_UCS2; | 95 | 0 | } | 96 | | /* We check the new mask on the same chars in the next iteration */ | 97 | 16.8M | continue; | 98 | 33.7M | } | 99 | 1.00G | p += 4; | 100 | 1.00G | } | 101 | 41.2M | while (p < end) { | 102 | 27.8M | if (p[0] & mask) { | 103 | 2.29M | if (mask == mask_limit) { | 104 | | /* Limit reached */ | 105 | 1.12M | return max_char_limit; | 106 | 1.12M | } | 107 | 1.17M | if (mask == MASK_ASCII) { | 108 | 1.17M | max_char = MAX_CHAR_UCS1; | 109 | 1.17M | mask = MASK_UCS1; | 110 | 1.17M | } | 111 | 0 | else { | 112 | | /* mask can't be MASK_UCS2 because of mask_limit above */ | 113 | 0 | assert(mask == MASK_UCS1); | 114 | 0 | max_char = MAX_CHAR_UCS2; | 115 | 0 | mask = MASK_UCS2; | 116 | 0 | } | 117 | | /* We check the new mask on the same chars in the next iteration */ | 118 | 1.17M | continue; | 119 | 2.29M | } | 120 | 25.5M | p++; | 121 | 25.5M | } | 122 | 13.3M | return max_char; | 123 | 14.4M | } |
|
124 | | |
125 | | #undef MASK_ASCII |
126 | | #undef MASK_UCS1 |
127 | | #undef MASK_UCS2 |
128 | | #undef MAX_CHAR_ASCII |
129 | | #undef MAX_CHAR_UCS1 |
130 | | #undef MAX_CHAR_UCS2 |
131 | | #undef MAX_CHAR_UCS4 |
132 | | |
133 | | #endif /* STRINGLIB_SIZEOF_CHAR == 1 */ |
134 | | |