/src/php-src/ext/standard/strnatcmp.c
Line | Count | Source |
1 | | /* |
2 | | |
3 | | Modified for PHP by Andrei Zmievski <andrei@ispi.net> |
4 | | |
5 | | strnatcmp.c -- Perform 'natural order' comparisons of strings in C. |
6 | | Copyright (C) 2000 by Martin Pool <mbp@humbug.org.au> |
7 | | |
8 | | This software is provided 'as-is', without any express or implied |
9 | | warranty. In no event will the authors be held liable for any damages |
10 | | arising from the use of this software. |
11 | | |
12 | | Permission is granted to anyone to use this software for any purpose, |
13 | | including commercial applications, and to alter it and redistribute it |
14 | | freely, subject to the following restrictions: |
15 | | |
16 | | 1. The origin of this software must not be misrepresented; you must not |
17 | | claim that you wrote the original software. If you use this software |
18 | | in a product, an acknowledgment in the product documentation would be |
19 | | appreciated but is not required. |
20 | | 2. Altered source versions must be plainly marked as such, and must not be |
21 | | misrepresented as being the original software. |
22 | | 3. This notice may not be removed or altered from any source distribution. |
23 | | */ |
24 | | |
25 | | #include <ctype.h> |
26 | | #include <string.h> |
27 | | #include <stdio.h> |
28 | | |
29 | | #include "php.h" |
30 | | #include "php_string.h" |
31 | | |
/* {{{ compare_right */
/*
 * Compare two right-aligned runs of digits.
 *
 * a, b        in/out cursors; each is advanced one byte per loop iteration
 *             and is left where the scan stopped
 * aend, bend  one-past-the-end pointers for the respective strings
 *
 * The longer run of digits wins outright. If both runs end at the same
 * step, the first differing digit seen along the way decides. Returns -1,
 * 0 or +1.
 */
static int
compare_right(char const **a, char const *aend, char const **b, char const *bend)
{
	/* Outcome of the first differing digit pair; only used if both runs
	   turn out to have the same length. */
	int verdict = 0;

	while (1) {
		int a_has_digit = (*a != aend) && isdigit((unsigned char)**a);
		int b_has_digit = (*b != bend) && isdigit((unsigned char)**b);

		if (!a_has_digit) {
			/* a's run is over: a tie in length falls back to the
			   remembered verdict, otherwise b is the longer number. */
			return b_has_digit ? -1 : verdict;
		}
		if (!b_has_digit) {
			/* Only b's run is over, so a is the longer number. */
			return +1;
		}

		if (verdict == 0 && **a != **b) {
			verdict = (**a < **b) ? -1 : +1;
		}

		(*a)++;
		(*b)++;
	}
}
/* }}} */
62 | | |
/* {{{ compare_left */
/*
 * Compare two left-aligned runs of digits.
 *
 * a, b        in/out cursors; each is advanced one byte per loop iteration
 *             and is left where the scan stopped
 * aend, bend  one-past-the-end pointers for the respective strings
 *
 * The first position at which the runs differ decides the result. If one
 * run ends before any difference is found, the shorter run sorts first.
 * Returns -1, 0 or +1.
 */
static int
compare_left(char const **a, char const *aend, char const **b, char const *bend)
{
	while (1) {
		int a_has_digit = (*a != aend) && isdigit((unsigned char)**a);
		int b_has_digit = (*b != bend) && isdigit((unsigned char)**b);

		if (!a_has_digit) {
			/* Both runs ended together: equal. Otherwise a is shorter. */
			return b_has_digit ? -1 : 0;
		}
		if (!b_has_digit) {
			return +1;
		}

		if (**a != **b) {
			return (**a < **b) ? -1 : +1;
		}

		(*a)++;
		(*b)++;
	}
}
/* }}} */
86 | | |
87 | | /* {{{ strnatcmp_ex */ |
88 | | PHPAPI int strnatcmp_ex(char const *a, size_t a_len, char const *b, size_t b_len, bool is_case_insensitive) |
89 | 24.4k | { |
90 | 24.4k | unsigned char ca, cb; |
91 | 24.4k | char const *ap, *bp; |
92 | 24.4k | char const *aend = a + a_len, |
93 | 24.4k | *bend = b + b_len; |
94 | 24.4k | int fractional, result; |
95 | | |
96 | 24.4k | if (a_len == 0 || b_len == 0) { |
97 | 1.48k | return (a_len == b_len ? 0 : (a_len > b_len ? 1 : -1)); |
98 | 1.48k | } |
99 | | |
100 | 23.0k | ap = a; |
101 | 23.0k | bp = b; |
102 | | |
103 | 23.0k | ca = *ap; cb = *bp; |
104 | | |
105 | | /* skip over leading zeros */ |
106 | 23.5k | while (ca == '0' && (ap+1 < aend) && isdigit((unsigned char)ap[1])) { |
107 | 498 | ca = *++ap; |
108 | 498 | } |
109 | | |
110 | 23.1k | while (cb == '0' && (bp+1 < bend) && isdigit((unsigned char)bp[1])) { |
111 | 120 | cb = *++bp; |
112 | 120 | } |
113 | | |
114 | 244k | while (1) { |
115 | | |
116 | | /* Skip consecutive whitespace */ |
117 | 244k | while (isspace(ca)) { |
118 | 32.0k | ca = *++ap; |
119 | 32.0k | } |
120 | | |
121 | 244k | while (isspace(cb)) { |
122 | 32.1k | cb = *++bp; |
123 | 32.1k | } |
124 | | |
125 | | /* process run of digits */ |
126 | 244k | if (isdigit(ca) && isdigit(cb)) { |
127 | 3.50k | fractional = (ca == '0' || cb == '0'); |
128 | | |
129 | 3.50k | if (fractional) |
130 | 1.14k | result = compare_left(&ap, aend, &bp, bend); |
131 | 2.36k | else |
132 | 2.36k | result = compare_right(&ap, aend, &bp, bend); |
133 | | |
134 | 3.50k | if (result != 0) |
135 | 2.09k | return result; |
136 | 1.40k | else if (ap == aend && bp == bend) |
137 | | /* End of the strings. Let caller sort them out. */ |
138 | 97 | return 0; |
139 | 1.31k | else if (ap == aend) |
140 | 3 | return -1; |
141 | 1.30k | else if (bp == bend) |
142 | 6 | return 1; |
143 | 1.30k | else { |
144 | | /* Keep on comparing from the current point. */ |
145 | 1.30k | ca = *ap; cb = *bp; |
146 | 1.30k | } |
147 | 3.50k | } |
148 | | |
149 | 242k | if (is_case_insensitive) { |
150 | 0 | ca = toupper(ca); |
151 | 0 | cb = toupper(cb); |
152 | 0 | } |
153 | | |
154 | 242k | if (ca < cb) |
155 | 5.20k | return -1; |
156 | 237k | else if (ca > cb) |
157 | 11.5k | return +1; |
158 | | |
159 | 225k | ++ap; ++bp; |
160 | 225k | if (ap >= aend && bp >= bend) |
161 | | /* The strings compare the same. Perhaps the caller |
162 | | will want to call strcmp to break the tie. */ |
163 | 3.15k | return 0; |
164 | 222k | else if (ap >= aend) |
165 | 229 | return -1; |
166 | 222k | else if (bp >= bend) |
167 | 649 | return 1; |
168 | | |
169 | 221k | ca = *ap; cb = *bp; |
170 | 221k | } |
171 | 23.0k | } |
172 | | /* }}} */ |