/src/php-src/ext/standard/strnatcmp.c
Line | Count | Source |
1 | | /* |
2 | | |
3 | | Modified for PHP by Andrei Zmievski <andrei@ispi.net> |
4 | | |
5 | | strnatcmp.c -- Perform 'natural order' comparisons of strings in C. |
6 | | Copyright (C) 2000 by Martin Pool <mbp@humbug.org.au> |
7 | | |
8 | | This software is provided 'as-is', without any express or implied |
9 | | warranty. In no event will the authors be held liable for any damages |
10 | | arising from the use of this software. |
11 | | |
12 | | Permission is granted to anyone to use this software for any purpose, |
13 | | including commercial applications, and to alter it and redistribute it |
14 | | freely, subject to the following restrictions: |
15 | | |
16 | | 1. The origin of this software must not be misrepresented; you must not |
17 | | claim that you wrote the original software. If you use this software |
18 | | in a product, an acknowledgment in the product documentation would be |
19 | | appreciated but is not required. |
20 | | 2. Altered source versions must be plainly marked as such, and must not be |
21 | | misrepresented as being the original software. |
22 | | 3. This notice may not be removed or altered from any source distribution. |
23 | | */ |
24 | | |
25 | | #include <ctype.h> |
26 | | #include <string.h> |
27 | | #include <stdio.h> |
28 | | |
29 | | #include "php.h" |
30 | | #include "php_string.h" |
31 | | |
32 | | /* {{{ compare_right */ |
/*
 * Compare two right-aligned digit runs starting at *a and *b.
 *
 * Both cursors are advanced in lock-step while each still points at a digit
 * inside its own bounds (aend / bend are one-past-the-end pointers).  The run
 * that keeps going after the other has stopped is the larger number.  If both
 * runs stop at the same time they have equal length, and the outcome is the
 * ordering of the first digit pair that differed (0 if none did).
 *
 * Returns -1, 0 or +1.  On return *a and *b are left where scanning stopped.
 */
static int
compare_right(char const **a, char const *aend, char const **b, char const *bend)
{
	/* Ordering of the first differing digit pair; only decisive if the
	   two runs turn out to have the same length. */
	int pending = 0;

	while (1) {
		const int a_has_digit = (*a != aend) && isdigit((unsigned char)**a);
		const int b_has_digit = (*b != bend) && isdigit((unsigned char)**b);

		if (!a_has_digit) {
			/* a's run is over: equal length -> remembered ordering,
			   otherwise b is longer and therefore larger. */
			return b_has_digit ? -1 : pending;
		}
		if (!b_has_digit) {
			/* a still has digits while b does not: a is longer. */
			return +1;
		}

		if (pending == 0 && **a != **b) {
			pending = (**a < **b) ? -1 : +1;
		}

		++*a;
		++*b;
	}
}
61 | | /* }}} */ |
62 | | |
63 | | /* {{{ compare_left */ |
/*
 * Compare two left-aligned digit runs starting at *a and *b.
 *
 * Digits are compared pairwise from the left and the first difference
 * decides the result.  If one run ends (non-digit or end of buffer) before
 * any difference is seen, the run that ended first is the smaller one; if
 * both end together the runs are equal.
 *
 * aend / bend are one-past-the-end pointers.  Returns -1, 0 or +1.  On
 * return *a and *b are left where scanning stopped.
 */
static int
compare_left(char const **a, char const *aend, char const **b, char const *bend)
{
	while (1) {
		const int a_has_digit = (*a != aend) && isdigit((unsigned char)**a);
		const int b_has_digit = (*b != bend) && isdigit((unsigned char)**b);

		if (!a_has_digit) {
			/* Both finished -> equal; only a finished -> a is smaller. */
			return b_has_digit ? -1 : 0;
		}
		if (!b_has_digit) {
			return +1;
		}

		if (**a != **b) {
			/* First differing digit settles it. */
			return (**a < **b) ? -1 : +1;
		}

		++*a;
		++*b;
	}
}
85 | | /* }}} */ |
86 | | |
87 | | /* {{{ strnatcmp_ex */ |
88 | | PHPAPI int strnatcmp_ex(char const *a, size_t a_len, char const *b, size_t b_len, bool is_case_insensitive) |
89 | 9.04k | { |
90 | 9.04k | unsigned char ca, cb; |
91 | 9.04k | char const *ap, *bp; |
92 | 9.04k | char const *aend = a + a_len, |
93 | 9.04k | *bend = b + b_len; |
94 | 9.04k | int fractional, result; |
95 | | |
96 | 9.04k | if (a_len == 0 || b_len == 0) { |
97 | 960 | return (a_len == b_len ? 0 : (a_len > b_len ? 1 : -1)); |
98 | 960 | } |
99 | | |
100 | 8.08k | ap = a; |
101 | 8.08k | bp = b; |
102 | | |
103 | 8.08k | ca = *ap; cb = *bp; |
104 | | |
105 | | /* skip over leading zeros */ |
106 | 8.08k | while (ca == '0' && (ap+1 < aend) && isdigit((unsigned char)ap[1])) { |
107 | 0 | ca = *++ap; |
108 | 0 | } |
109 | | |
110 | 8.08k | while (cb == '0' && (bp+1 < bend) && isdigit((unsigned char)bp[1])) { |
111 | 0 | cb = *++bp; |
112 | 0 | } |
113 | | |
114 | 87.7k | while (1) { |
115 | | |
116 | | /* Skip consecutive whitespace */ |
117 | 87.7k | while (isspace(ca)) { |
118 | 14.0k | ca = *++ap; |
119 | 14.0k | } |
120 | | |
121 | 87.7k | while (isspace(cb)) { |
122 | 13.8k | cb = *++bp; |
123 | 13.8k | } |
124 | | |
125 | | /* process run of digits */ |
126 | 87.7k | if (isdigit(ca) && isdigit(cb)) { |
127 | 1.54k | fractional = (ca == '0' || cb == '0'); |
128 | | |
129 | 1.54k | if (fractional) |
130 | 978 | result = compare_left(&ap, aend, &bp, bend); |
131 | 564 | else |
132 | 564 | result = compare_right(&ap, aend, &bp, bend); |
133 | | |
134 | 1.54k | if (result != 0) |
135 | 690 | return result; |
136 | 852 | else if (ap == aend && bp == bend) |
137 | | /* End of the strings. Let caller sort them out. */ |
138 | 94 | return 0; |
139 | 758 | else if (ap == aend) |
140 | 0 | return -1; |
141 | 758 | else if (bp == bend) |
142 | 0 | return 1; |
143 | 758 | else { |
144 | | /* Keep on comparing from the current point. */ |
145 | 758 | ca = *ap; cb = *bp; |
146 | 758 | } |
147 | 1.54k | } |
148 | | |
149 | 86.9k | if (is_case_insensitive) { |
150 | 0 | ca = toupper(ca); |
151 | 0 | cb = toupper(cb); |
152 | 0 | } |
153 | | |
154 | 86.9k | if (ca < cb) |
155 | 1.77k | return -1; |
156 | 85.1k | else if (ca > cb) |
157 | 3.68k | return +1; |
158 | | |
159 | 81.4k | ++ap; ++bp; |
160 | 81.4k | if (ap >= aend && bp >= bend) |
161 | | /* The strings compare the same. Perhaps the caller |
162 | | will want to call strcmp to break the tie. */ |
163 | 1.56k | return 0; |
164 | 79.8k | else if (ap >= aend) |
165 | 52 | return -1; |
166 | 79.8k | else if (bp >= bend) |
167 | 220 | return 1; |
168 | | |
169 | 79.6k | ca = *ap; cb = *bp; |
170 | 79.6k | } |
171 | 8.08k | } |
172 | | /* }}} */ |