1 /*- 2 * Copyright (c) 2003-2007 Tim Kientzle 3 * All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution. 13 * 14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR 15 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 16 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 17 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT, 18 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 19 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 20 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 21 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 23 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 24 */ 25 #include "test.h" 26 27 #define __LIBARCHIVE_TEST 28 #include "archive_pathmatch.h" 29 30 /* 31 * Verify that the pattern matcher implements the wildcard logic specified 32 * in SUSv2 for the cpio command. This is essentially the 33 * shell glob syntax: 34 * * - matches any sequence of chars, including '/' 35 * ? - matches any single char, including '/' 36 * [...] - matches any of a set of chars, '-' specifies a range, 37 * initial '!' is undefined 38 * 39 * The specification in SUSv2 is a bit incomplete, I assume the following: 40 * Trailing '-' in [...] is not special. 41 * 42 * TODO: Figure out if there's a good way to extend this to handle 43 * Windows paths that use '\' as a path separator. <sigh> 44 */ 45 46 DEFINE_TEST(test_archive_pathmatch) 47 { 48 assertEqualInt(1, archive_pathmatch("a/b/c", "a/b/c", 0)); 49 assertEqualInt(0, archive_pathmatch("a/b/", "a/b/c", 0)); 50 assertEqualInt(0, archive_pathmatch("a/b", "a/b/c", 0)); 51 assertEqualInt(0, archive_pathmatch("a/b/c", "a/b/", 0)); 52 assertEqualInt(0, archive_pathmatch("a/b/c", "a/b", 0)); 53 54 /* Null string and non-empty pattern returns false. */ 55 assertEqualInt(0, archive_pathmatch("a/b/c", NULL, 0)); 56 assertEqualInt(0, archive_pathmatch_w(L"a/b/c", NULL, 0)); 57 58 /* Empty pattern only matches empty string. */ 59 assertEqualInt(1, archive_pathmatch("","", 0)); 60 assertEqualInt(0, archive_pathmatch("","a", 0)); 61 assertEqualInt(1, archive_pathmatch("*","", 0)); 62 assertEqualInt(1, archive_pathmatch("*","a", 0)); 63 assertEqualInt(1, archive_pathmatch("*","abcd", 0)); 64 /* SUSv2: * matches / */ 65 assertEqualInt(1, archive_pathmatch("*","abcd/efgh/ijkl", 0)); 66 assertEqualInt(1, archive_pathmatch("abcd*efgh/ijkl","abcd/efgh/ijkl", 0)); 67 assertEqualInt(1, archive_pathmatch("abcd***efgh/ijkl","abcd/efgh/ijkl", 0)); 68 assertEqualInt(1, archive_pathmatch("abcd***/efgh/ijkl","abcd/efgh/ijkl", 0)); 69 assertEqualInt(0, archive_pathmatch("?", "", 0)); 70 assertEqualInt(0, archive_pathmatch("?", "\0", 0)); 71 assertEqualInt(1, archive_pathmatch("?", "a", 0)); 72 assertEqualInt(0, archive_pathmatch("?", "ab", 0)); 73 assertEqualInt(1, archive_pathmatch("?", ".", 0)); 74 assertEqualInt(1, archive_pathmatch("?", "?", 0)); 75 assertEqualInt(1, archive_pathmatch("a", "a", 0)); 76 assertEqualInt(0, archive_pathmatch("a", "ab", 0)); 77 assertEqualInt(0, archive_pathmatch("a", "ab", 0)); 78 assertEqualInt(1, archive_pathmatch("a?c", "abc", 0)); 79 /* SUSv2: ? matches / */ 80 assertEqualInt(1, archive_pathmatch("a?c", "a/c", 0)); 81 assertEqualInt(1, archive_pathmatch("a?*c*", "a/c", 0)); 82 assertEqualInt(1, archive_pathmatch("*a*", "a/c", 0)); 83 assertEqualInt(1, archive_pathmatch("*a*", "/a/c", 0)); 84 assertEqualInt(1, archive_pathmatch("*a*", "defaaaaaaa", 0)); 85 assertEqualInt(0, archive_pathmatch("a*", "defghi", 0)); 86 assertEqualInt(0, archive_pathmatch("*a*", "defghi", 0)); 87 88 /* Character classes */ 89 assertEqualInt(1, archive_pathmatch("abc[def", "abc[def", 0)); 90 assertEqualInt(0, archive_pathmatch("abc[def]", "abc[def", 0)); 91 assertEqualInt(0, archive_pathmatch("abc[def", "abcd", 0)); 92 assertEqualInt(1, archive_pathmatch("abc[def]", "abcd", 0)); 93 assertEqualInt(1, archive_pathmatch("abc[def]", "abce", 0)); 94 assertEqualInt(1, archive_pathmatch("abc[def]", "abcf", 0)); 95 assertEqualInt(0, archive_pathmatch("abc[def]", "abcg", 0)); 96 assertEqualInt(1, archive_pathmatch("abc[d*f]", "abcd", 0)); 97 assertEqualInt(1, archive_pathmatch("abc[d*f]", "abc*", 0)); 98 assertEqualInt(0, archive_pathmatch("abc[d*f]", "abcdefghi", 0)); 99 assertEqualInt(0, archive_pathmatch("abc[d*", "abcdefghi", 0)); 100 assertEqualInt(1, archive_pathmatch("abc[d*", "abc[defghi", 0)); 101 assertEqualInt(1, archive_pathmatch("abc[d-f]", "abcd", 0)); 102 assertEqualInt(1, archive_pathmatch("abc[d-f]", "abce", 0)); 103 assertEqualInt(1, archive_pathmatch("abc[d-f]", "abcf", 0)); 104 assertEqualInt(0, archive_pathmatch("abc[d-f]", "abcg", 0)); 105 assertEqualInt(0, archive_pathmatch("abc[d-fh-k]", "abca", 0)); 106 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abcd", 0)); 107 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abce", 0)); 108 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abcf", 0)); 109 assertEqualInt(0, archive_pathmatch("abc[d-fh-k]", "abcg", 0)); 110 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abch", 0)); 111 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abci", 0)); 112 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abcj", 0)); 113 assertEqualInt(1, archive_pathmatch("abc[d-fh-k]", "abck", 0)); 114 assertEqualInt(0, archive_pathmatch("abc[d-fh-k]", "abcl", 0)); 115 assertEqualInt(0, archive_pathmatch("abc[d-fh-k]", "abc-", 0)); 116 117 /* [] matches nothing, [!] is the same as ? */ 118 assertEqualInt(0, archive_pathmatch("abc[]efg", "abcdefg", 0)); 119 assertEqualInt(0, archive_pathmatch("abc[]efg", "abcqefg", 0)); 120 assertEqualInt(0, archive_pathmatch("abc[]efg", "abcefg", 0)); 121 assertEqualInt(1, archive_pathmatch("abc[!]efg", "abcdefg", 0)); 122 assertEqualInt(1, archive_pathmatch("abc[!]efg", "abcqefg", 0)); 123 assertEqualInt(0, archive_pathmatch("abc[!]efg", "abcefg", 0)); 124 125 /* I assume: Trailing '-' is non-special. */ 126 assertEqualInt(0, archive_pathmatch("abc[d-fh-]", "abcl", 0)); 127 assertEqualInt(1, archive_pathmatch("abc[d-fh-]", "abch", 0)); 128 assertEqualInt(1, archive_pathmatch("abc[d-fh-]", "abc-", 0)); 129 assertEqualInt(1, archive_pathmatch("abc[d-fh-]", "abc-", 0)); 130 131 /* ']' can be backslash-quoted within a character class. */ 132 assertEqualInt(1, archive_pathmatch("abc[\\]]", "abc]", 0)); 133 assertEqualInt(1, archive_pathmatch("abc[\\]d]", "abc]", 0)); 134 assertEqualInt(1, archive_pathmatch("abc[\\]d]", "abcd", 0)); 135 assertEqualInt(1, archive_pathmatch("abc[d\\]]", "abc]", 0)); 136 assertEqualInt(1, archive_pathmatch("abc[d\\]]", "abcd", 0)); 137 assertEqualInt(1, archive_pathmatch("abc[d]e]", "abcde]", 0)); 138 assertEqualInt(1, archive_pathmatch("abc[d\\]e]", "abc]", 0)); 139 assertEqualInt(0, archive_pathmatch("abc[d\\]e]", "abcd]e", 0)); 140 assertEqualInt(0, archive_pathmatch("abc[d]e]", "abc]", 0)); 141 142 /* backslash-quoted chars can appear as either end of a range. */ 143 assertEqualInt(1, archive_pathmatch("abc[\\d-f]gh", "abcegh", 0)); 144 assertEqualInt(0, archive_pathmatch("abc[\\d-f]gh", "abcggh", 0)); 145 assertEqualInt(0, archive_pathmatch("abc[\\d-f]gh", "abc\\gh", 0)); 146 assertEqualInt(1, archive_pathmatch("abc[d-\\f]gh", "abcegh", 0)); 147 assertEqualInt(1, archive_pathmatch("abc[\\d-\\f]gh", "abcegh", 0)); 148 assertEqualInt(1, archive_pathmatch("abc[\\d-\\f]gh", "abcegh", 0)); 149 /* backslash-quoted '-' isn't special. */ 150 assertEqualInt(0, archive_pathmatch("abc[d\\-f]gh", "abcegh", 0)); 151 assertEqualInt(1, archive_pathmatch("abc[d\\-f]gh", "abc-gh", 0)); 152 153 /* Leading '!' negates a character class. */ 154 assertEqualInt(0, archive_pathmatch("abc[!d]", "abcd", 0)); 155 assertEqualInt(1, archive_pathmatch("abc[!d]", "abce", 0)); 156 assertEqualInt(1, archive_pathmatch("abc[!d]", "abcc", 0)); 157 assertEqualInt(0, archive_pathmatch("abc[!d-z]", "abcq", 0)); 158 assertEqualInt(1, archive_pathmatch("abc[!d-gi-z]", "abch", 0)); 159 assertEqualInt(1, archive_pathmatch("abc[!fgijkl]", "abch", 0)); 160 assertEqualInt(0, archive_pathmatch("abc[!fghijkl]", "abch", 0)); 161 162 /* Backslash quotes next character. */ 163 assertEqualInt(0, archive_pathmatch("abc\\[def]", "abc\\d", 0)); 164 assertEqualInt(1, archive_pathmatch("abc\\[def]", "abc[def]", 0)); 165 assertEqualInt(0, archive_pathmatch("abc\\\\[def]", "abc[def]", 0)); 166 assertEqualInt(0, archive_pathmatch("abc\\\\[def]", "abc\\[def]", 0)); 167 assertEqualInt(1, archive_pathmatch("abc\\\\[def]", "abc\\d", 0)); 168 assertEqualInt(1, archive_pathmatch("abcd\\", "abcd\\", 0)); 169 assertEqualInt(0, archive_pathmatch("abcd\\", "abcd\\[", 0)); 170 assertEqualInt(0, archive_pathmatch("abcd\\", "abcde", 0)); 171 assertEqualInt(0, archive_pathmatch("abcd\\[", "abcd\\", 0)); 172 173 /* 174 * Because '.' and '/' have special meanings, we can 175 * identify many equivalent paths even if they're expressed 176 * differently. (But quoting a character with '\\' suppresses 177 * special meanings!) 178 */ 179 assertEqualInt(0, archive_pathmatch("a/b/", "a/bc", 0)); 180 assertEqualInt(1, archive_pathmatch("a/./b", "a/b", 0)); 181 assertEqualInt(0, archive_pathmatch("a\\/./b", "a/b", 0)); 182 assertEqualInt(0, archive_pathmatch("a/\\./b", "a/b", 0)); 183 assertEqualInt(0, archive_pathmatch("a/.\\/b", "a/b", 0)); 184 assertEqualInt(0, archive_pathmatch("a\\/\\.\\/b", "a/b", 0)); 185 assertEqualInt(1, archive_pathmatch("./abc/./def/", "abc/def/", 0)); 186 assertEqualInt(1, archive_pathmatch("abc/def", "./././abc/./def", 0)); 187 assertEqualInt(1, archive_pathmatch("abc/def/././//", "./././abc/./def/", 0)); 188 assertEqualInt(1, archive_pathmatch(".////abc/.//def", "./././abc/./def", 0)); 189 assertEqualInt(1, archive_pathmatch("./abc?def/", "abc/def/", 0)); 190 failure("\"?./\" is not the same as \"/./\""); 191 assertEqualInt(0, archive_pathmatch("./abc?./def/", "abc/def/", 0)); 192 failure("Trailing '/' should match no trailing '/'"); 193 assertEqualInt(1, archive_pathmatch("./abc/./def/", "abc/def", 0)); 194 failure("Trailing '/./' is still the same directory."); 195 assertEqualInt(1, archive_pathmatch("./abc/./def/./", "abc/def", 0)); 196 failure("Trailing '/.' is still the same directory."); 197 assertEqualInt(1, archive_pathmatch("./abc/./def/.", "abc/def", 0)); 198 assertEqualInt(1, archive_pathmatch("./abc/./def", "abc/def/", 0)); 199 failure("Trailing '/./' is still the same directory."); 200 assertEqualInt(1, archive_pathmatch("./abc/./def", "abc/def/./", 0)); 201 failure("Trailing '/.' is still the same directory."); 202 assertEqualInt(1, archive_pathmatch("./abc*/./def", "abc/def/.", 0)); 203 204 /* Matches not anchored at beginning. */ 205 assertEqualInt(0, 206 archive_pathmatch("bcd", "abcd", PATHMATCH_NO_ANCHOR_START)); 207 assertEqualInt(1, 208 archive_pathmatch("abcd", "abcd", PATHMATCH_NO_ANCHOR_START)); 209 assertEqualInt(0, 210 archive_pathmatch("^bcd", "abcd", PATHMATCH_NO_ANCHOR_START)); 211 assertEqualInt(1, 212 archive_pathmatch("b/c/d", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 213 assertEqualInt(0, 214 archive_pathmatch("^b/c/d", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 215 assertEqualInt(0, 216 archive_pathmatch("/b/c/d", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 217 assertEqualInt(0, 218 archive_pathmatch("a/b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 219 assertEqualInt(1, 220 archive_pathmatch("a/b/c/d", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 221 assertEqualInt(0, 222 archive_pathmatch("b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 223 assertEqualInt(0, 224 archive_pathmatch("^b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 225 226 227 assertEqualInt(1, 228 archive_pathmatch("b/c/d", "a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 229 assertEqualInt(1, 230 archive_pathmatch("b/c/d", "/a/b/c/d", PATHMATCH_NO_ANCHOR_START)); 231 232 233 /* Matches not anchored at end. */ 234 assertEqualInt(0, 235 archive_pathmatch("bcd", "abcd", PATHMATCH_NO_ANCHOR_END)); 236 assertEqualInt(1, 237 archive_pathmatch("abcd", "abcd", PATHMATCH_NO_ANCHOR_END)); 238 assertEqualInt(1, 239 archive_pathmatch("abcd", "abcd/", PATHMATCH_NO_ANCHOR_END)); 240 assertEqualInt(1, 241 archive_pathmatch("abcd", "abcd/.", PATHMATCH_NO_ANCHOR_END)); 242 assertEqualInt(0, 243 archive_pathmatch("abc", "abcd", PATHMATCH_NO_ANCHOR_END)); 244 assertEqualInt(1, 245 archive_pathmatch("a/b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_END)); 246 assertEqualInt(0, 247 archive_pathmatch("a/b/c$", "a/b/c/d", PATHMATCH_NO_ANCHOR_END)); 248 assertEqualInt(1, 249 archive_pathmatch("a/b/c$", "a/b/c", PATHMATCH_NO_ANCHOR_END)); 250 assertEqualInt(1, 251 archive_pathmatch("a/b/c$", "a/b/c/", PATHMATCH_NO_ANCHOR_END)); 252 assertEqualInt(1, 253 archive_pathmatch("a/b/c/", "a/b/c/d", PATHMATCH_NO_ANCHOR_END)); 254 assertEqualInt(0, 255 archive_pathmatch("a/b/c/$", "a/b/c/d", PATHMATCH_NO_ANCHOR_END)); 256 assertEqualInt(1, 257 archive_pathmatch("a/b/c/$", "a/b/c/", PATHMATCH_NO_ANCHOR_END)); 258 assertEqualInt(1, 259 archive_pathmatch("a/b/c/$", "a/b/c", PATHMATCH_NO_ANCHOR_END)); 260 assertEqualInt(0, 261 archive_pathmatch("b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_END)); 262 263 /* Matches not anchored at either end. */ 264 assertEqualInt(1, 265 archive_pathmatch("b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 266 assertEqualInt(0, 267 archive_pathmatch("/b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 268 assertEqualInt(0, 269 archive_pathmatch("/a/b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 270 assertEqualInt(1, 271 archive_pathmatch("/a/b/c", "/a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 272 assertEqualInt(0, 273 archive_pathmatch("/a/b/c$", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 274 assertEqualInt(0, 275 archive_pathmatch("/a/b/c/d$", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 276 assertEqualInt(0, 277 archive_pathmatch("/a/b/c/d$", "/a/b/c/d/e", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 278 assertEqualInt(1, 279 archive_pathmatch("/a/b/c/d$", "/a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 280 assertEqualInt(1, 281 archive_pathmatch("^a/b/c", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 282 assertEqualInt(0, 283 archive_pathmatch("^a/b/c$", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 284 assertEqualInt(0, 285 archive_pathmatch("a/b/c$", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 286 assertEqualInt(1, 287 archive_pathmatch("b/c/d$", "a/b/c/d", PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END)); 288 } 289