1 /***************************************************************************
2  *                                  _   _ ____  _
3  *  Project                     ___| | | |  _ \| |
4  *                             / __| | | | |_) | |
5  *                            | (__| |_| |  _ <| |___
6  *                             \___|\___/|_| \_\_____|
7  *
8  * Copyright (C) 1998 - 2018, Daniel Stenberg, <daniel@haxx.se>, et al.
9  *
10  * This software is licensed as described in the file COPYING, which
11  * you should have received as part of this distribution. The terms
12  * are also available at https://curl.haxx.se/docs/copyright.html.
13  *
14  * You may opt to use, copy, modify, merge, publish, distribute and/or sell
15  * copies of the Software, and permit persons to whom the Software is
16  * furnished to do so, under the terms of the COPYING file.
17  *
18  * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
19  * KIND, either express or implied.
20  *
21  ***************************************************************************/
22 
23 #include "curl_setup.h"
24 
25 #include <curl/curl.h>
26 
27 #include "curl_fnmatch.h"
28 #include "curl_memory.h"
29 
30 /* The last #include file should be: */
31 #include "memdebug.h"
32 
33 #define CURLFNM_CHARSET_LEN (sizeof(char) * 256)
34 #define CURLFNM_CHSET_SIZE (CURLFNM_CHARSET_LEN + 15)
35 
36 #define CURLFNM_NEGATE  CURLFNM_CHARSET_LEN
37 
38 #define CURLFNM_ALNUM   (CURLFNM_CHARSET_LEN + 1)
39 #define CURLFNM_DIGIT   (CURLFNM_CHARSET_LEN + 2)
40 #define CURLFNM_XDIGIT  (CURLFNM_CHARSET_LEN + 3)
41 #define CURLFNM_ALPHA   (CURLFNM_CHARSET_LEN + 4)
42 #define CURLFNM_PRINT   (CURLFNM_CHARSET_LEN + 5)
43 #define CURLFNM_BLANK   (CURLFNM_CHARSET_LEN + 6)
44 #define CURLFNM_LOWER   (CURLFNM_CHARSET_LEN + 7)
45 #define CURLFNM_GRAPH   (CURLFNM_CHARSET_LEN + 8)
46 #define CURLFNM_SPACE   (CURLFNM_CHARSET_LEN + 9)
47 #define CURLFNM_UPPER   (CURLFNM_CHARSET_LEN + 10)
48 
49 typedef enum {
50   CURLFNM_LOOP_DEFAULT = 0,
51   CURLFNM_LOOP_BACKSLASH
52 } loop_state;
53 
54 typedef enum {
55   CURLFNM_SCHS_DEFAULT = 0,
56   CURLFNM_SCHS_MAYRANGE,
57   CURLFNM_SCHS_MAYRANGE2,
58   CURLFNM_SCHS_RIGHTBR,
59   CURLFNM_SCHS_RIGHTBRLEFTBR
60 } setcharset_state;
61 
62 typedef enum {
63   CURLFNM_PKW_INIT = 0,
64   CURLFNM_PKW_DDOT
65 } parsekey_state;
66 
67 #define SETCHARSET_OK     1
68 #define SETCHARSET_FAIL   0
69 
parsekeyword(unsigned char ** pattern,unsigned char * charset)70 static int parsekeyword(unsigned char **pattern, unsigned char *charset)
71 {
72   parsekey_state state = CURLFNM_PKW_INIT;
73 #define KEYLEN 10
74   char keyword[KEYLEN] = { 0 };
75   int found = FALSE;
76   int i;
77   unsigned char *p = *pattern;
78   for(i = 0; !found; i++) {
79     char c = *p++;
80     if(i >= KEYLEN)
81       return SETCHARSET_FAIL;
82     switch(state) {
83     case CURLFNM_PKW_INIT:
84       if(ISALPHA(c) && ISLOWER(c))
85         keyword[i] = c;
86       else if(c == ':')
87         state = CURLFNM_PKW_DDOT;
88       else
89         return 0;
90       break;
91     case CURLFNM_PKW_DDOT:
92       if(c == ']')
93         found = TRUE;
94       else
95         return SETCHARSET_FAIL;
96     }
97   }
98 #undef KEYLEN
99 
100   *pattern = p; /* move caller's pattern pointer */
101   if(strcmp(keyword, "digit") == 0)
102     charset[CURLFNM_DIGIT] = 1;
103   else if(strcmp(keyword, "alnum") == 0)
104     charset[CURLFNM_ALNUM] = 1;
105   else if(strcmp(keyword, "alpha") == 0)
106     charset[CURLFNM_ALPHA] = 1;
107   else if(strcmp(keyword, "xdigit") == 0)
108     charset[CURLFNM_XDIGIT] = 1;
109   else if(strcmp(keyword, "print") == 0)
110     charset[CURLFNM_PRINT] = 1;
111   else if(strcmp(keyword, "graph") == 0)
112     charset[CURLFNM_GRAPH] = 1;
113   else if(strcmp(keyword, "space") == 0)
114     charset[CURLFNM_SPACE] = 1;
115   else if(strcmp(keyword, "blank") == 0)
116     charset[CURLFNM_BLANK] = 1;
117   else if(strcmp(keyword, "upper") == 0)
118     charset[CURLFNM_UPPER] = 1;
119   else if(strcmp(keyword, "lower") == 0)
120     charset[CURLFNM_LOWER] = 1;
121   else
122     return SETCHARSET_FAIL;
123   return SETCHARSET_OK;
124 }
125 
126 /* returns 1 (true) if pattern is OK, 0 if is bad ("p" is pattern pointer) */
setcharset(unsigned char ** p,unsigned char * charset)127 static int setcharset(unsigned char **p, unsigned char *charset)
128 {
129   setcharset_state state = CURLFNM_SCHS_DEFAULT;
130   unsigned char rangestart = 0;
131   unsigned char lastchar   = 0;
132   bool something_found = FALSE;
133   unsigned char c;
134   for(;;) {
135     c = **p;
136     if(!c)
137       return SETCHARSET_FAIL;
138 
139     switch(state) {
140     case CURLFNM_SCHS_DEFAULT:
141       if(ISALNUM(c)) { /* ASCII value */
142         rangestart = c;
143         charset[c] = 1;
144         (*p)++;
145         state = CURLFNM_SCHS_MAYRANGE;
146         something_found = TRUE;
147       }
148       else if(c == ']') {
149         if(something_found)
150           return SETCHARSET_OK;
151         something_found = TRUE;
152         state = CURLFNM_SCHS_RIGHTBR;
153         charset[c] = 1;
154         (*p)++;
155       }
156       else if(c == '[') {
157         char c2 = *((*p) + 1);
158         if(c2 == ':') { /* there has to be a keyword */
159           (*p) += 2;
160           if(parsekeyword(p, charset)) {
161             state = CURLFNM_SCHS_DEFAULT;
162           }
163           else
164             return SETCHARSET_FAIL;
165         }
166         else {
167           charset[c] = 1;
168           (*p)++;
169         }
170         something_found = TRUE;
171       }
172       else if(c == '?' || c == '*') {
173         something_found = TRUE;
174         charset[c] = 1;
175         (*p)++;
176       }
177       else if(c == '^' || c == '!') {
178         if(!something_found) {
179           if(charset[CURLFNM_NEGATE]) {
180             charset[c] = 1;
181             something_found = TRUE;
182           }
183           else
184             charset[CURLFNM_NEGATE] = 1; /* negate charset */
185         }
186         else
187           charset[c] = 1;
188         (*p)++;
189       }
190       else if(c == '\\') {
191         c = *(++(*p));
192         if(ISPRINT((c))) {
193           something_found = TRUE;
194           state = CURLFNM_SCHS_MAYRANGE;
195           charset[c] = 1;
196           rangestart = c;
197           (*p)++;
198         }
199         else
200           return SETCHARSET_FAIL;
201       }
202       else {
203         charset[c] = 1;
204         (*p)++;
205         something_found = TRUE;
206       }
207       break;
208     case CURLFNM_SCHS_MAYRANGE:
209       if(c == '-') {
210         charset[c] = 1;
211         (*p)++;
212         lastchar = '-';
213         state = CURLFNM_SCHS_MAYRANGE2;
214       }
215       else if(c == '[') {
216         state = CURLFNM_SCHS_DEFAULT;
217       }
218       else if(ISALNUM(c)) {
219         charset[c] = 1;
220         (*p)++;
221       }
222       else if(c == '\\') {
223         c = *(++(*p));
224         if(ISPRINT(c)) {
225           charset[c] = 1;
226           (*p)++;
227         }
228         else
229           return SETCHARSET_FAIL;
230       }
231       else if(c == ']') {
232         return SETCHARSET_OK;
233       }
234       else
235         return SETCHARSET_FAIL;
236       break;
237     case CURLFNM_SCHS_MAYRANGE2:
238       if(c == ']') {
239         return SETCHARSET_OK;
240       }
241       else if(c == '\\') {
242         c = *(++(*p));
243         if(ISPRINT(c)) {
244           charset[c] = 1;
245           state = CURLFNM_SCHS_DEFAULT;
246           (*p)++;
247         }
248         else
249           return SETCHARSET_FAIL;
250       }
251       else if(c >= rangestart) {
252         if((ISLOWER(c) && ISLOWER(rangestart)) ||
253            (ISDIGIT(c) && ISDIGIT(rangestart)) ||
254            (ISUPPER(c) && ISUPPER(rangestart))) {
255           charset[lastchar] = 0;
256           rangestart++;
257           while(rangestart++ <= c)
258             charset[rangestart-1] = 1;
259           (*p)++;
260           state = CURLFNM_SCHS_DEFAULT;
261         }
262         else
263           return SETCHARSET_FAIL;
264       }
265       else
266         return SETCHARSET_FAIL;
267       break;
268     case CURLFNM_SCHS_RIGHTBR:
269       if(c == '[') {
270         state = CURLFNM_SCHS_RIGHTBRLEFTBR;
271         charset[c] = 1;
272         (*p)++;
273       }
274       else if(c == ']') {
275         return SETCHARSET_OK;
276       }
277       else if(ISPRINT(c)) {
278         charset[c] = 1;
279         (*p)++;
280         state = CURLFNM_SCHS_DEFAULT;
281       }
282       else
283         /* used 'goto fail' instead of 'return SETCHARSET_FAIL' to avoid a
284          * nonsense warning 'statement not reached' at end of the fnc when
285          * compiling on Solaris */
286         goto fail;
287       break;
288     case CURLFNM_SCHS_RIGHTBRLEFTBR:
289       if(c == ']') {
290         return SETCHARSET_OK;
291       }
292       else {
293         state  = CURLFNM_SCHS_DEFAULT;
294         charset[c] = 1;
295         (*p)++;
296       }
297       break;
298     }
299   }
300 fail:
301   return SETCHARSET_FAIL;
302 }
303 
loop(const unsigned char * pattern,const unsigned char * string,int maxstars)304 static int loop(const unsigned char *pattern, const unsigned char *string,
305                 int maxstars)
306 {
307   loop_state state = CURLFNM_LOOP_DEFAULT;
308   unsigned char *p = (unsigned char *)pattern;
309   unsigned char *s = (unsigned char *)string;
310   unsigned char charset[CURLFNM_CHSET_SIZE] = { 0 };
311   int rc = 0;
312 
313   for(;;) {
314     switch(state) {
315     case CURLFNM_LOOP_DEFAULT:
316       if(*p == '*') {
317         if(!maxstars)
318           return CURL_FNMATCH_NOMATCH;
319         while(*(p + 1) == '*') /* eliminate multiple stars */
320           p++;
321         if(*s == '\0' && *(p + 1) == '\0')
322           return CURL_FNMATCH_MATCH;
323         rc = loop(p + 1, s, maxstars - 1); /* *.txt matches .txt <=>
324                                               .txt matches .txt */
325         if(rc == CURL_FNMATCH_MATCH)
326           return CURL_FNMATCH_MATCH;
327         if(*s) /* let the star eat up one character */
328           s++;
329         else
330           return CURL_FNMATCH_NOMATCH;
331       }
332       else if(*p == '?') {
333         if(ISPRINT(*s)) {
334           s++;
335           p++;
336         }
337         else if(*s == '\0')
338           return CURL_FNMATCH_NOMATCH;
339         else
340           return CURL_FNMATCH_FAIL; /* cannot deal with other character */
341       }
342       else if(*p == '\0') {
343         if(*s == '\0')
344           return CURL_FNMATCH_MATCH;
345         return CURL_FNMATCH_NOMATCH;
346       }
347       else if(*p == '\\') {
348         state = CURLFNM_LOOP_BACKSLASH;
349         p++;
350       }
351       else if(*p == '[') {
352         unsigned char *pp = p + 1; /* cannot handle with pointer to register */
353         if(setcharset(&pp, charset)) {
354           int found = FALSE;
355           if(charset[(unsigned int)*s])
356             found = TRUE;
357           else if(charset[CURLFNM_ALNUM])
358             found = ISALNUM(*s);
359           else if(charset[CURLFNM_ALPHA])
360             found = ISALPHA(*s);
361           else if(charset[CURLFNM_DIGIT])
362             found = ISDIGIT(*s);
363           else if(charset[CURLFNM_XDIGIT])
364             found = ISXDIGIT(*s);
365           else if(charset[CURLFNM_PRINT])
366             found = ISPRINT(*s);
367           else if(charset[CURLFNM_SPACE])
368             found = ISSPACE(*s);
369           else if(charset[CURLFNM_UPPER])
370             found = ISUPPER(*s);
371           else if(charset[CURLFNM_LOWER])
372             found = ISLOWER(*s);
373           else if(charset[CURLFNM_BLANK])
374             found = ISBLANK(*s);
375           else if(charset[CURLFNM_GRAPH])
376             found = ISGRAPH(*s);
377 
378           if(charset[CURLFNM_NEGATE])
379             found = !found;
380 
381           if(found) {
382             p = pp + 1;
383             if(*s)
384               /* don't advance if we're matching on an empty string */
385               s++;
386             memset(charset, 0, CURLFNM_CHSET_SIZE);
387           }
388           else
389             return CURL_FNMATCH_NOMATCH;
390         }
391         else
392           return CURL_FNMATCH_FAIL;
393       }
394       else {
395         if(*p++ != *s++)
396           return CURL_FNMATCH_NOMATCH;
397       }
398       break;
399     case CURLFNM_LOOP_BACKSLASH:
400       if(ISPRINT(*p)) {
401         if(*p++ == *s++)
402           state = CURLFNM_LOOP_DEFAULT;
403         else
404           return CURL_FNMATCH_NOMATCH;
405       }
406       else
407         return CURL_FNMATCH_FAIL;
408       break;
409     }
410   }
411 }
412 
413 /*
414  * @unittest: 1307
415  */
Curl_fnmatch(void * ptr,const char * pattern,const char * string)416 int Curl_fnmatch(void *ptr, const char *pattern, const char *string)
417 {
418   (void)ptr; /* the argument is specified by the curl_fnmatch_callback
419                 prototype, but not used by Curl_fnmatch() */
420   if(!pattern || !string) {
421     return CURL_FNMATCH_FAIL;
422   }
423   return loop((unsigned char *)pattern, (unsigned char *)string, 5);
424 }
425