1 /* Create and destroy argument vectors (argv's)
2    Copyright (C) 1992, 2001, 2010, 2012 Free Software Foundation, Inc.
3    Written by Fred Fish @ Cygnus Support
4 
5 This file is part of the libiberty library.
6 Libiberty is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Library General Public
8 License as published by the Free Software Foundation; either
9 version 2 of the License, or (at your option) any later version.
10 
11 Libiberty is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 Library General Public License for more details.
15 
16 You should have received a copy of the GNU Library General Public
17 License along with libiberty; see the file COPYING.LIB.  If
18 not, write to the Free Software Foundation, Inc., 51 Franklin Street - Fifth Floor,
19 Boston, MA 02110-1301, USA.  */
20 
21 
22 /*  Create and destroy argument vectors.  An argument vector is simply an
23     array of string pointers, terminated by a NULL pointer. */
24 
25 #ifdef HAVE_CONFIG_H
26 #include "config.h"
27 #endif
28 #include "ansidecl.h"
29 #include "libiberty.h"
30 #include "safe-ctype.h"
31 
32 /*  Routines imported from standard C runtime libraries. */
33 
34 #include <stddef.h>
35 #include <string.h>
36 #include <stdlib.h>
37 #include <stdio.h>
38 
39 #ifndef NULL
40 #define NULL 0
41 #endif
42 
43 #ifndef EOS
44 #define EOS '\0'
45 #endif
46 
47 #define INITIAL_MAXARGC 8	/* Number of args + NULL in initial argv */
48 
49 
50 /*
51 
52 @deftypefn Extension char** dupargv (char **@var{vector})
53 
54 Duplicate an argument vector.  Simply scans through @var{vector},
55 duplicating each argument until the terminating @code{NULL} is found.
56 Returns a pointer to the argument vector if successful.  Returns
57 @code{NULL} if there is insufficient memory to complete building the
58 argument vector.
59 
60 @end deftypefn
61 
62 */
63 
/* Return a newly allocated deep copy of the NULL-terminated vector ARGV,
   or NULL when ARGV itself is NULL.  Both the pointer array and every
   string come from xmalloc, so the result can be released with
   freeargv.  */

char **
dupargv (char **argv)
{
  int argc;
  char **copy;

  if (argv == NULL)
    return NULL;

  /* The vector: count the entries, then allocate room for them plus
     the terminating NULL.  The arithmetic is done in size_t.  */
  for (argc = 0; argv[argc] != NULL; argc++)
    continue;
  copy = (char **) xmalloc (((size_t) argc + 1) * sizeof (char *));

  /* The strings.  The length is kept in a size_t (not an int) so that
     the allocation size can never be a truncated or negative value.  */
  for (argc = 0; argv[argc] != NULL; argc++)
    {
      size_t size = strlen (argv[argc]) + 1;

      copy[argc] = (char *) xmalloc (size);
      memcpy (copy[argc], argv[argc], size);
    }
  copy[argc] = NULL;
  return copy;
}
87 
88 /*
89 
90 @deftypefn Extension void freeargv (char **@var{vector})
91 
92 Free an argument vector that was built using @code{buildargv}.  Simply
93 scans through @var{vector}, freeing the memory for each argument until
94 the terminating @code{NULL} is found, and then frees @var{vector}
95 itself.
96 
97 @end deftypefn
98 
99 */
100 
/* Release every string stored in VECTOR up to its NULL terminator and
   then the pointer array itself.  A NULL VECTOR is accepted and
   ignored.  */

void
freeargv (char **vector)
{
  size_t idx;

  if (vector == NULL)
    return;

  idx = 0;
  while (vector[idx] != NULL)
    {
      free (vector[idx]);
      idx++;
    }

  free (vector);
}
114 
/* Advance *INPUT past any leading characters for which ISSPACE is
   true, leaving it on the first character that is not whitespace.  */

static void
consume_whitespace (const char **input)
{
  const char *cursor = *input;

  while (ISSPACE (*cursor))
    cursor++;

  *input = cursor;
}
123 
124 static int
only_whitespace(const char * input)125 only_whitespace (const char* input)
126 {
127   while (*input != EOS && ISSPACE (*input))
128     input++;
129 
130   return (*input == EOS);
131 }
132 
133 /*
134 
135 @deftypefn Extension char** buildargv (char *@var{sp})
136 
137 Given a pointer to a string, parse the string extracting fields
138 separated by whitespace and optionally enclosed within either single
139 or double quotes (which are stripped off), and build a vector of
140 pointers to copies of the string for each field.  The input string
141 remains unchanged.  The last element of the vector is followed by a
142 @code{NULL} element.
143 
144 All of the memory for the pointer array and copies of the string
145 is obtained from @code{xmalloc}.  All of the memory can be returned to the
146 system with the single function call @code{freeargv}, which takes the
returned result of @code{buildargv}, as its argument.
148 
149 Returns a pointer to the argument vector if successful.  Returns
150 @code{NULL} if @var{sp} is @code{NULL} or if there is insufficient
151 memory to complete building the argument vector.
152 
153 If the input is a null string (as opposed to a @code{NULL} pointer),
then @code{buildargv} returns an argument vector that has one arg, a null
155 string.
156 
157 @end deftypefn
158 
159 The memory for the argv array is dynamically expanded as necessary.
160 
161 In order to provide a working buffer for extracting arguments into,
162 with appropriate stripping of quotes and translation of backslash
163 sequences, we allocate a working buffer at least as long as the input
164 string.  This ensures that we always have enough space in which to
165 work, since the extracted arg is never larger than the input string.
166 
167 The argument vector is always kept terminated with a @code{NULL} arg
168 pointer, so it can be passed to @code{freeargv} at any time, or
169 returned, as appropriate.
170 
171 */
172 
buildargv(const char * input)173 char **buildargv (const char *input)
174 {
175   char *arg;
176   char *copybuf;
177   int squote = 0;
178   int dquote = 0;
179   int bsquote = 0;
180   int argc = 0;
181   int maxargc = 0;
182   char **argv = NULL;
183   char **nargv;
184 
185   if (input != NULL)
186     {
187       copybuf = (char *) xmalloc (strlen (input) + 1);
188       /* Is a do{}while to always execute the loop once.  Always return an
189 	 argv, even for null strings.  See NOTES above, test case below. */
190       do
191 	{
192 	  /* Pick off argv[argc] */
193 	  consume_whitespace (&input);
194 
195 	  if ((maxargc == 0) || (argc >= (maxargc - 1)))
196 	    {
197 	      /* argv needs initialization, or expansion */
198 	      if (argv == NULL)
199 		{
200 		  maxargc = INITIAL_MAXARGC;
201 		  nargv = (char **) xmalloc (maxargc * sizeof (char *));
202 		}
203 	      else
204 		{
205 		  maxargc *= 2;
206 		  nargv = (char **) xrealloc (argv, maxargc * sizeof (char *));
207 		}
208 	      argv = nargv;
209 	      argv[argc] = NULL;
210 	    }
211 	  /* Begin scanning arg */
212 	  arg = copybuf;
213 	  while (*input != EOS)
214 	    {
215 	      if (ISSPACE (*input) && !squote && !dquote && !bsquote)
216 		{
217 		  break;
218 		}
219 	      else
220 		{
221 		  if (bsquote)
222 		    {
223 		      bsquote = 0;
224 		      *arg++ = *input;
225 		    }
226 		  else if (*input == '\\')
227 		    {
228 		      bsquote = 1;
229 		    }
230 		  else if (squote)
231 		    {
232 		      if (*input == '\'')
233 			{
234 			  squote = 0;
235 			}
236 		      else
237 			{
238 			  *arg++ = *input;
239 			}
240 		    }
241 		  else if (dquote)
242 		    {
243 		      if (*input == '"')
244 			{
245 			  dquote = 0;
246 			}
247 		      else
248 			{
249 			  *arg++ = *input;
250 			}
251 		    }
252 		  else
253 		    {
254 		      if (*input == '\'')
255 			{
256 			  squote = 1;
257 			}
258 		      else if (*input == '"')
259 			{
260 			  dquote = 1;
261 			}
262 		      else
263 			{
264 			  *arg++ = *input;
265 			}
266 		    }
267 		  input++;
268 		}
269 	    }
270 	  *arg = EOS;
271 	  argv[argc] = xstrdup (copybuf);
272 	  argc++;
273 	  argv[argc] = NULL;
274 
275 	  consume_whitespace (&input);
276 	}
277       while (*input != EOS);
278 
279       free (copybuf);
280     }
281   return (argv);
282 }
283 
284 /*
285 
@deftypefn Extension int writeargv (char **@var{argv}, FILE *@var{file})
287 
288 Write each member of ARGV, handling all necessary quoting, to the file
289 named by FILE, separated by whitespace.  Return 0 on success, non-zero
290 if an error occurred while writing to FILE.
291 
292 @end deftypefn
293 
294 */
295 
296 int
writeargv(char ** argv,FILE * f)297 writeargv (char **argv, FILE *f)
298 {
299   int status = 0;
300 
301   if (f == NULL)
302     return 1;
303 
304   while (*argv != NULL)
305     {
306       const char *arg = *argv;
307 
308       while (*arg != EOS)
309         {
310           char c = *arg;
311 
312           if (ISSPACE(c) || c == '\\' || c == '\'' || c == '"')
313             if (EOF == fputc ('\\', f))
314               {
315                 status = 1;
316                 goto done;
317               }
318 
319           if (EOF == fputc (c, f))
320             {
321               status = 1;
322               goto done;
323             }
324           arg++;
325         }
326 
327       if (EOF == fputc ('\n', f))
328         {
329           status = 1;
330           goto done;
331         }
332       argv++;
333     }
334 
335  done:
336   return status;
337 }
338 
339 /*
340 
341 @deftypefn Extension void expandargv (int *@var{argcp}, char ***@var{argvp})
342 
The @var{argcp} and @var{argvp} arguments are pointers to the usual
344 @code{argc} and @code{argv} arguments to @code{main}.  This function
345 looks for arguments that begin with the character @samp{@@}.  Any such
346 arguments are interpreted as ``response files''.  The contents of the
347 response file are interpreted as additional command line options.  In
348 particular, the file is separated into whitespace-separated strings;
349 each such string is taken as a command-line option.  The new options
350 are inserted in place of the option naming the response file, and
351 @code{*argcp} and @code{*argvp} will be updated.  If the value of
352 @code{*argvp} is modified by this function, then the new value has
353 been dynamically allocated and can be deallocated by the caller with
354 @code{freeargv}.  However, most callers will simply call
355 @code{expandargv} near the beginning of @code{main} and allow the
356 operating system to free the memory when the program exits.
357 
358 @end deftypefn
359 
360 */
361 
/* Replace every "@file" argument in *ARGVP (argument 0 is skipped) by
   the options read from FILE, updating *ARGCP to match.  Arguments
   naming a file that cannot be opened or read are left untouched.
   *ARGVP is replaced by an allocated copy the first time an expansion
   actually takes place; that copy can be released with freeargv.  */

void
expandargv (int *argcp, char ***argvp)
{
  /* The argument we are currently processing.  */
  int i = 0;
  /* Non-zero once *ARGVP has been replaced by a dynamically allocated
     copy.  */
  int argv_dynamic = 0;
  /* Limit the number of response files that we parse in order
     to prevent infinite recursion.  */
  unsigned int iteration_limit = 2000;
  /* Loop over the arguments, handling response files.  We always skip
     ARGVP[0], as that is the name of the program being run.  */
  while (++i < *argcp)
    {
      /* The name of the response file.  */
      const char *filename;
      /* The response file.  */
      FILE *f;
      /* An upper bound on the number of characters in the response
         file.  */
      long pos;
      /* The number of characters in the response file, when actually
         read.  */
      size_t len;
      /* A dynamically allocated buffer used to hold options read from a
         response file.  */
      char *buffer;
      /* Dynamically allocated storage for the options read from the
         response file.  */
      char **file_argv;
      /* The number of options read from the response file, if any.  */
      size_t file_argc;
      /* We are only interested in options of the form "@file".  */
      filename = (*argvp)[i];
      if (filename[0] != '@')
        continue;
      /* If we have iterated too many times then stop.  */
      if (-- iteration_limit == 0)
        {
          fprintf (stderr, "%s: error: too many @-files encountered\n", (*argvp)[0]);
          xexit (1);
        }
      /* Read the contents of the file.  */
      f = fopen (++filename, "r");
      if (!f)
        continue;
      if (fseek (f, 0L, SEEK_END) == -1)
        goto error;
      pos = ftell (f);
      if (pos == -1)
        goto error;
      if (fseek (f, 0L, SEEK_SET) == -1)
        goto error;
      buffer = (char *) xmalloc (pos * sizeof (char) + 1);
      len = fread (buffer, sizeof (char), pos, f);
      if (len != (size_t) pos
          /* On Windows, fread may return a value smaller than POS,
             due to CR/LF->LF translation when reading text files.
             That does not in-and-of itself indicate failure.  */
          && ferror (f))
        {
          /* Do not leak the read buffer when giving up on this file.  */
          free (buffer);
          goto error;
        }
      /* Add a NUL terminator.  */
      buffer[len] = '\0';
      /* If the file is empty or contains only whitespace, buildargv would
         return a single empty argument.  In this context we want no arguments,
         instead.  */
      if (only_whitespace (buffer))
        {
          file_argv = (char **) xmalloc (sizeof (char *));
          file_argv[0] = NULL;
        }
      else
        /* Parse the string.  */
        file_argv = buildargv (buffer);
      /* If *ARGVP is not already dynamically allocated, copy it, and
         remember that we did so: copying again for a later response
         file would leak the previous copy.  */
      if (!argv_dynamic)
        {
          *argvp = dupargv (*argvp);
          argv_dynamic = 1;
        }
      /* Count the number of arguments.  */
      file_argc = 0;
      while (file_argv[file_argc])
        ++file_argc;
      /* The "@file" option is about to be overwritten.  Every string in
         *ARGVP is now an allocated copy (made by dupargv or buildargv),
         so release this one.  FILENAME is not used past this point.  */
      free ((*argvp)[i]);
      /* Now, insert FILE_ARGV into ARGV.  The "+1" below handles the
         NULL terminator at the end of ARGV.  */
      *argvp = ((char **)
                xrealloc (*argvp,
                          (*argcp + file_argc + 1) * sizeof (char *)));
      /* Shift the tail of ARGV, including its NULL terminator.  */
      memmove (*argvp + i + file_argc, *argvp + i + 1,
               (*argcp - i) * sizeof (char *));
      memcpy (*argvp + i, file_argv, file_argc * sizeof (char *));
      /* The original option has been replaced by all the new
         options.  The adjustment is computed as a signed value so that
         an empty response file simply removes one argument.  */
      *argcp += (int) file_argc - 1;
      /* Free up memory allocated to process the response file.  We do
         not use freeargv because the individual options in FILE_ARGV
         are now in the main ARGV.  */
      free (file_argv);
      free (buffer);
      /* Rescan all of the arguments just read to support response
         files that include other response files.  */
      --i;
    error:
      /* We're all done with the file now.  */
      fclose (f);
    }
}
467 
468 /*
469 
470 @deftypefn Extension int countargv (char **@var{argv})
471 
472 Return the number of elements in @var{argv}.
473 Returns zero if @var{argv} is NULL.
474 
475 @end deftypefn
476 
477 */
478 
/* Return how many entries precede the NULL terminator of ARGV, or zero
   when ARGV is NULL.  */

int
countargv (char **argv)
{
  char **end;

  if (argv == NULL)
    return 0;

  end = argv;
  while (*end != NULL)
    end++;

  return (int) (end - argv);
}
490 
491 #ifdef MAIN
492 
493 /* Simple little test driver. */
494 
/* Command lines fed to buildargv by the test driver.  The table is
   terminated by a NULL entry.  */
static const char *const tests[] = {
  /* Plain words separated by single blanks.  */
  "a simple command line",

  /* Quoted words.  */
  "arg 'foo' is single quoted",
  "arg \"bar\" is double quoted",

  /* Whitespace protected by quotes.  */
  "arg \"foo bar\" has embedded whitespace",

  /* Backslash-escaped quotes inside a single-quoted field.  */
  "arg 'Jack said \\'hi\\'' has single quotes",
  "arg 'Jack said \\\"hi\\\"' has double quotes",

  /* More arguments than the initial vector size.  */
  "a b c d e f g h i j k l m n o p q r s t u v w x y z 1 2 3 4 5 6 7 8 9",

  /* This should be expanded into only one argument.  */
  "trailing-whitespace ",

  /* The empty string.  */
  "",

  NULL
};
511 
512 int
main(void)513 main (void)
514 {
515   char **argv;
516   const char *const *test;
517   char **targs;
518 
519   for (test = tests; *test != NULL; test++)
520     {
521       printf ("buildargv(\"%s\")\n", *test);
522       if ((argv = buildargv (*test)) == NULL)
523 	{
524 	  printf ("failed!\n\n");
525 	}
526       else
527 	{
528 	  for (targs = argv; *targs != NULL; targs++)
529 	    {
530 	      printf ("\t\"%s\"\n", *targs);
531 	    }
532 	  printf ("\n");
533 	}
534       freeargv (argv);
535     }
536 
537   return 0;
538 }
539 
540 #endif	/* MAIN */
541