1 /* arrayfunc.c -- High-level array functions used by other parts of the shell. */
3 /* Copyright (C) 2001-2011 Free Software Foundation, Inc.
5 This file is part of GNU Bash, the Bourne Again SHell.
7 Bash is free software: you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation, either version 3 of the License, or
10 (at your option) any later version.
12 Bash is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with Bash. If not, see <http://www.gnu.org/licenses/>.
23 #if defined (ARRAY_VARS)
25 #if defined (HAVE_UNISTD_H)
37 #include "builtins/common.h"
/* Shell-wide state declared extern here; the definitions are not part of
   this listing.  Within this file, this_command_name is reset to NULL
   before subscripts are evaluated or elements are bound,
   last_command_exit_value is set when an assignment is rejected, and
   array_needs_making is incremented when an exported variable is
   converted to an associative array. */
39 extern char *this_command_name
;
40 extern int last_command_exit_value
;
41 extern int array_needs_making
;
/* Forward declarations for the static helpers implemented further down
   in this file.  __P wraps each parameter list (presumably so pre-ANSI
   compilers can drop it -- confirm against the project headers). */
43 static SHELL_VAR
*bind_array_var_internal
__P((SHELL_VAR
*, arrayind_t
, char *, char *, int));
44 static SHELL_VAR
*assign_array_element_internal
__P((SHELL_VAR
*, char *, char *, char *, int, char *, int));
46 static char *quote_assign
__P((const char *));
47 static void quote_array_assignment_chars
__P((WORD_LIST
*));
48 static char *array_value_internal
__P((char *, int, int, int *, arrayind_t
*));
50 /* Standard error message to use when encountering an invalid array subscript */
/* The string is wrapped in N_() here and passed through _() at the point
   where it is printed (see unbind_array_element). */
51 const char * const bash_badsub_errmsg
= N_("bad array subscript");
53 /* **************************************************************** */
55 /* Functions to manipulate array variables and perform assignments */
57 /* **************************************************************** */
59 /* Convert a shell variable to an indexed array variable. The original value is saved as array[0]. */
/* convert_var_to_array (VAR)
   VAR is the shell variable to convert in place to an indexed array.
   Steps visible in this listing:
     - fetch the current value cell and create a fresh array;
     - insert the old value at index 0;
     - FREE the old value cell and install the array with var_setarray
       (array_insert presumably stores its own copy of the string, since
       the old cell is released right afterwards -- TODO confirm);
     - clear the dynamic_value and assign_func hooks;
     - run INVALIDATE_EXPORTSTR on VAR;
     - set att_array and clear att_invisible.
   NOTE(review): the embedded line numbers skip 70, 81-82 and everything
   after 85, so any guard on the insert, any export bookkeeping and the
   return statement are not shown here. */
62 convert_var_to_array (var
)
68 oldval
= value_cell (var
);
69 array
= array_create ();
71 array_insert (array
, 0, oldval
);
73 FREE (value_cell (var
));
74 var_setarray (var
, array
);
76 /* these aren't valid anymore */
77 var
->dynamic_value
= (sh_var_value_func_t
*)NULL
;
78 var
->assign_func
= (sh_var_assign_func_t
*)NULL
;
80 INVALIDATE_EXPORTSTR (var
);
84 VSETATTR (var
, att_array
);
85 VUNSETATTR (var
, att_invisible
);
90 /* Convert a shell variable to an associative array variable. The original value is saved under the key "0". */
/* convert_var_to_assoc (VAR)
   VAR is the shell variable to convert in place to an associative array.
   Steps visible in this listing:
     - fetch the current value cell and create a hash with assoc_create (0);
     - insert the old value under a freshly allocated copy of the key
       string 0 (savestring);
     - FREE the old value cell and install the hash with var_setassoc
       (assoc_insert presumably stores its own copy of the value, since
       the old cell is released right afterwards -- TODO confirm);
     - clear the dynamic_value and assign_func hooks;
     - run INVALIDATE_EXPORTSTR on VAR and, if VAR is exported, increment
       array_needs_making;
     - set att_assoc and clear att_invisible.
   NOTE(review): line 101 and everything after 116 are missing from this
   listing, so any guard on the insert and the return statement are not
   shown here. */
93 convert_var_to_assoc (var
)
99 oldval
= value_cell (var
);
100 hash
= assoc_create (0);
102 assoc_insert (hash
, savestring ("0"), oldval
);
104 FREE (value_cell (var
));
105 var_setassoc (var
, hash
);
107 /* these aren't valid anymore */
108 var
->dynamic_value
= (sh_var_value_func_t
*)NULL
;
109 var
->assign_func
= (sh_var_assign_func_t
*)NULL
;
111 INVALIDATE_EXPORTSTR (var
);
112 if (exported_p (var
))
113 array_needs_making
++;
115 VSETATTR (var
, att_assoc
);
116 VUNSETATTR (var
, att_invisible
);
/* make_array_variable_value (ENTRY, IND, KEY, VALUE, FLAGS)
   Build the string that will be stored for one element of ENTRY.
   KEY is used on the associative path (assoc_reference) and IND on the
   indexed path (array_reference).

   When FLAGS has ASS_APPEND, a temporary SHELL_VAR is allocated and
   filled in with a copy of ENTRY->name, either a copy of the current
   element value or a one-byte empty string, a zero exportstr, and
   ENTRY->attributes with att_array, att_assoc and att_exported masked
   off.  make_variable_value is run on that temporary, which is then
   released with dispose_variable.  The other make_variable_value call
   operates on ENTRY directly (presumably the non-append branch; its
   else is not shown).

   NOTE(review): the tests that choose between KEY and IND, and between
   the copied value and the empty string, sit on lines missing from this
   listing (presumably assoc_p (ENTRY) and a null check on the old
   value), as does the statement returning the new value. */
122 make_array_variable_value (entry
, ind
, key
, value
, flags
)
132 /* If we're appending, we need the old value of the array reference, so
133 fake out make_variable_value with a dummy SHELL_VAR */
134 if (flags
& ASS_APPEND
)
136 dentry
= (SHELL_VAR
*)xmalloc (sizeof (SHELL_VAR
));
137 dentry
->name
= savestring (entry
->name
);
139 newval
= assoc_reference (assoc_cell (entry
), key
);
141 newval
= array_reference (array_cell (entry
), ind
);
143 dentry
->value
= savestring (newval
);
146 dentry
->value
= (char *)xmalloc (1);
147 dentry
->value
[0] = '\0';
149 dentry
->exportstr
= 0;
150 dentry
->attributes
= entry
->attributes
& ~(att_array
|att_assoc
|att_exported
);
151 /* Leave the rest of the members uninitialized; the code doesn't look
153 newval
= make_variable_value (dentry
, value
, flags
);
154 dispose_variable (dentry
);
157 newval
= make_variable_value (entry
, value
, flags
);
/* bind_array_var_internal (ENTRY, IND, KEY, VALUE, FLAGS)
   Store VALUE into one element of ENTRY.  The string actually stored
   comes from make_array_variable_value.  Dispatch, in order:
     - if ENTRY->assign_func is set, it is called with
       (ENTRY, newval, IND, KEY);
     - else if ENTRY is associative, assoc_insert stores newval under KEY;
     - the remaining call is array_insert at IND (its else keyword is on
       a line not shown in this listing).
   In this file bind_array_variable and bind_array_element pass KEY as 0,
   and bind_assoc_variable passes IND as 0.
   NOTE(review): the return statement is not visible here. */
163 bind_array_var_internal (entry
, ind
, key
, value
, flags
)
172 newval
= make_array_variable_value (entry
, ind
, key
, value
, flags
);
174 if (entry
->assign_func
)
175 (*entry
->assign_func
) (entry
, newval
, ind
, key
);
176 else if (assoc_p (entry
))
177 assoc_insert (assoc_cell (entry
), key
, newval
);
179 array_insert (array_cell (entry
), ind
, newval
);
185 /* Perform an array assignment name[ind]=value. If NAME already exists and
186 is not an array, it is first converted into an array with the existing
187 value as name[0], whatever IND is; the assignment is then made to
188 name[ind].
190 If NAME does not exist, just create an array variable, no matter what
191 IND's value may be. */
/* bind_array_variable (NAME, IND, VALUE, FLAGS)
   Look NAME up with find_shell_variable, then:
     - no such variable: create one with make_new_array_variable;
     - readonly or noassign variable: handled on lines missing from this
       listing (only the nested readonly_p test is visible);
     - variable exists but is not an indexed array: convert_var_to_array.
   The assignment itself is delegated to bind_array_var_internal with a
   null key, and that result is returned. */
193 bind_array_variable (name
, ind
, value
, flags
)
201 entry
= find_shell_variable (name
);
203 if (entry
== (SHELL_VAR
*) 0)
204 entry
= make_new_array_variable (name
);
205 else if (readonly_p (entry
) || noassign_p (entry
))
207 if (readonly_p (entry
))
211 else if (array_p (entry
) == 0)
212 entry
= convert_var_to_array (entry
);
214 /* ENTRY is an array variable, and ARRAY points to the value. */
215 return (bind_array_var_internal (entry
, ind
, 0, value
, flags
));
/* bind_array_element (ENTRY, IND, VALUE, FLAGS)
   Assign VALUE to index IND of ENTRY, a variable supplied by the caller.
   No lookup or attribute check is visible here: the call is forwarded to
   bind_array_var_internal with a null key and its result is returned. */
219 bind_array_element (entry
, ind
, value
, flags
)
225 return (bind_array_var_internal (entry
, ind
, 0, value
, flags
));
/* bind_assoc_variable (ENTRY, NAME, KEY, VALUE, FLAGS)
   Assign VALUE under KEY in ENTRY.  Readonly and noassign variables are
   tested first; what is done for them sits on lines missing from this
   listing.  Otherwise the call is forwarded to bind_array_var_internal
   with index 0 and its result is returned.
   NAME is not referenced on any visible line (presumably it feeds the
   readonly error message -- confirm). */
229 bind_assoc_variable (entry
, name
, key
, value
, flags
)
239 if (readonly_p (entry
) || noassign_p (entry
))
241 if (readonly_p (entry
))
246 return (bind_array_var_internal (entry
, 0, key
, value
, flags
));
249 /* Parse NAME, a lhs of an assignment statement of the form v[s], and
250 assign VALUE to that array element by calling assign_array_element_internal(), which binds it with bind_assoc_variable() or bind_array_variable(). */
/* assign_array_element (NAME, VALUE, FLAGS)
   NAME is the full left-hand side, of the form v[s].
   array_variable_name splits it into the variable name (vname) and the
   subscript (sub, sublen).  Two early returns of NULL are visible:
     - one whose condition is not shown (presumably vname == 0);
     - one after err_badarraysub (NAME), taken when the subscript is a
       lone * or @ immediately followed by the closing bracket, or when
       sublen <= 1.
   Otherwise the variable is looked up with find_variable and the work
   is handed to assign_array_element_internal.
   NOTE(review): cleanup of vname and the final return are on lines
   missing from this listing. */
252 assign_array_element (name
, value
, flags
)
260 vname
= array_variable_name (name
, &sub
, &sublen
);
263 return ((SHELL_VAR
*)NULL
);
265 if ((ALL_ELEMENT_SUB (sub
[0]) && sub
[1] == ']') || (sublen
<= 1))
268 err_badarraysub (name
);
269 return ((SHELL_VAR
*)NULL
);
272 entry
= find_variable (vname
);
273 entry
= assign_array_element_internal (entry
, name
, vname
, sub
, sublen
, value
, flags
);
/* assign_array_element_internal (ENTRY, NAME, VNAME, SUB, SUBLEN, VALUE, FLAGS)
   ENTRY may be null (it is tested before use).  NAME is only used for
   error messages; VNAME is the variable name without the subscript.

   Associative ENTRY: the byte at SUB[SUBLEN-1] is overwritten with NUL
   (so SUB is modified in place), SUB is expanded into a key with
   expand_assignment_string_to_string, and a null or empty key is
   reported with err_badarraysub and yields NULL.  Otherwise
   bind_assoc_variable performs the assignment.

   Remaining path: SUB is evaluated with array_expand_index.  A failure
   test on a line not shown leads to err_badarraysub and NULL; otherwise
   bind_array_variable (VNAME, ind, ...) performs the assignment.

   NOTE(review): several lines are missing from this listing, so it
   cannot be seen here whether SUB is restored, whether the key is freed,
   or what is finally returned. */
280 assign_array_element_internal (entry
, name
, vname
, sub
, sublen
, value
, flags
)
282 char *name
; /* only used for error messages */
292 if (entry
&& assoc_p (entry
))
294 sub
[sublen
-1] = '\0';
295 akey
= expand_assignment_string_to_string (sub
, 0); /* [ */
297 if (akey
== 0 || *akey
== 0)
299 err_badarraysub (name
);
301 return ((SHELL_VAR
*)NULL
);
303 entry
= bind_assoc_variable (entry
, vname
, akey
, value
, flags
);
307 ind
= array_expand_index (entry
, sub
, sublen
);
310 err_badarraysub (name
);
311 return ((SHELL_VAR
*)NULL
);
313 entry
= bind_array_variable (vname
, ind
, value
, flags
);
319 /* Find the array variable corresponding to NAME. If there is no variable,
320 create a new array variable. If the variable exists but is not an array,
321 convert it to an indexed array. If FLAGS&1 is non-zero, an existing
322 variable is checked for the readonly or noassign attribute in preparation
323 for assignment (e.g., by the `read' builtin). If FLAGS&2 is non-zero, we
324 create an associative array. */
/* find_or_make_array_variable (NAME, FLAGS)
   FLAGS & 1: reject readonly or noassign variables (NULL is returned).
   FLAGS & 2: an associative array is wanted.
   Flow visible in this listing:
     - find_variable (NAME);
     - a second lookup with find_variable_last_nameref; if it yields a
       nameref, the new array (associative or indexed, per FLAGS & 2) is
       created under the name held in nameref_cell;
     - a new array is created under NAME itself;
     - with FLAGS & 1, a readonly or noassign variable returns NULL;
     - with FLAGS & 2, an existing indexed array sets
       last_command_exit_value to 1, reports an error and returns NULL;
     - a variable that is neither indexed nor associative is converted
       with convert_var_to_array.
   NOTE(review): the conditions guarding the nameref lookup and the two
   creation steps (presumably var == 0) and the final return are on
   lines missing from this listing. */
326 find_or_make_array_variable (name
, flags
)
332 var
= find_variable (name
);
335 /* See if we have a nameref pointing to a variable that hasn't been
337 var
= find_variable_last_nameref (name
);
338 if (var
&& nameref_p (var
))
339 var
= (flags
& 2) ? make_new_assoc_variable (nameref_cell (var
)) : make_new_array_variable (nameref_cell (var
));
343 var
= (flags
& 2) ? make_new_assoc_variable (name
) : make_new_array_variable (name
);
344 else if ((flags
& 1) && (readonly_p (var
) || noassign_p (var
)))
346 if (readonly_p (var
))
348 return ((SHELL_VAR
*)NULL
);
350 else if ((flags
& 2) && array_p (var
))
352 last_command_exit_value
= 1;
353 report_error (_("%s: cannot convert indexed to associative array"), name
);
354 return ((SHELL_VAR
*)NULL
);
356 else if (array_p (var
) == 0 && assoc_p (var
) == 0)
357 var
= convert_var_to_array (var
);
362 /* Perform a compound assignment statement for array NAME, where VALUE is
363 the text between the parens: NAME=( VALUE ) */
/* assign_array_from_string (NAME, VALUE, FLAGS)
   Find or create NAME through find_or_make_array_variable, passing
   vflags.  vflags is adjusted when FLAGS has ASS_MKASSOC; the adjustment
   itself is not shown (presumably it requests an associative array --
   confirm).  One NULL return is visible (presumably taken when the
   lookup fails); otherwise the result of
   assign_array_var_from_string (var, VALUE, FLAGS) is returned. */
365 assign_array_from_string (name
, value
, flags
)
373 if (flags
& ASS_MKASSOC
)
376 var
= find_or_make_array_variable (name
, vflags
);
378 return ((SHELL_VAR
*)NULL
);
380 return (assign_array_var_from_string (var
, value
, flags
));
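383 /* Sequentially assign the indices of indexed array variable VAR from the words in LIST, starting at 0, or just past the current maximum index when FLAGS includes ASS_APPEND. */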
/* assign_array_var_from_word_list (VAR, LIST, FLAGS)
   Walk LIST and store each word string at consecutive indices of the
   array held in VAR.  The first index is one past array_max_index when
   FLAGS has ASS_APPEND, and 0 otherwise.  For each word,
   VAR->assign_func is called if it is set; the array_insert call is the
   alternative (its else keyword is on a line not shown here).
   NOTE(review): the return statement is not visible in this listing. */
386 assign_array_var_from_word_list (var
, list
, flags
)
391 register arrayind_t i
;
392 register WORD_LIST
*l
;
395 a
= array_cell (var
);
396 i
= (flags
& ASS_APPEND
) ? array_max_index (a
) + 1 : 0;
398 for (l
= list
; l
; l
= l
->next
, i
++)
399 if (var
->assign_func
)
400 (*var
->assign_func
) (var
, l
->word
->word
, i
, 0);
402 array_insert (a
, i
, l
->word
->word
);
/* expand_compound_array_assignment (VAR, VALUE, FLAGS)
   Turn the text of a compound assignment into an expanded WORD_LIST.
   Steps visible in this listing:
     - if VALUE starts with an open parenthesis,
       extract_array_assignment_list produces the inner text; a NULL
       return follows, on a condition that is not shown;
     - parse_string_to_word_list splits the text into words;
     - there is a test for an associative VAR whose body is not shown;
     - quote_array_assignment_chars protects subscript characters from
       filename expansion;
     - expand_words_no_vars expands the words (skipped for a null list),
       and the unexpanded list is disposed of.
   FLAGS is not referenced on any visible line.
   NOTE(review): the return of the expanded list and any freeing of the
   extracted text are on lines missing from this listing. */
407 expand_compound_array_assignment (var
, value
, flags
)
412 WORD_LIST
*list
, *nlist
;
413 WORD_LIST
*hd
, *tl
, *t
, *n
;
417 /* This condition is true when invoked from the declare builtin with a
419 declare -a d='([1]="" [2]="bdef" [5]="hello world" "test")' */
420 if (*value
== '(') /*)*/
423 val
= extract_array_assignment_list (value
, &ni
);
425 return (WORD_LIST
*)NULL
;
430 /* Expand the value string into a list of words, performing all the
431 shell expansions including pathname generation and word splitting. */
432 /* First we split the string on whitespace, using the shell parser
433 (ksh93 seems to do this). */
434 list
= parse_string_to_word_list (val
, 1, "array assign");
436 if (var
&& assoc_p (var
))
443 /* If we're using [subscript]=value, we need to quote each [ and ] to
444 prevent unwanted filename expansion. This doesn't need to be done
445 for associative array expansion, since that uses a different expansion
446 function (see assign_compound_array_list below). */
448 quote_array_assignment_chars (list
);
450 /* Now that we've split it, perform the shell expansions on each
452 nlist
= list
? expand_words_no_vars (list
) : (WORD_LIST
*)NULL
;
454 dispose_words (list
);
462 /* Callers ensure that VAR is not NULL */
/* assign_compound_array_list (VAR, NLIST, FLAGS)
   Assign each word of NLIST to an element of VAR.  The local a is the
   array cell when VAR is an indexed array and h is the hash when VAR is
   associative; the other one is null.

   Behaviour visible in this listing:
     - without ASS_APPEND the existing contents are dealt with first, per
       type (the calls themselves are on missing lines);
     - last_ind starts one past array_max_index when appending to an
       indexed array, and at 0 otherwise;
     - a word flagged W_ASSIGNMENT that begins with an open bracket is
       treated as [subscript]=value: skipsubscript locates the closing
       bracket, and either = or += must follow it.  When that shape test
       fails, the whole word is turned into a value with
       make_variable_value and stored at last_ind;
     - a subscript of * or @ alone (len == 2) sets
       last_command_exit_value to 1 and reports one of two errors;
     - array_expand_index evaluates the subscript for the indexed case;
       for an associative VAR the key is expanded with
       expand_assignment_string_to_string and tested for null or empty;
     - += after the subscript adds ASS_APPEND to the per-word flags;
     - a word without a subscript is an error for an associative VAR;
     - the value is expanded with expand_assignment_string_to_string,
       this_command_name is cleared, and bind_array_var_internal stores
       the element.

   NOTE(review): many lines are absent from this listing (the discard
   calls, continue statements, frees, updates of last_ind, and the exact
   guards on several of the steps above), so the list describes the
   visible statements only. */
464 assign_compound_array_list (var
, nlist
, flags
)
472 char *w
, *val
, *nval
;
473 int len
, iflags
, free_val
;
474 arrayind_t ind
, last_ind
;
477 a
= (var
&& array_p (var
)) ? array_cell (var
) : (ARRAY
*)0;
478 h
= (var
&& assoc_p (var
)) ? assoc_cell (var
) : (HASH_TABLE
*)0;
483 /* Now that we are ready to assign values to the array, kill the existing
485 if ((flags
& ASS_APPEND
) == 0)
487 if (a
&& array_p (var
))
489 else if (h
&& assoc_p (var
))
493 last_ind
= (a
&& (flags
& ASS_APPEND
)) ? array_max_index (a
) + 1 : 0;
495 for (list
= nlist
; list
; list
= list
->next
)
498 w
= list
->word
->word
;
500 /* We have a word of the form [ind]=value */
501 if ((list
->word
->flags
& W_ASSIGNMENT
) && w
[0] == '[')
503 /* Don't have to handle embedded quotes specially any more, since
504 associative array subscripts have not been expanded yet (see
506 len
= skipsubscript (w
, 0, 0);
508 /* XXX - changes for `+=' */
509 if (w
[len
] != ']' || (w
[len
+1] != '=' && (w
[len
+1] != '+' || w
[len
+2] != '=')))
516 nval
= make_variable_value (var
, w
, flags
);
517 if (var
->assign_func
)
518 (*var
->assign_func
) (var
, nval
, last_ind
, 0);
520 array_insert (a
, last_ind
, nval
);
532 if (ALL_ELEMENT_SUB (w
[1]) && len
== 2)
534 last_command_exit_value
= 1;
536 report_error (_("%s: invalid associative array key"), w
);
538 report_error (_("%s: cannot assign to non-numeric index"), w
);
544 ind
= array_expand_index (var
, w
+ 1, len
);
553 else if (assoc_p (var
))
555 /* This is not performed above, see expand_compound_array_assignment */
557 akey
= expand_assignment_string_to_string (w
+1, 0);
559 /* And we need to expand the value also, see below */
560 if (akey
== 0 || *akey
== 0)
568 /* XXX - changes for `+=' -- just accept the syntax. ksh93 doesn't do this */
569 if (w
[len
+ 1] == '+' && w
[len
+ 2] == '=')
571 iflags
|= ASS_APPEND
;
577 else if (assoc_p (var
))
579 last_command_exit_value
= 1;
580 report_error (_("%s: %s: must use subscript when assigning associative array"), var
->name
, w
);
583 else /* No [ind]=value, just a stray `=' */
590 /* See above; we need to expand the value here */
593 val
= expand_assignment_string_to_string (val
, 0);
598 this_command_name
= (char *)NULL
; /* no command name for errors */
599 bind_array_var_internal (var
, ind
, akey
, val
, iflags
);
607 /* Perform a compound array assignment: VAR->name=( VALUE ). The
608 VALUE has already had the parentheses stripped. */
/* assign_array_var_from_string (VAR, VALUE, FLAGS)
   Expand VALUE into a word list with expand_compound_array_assignment,
   assign those words to VAR with assign_compound_array_list, then
   release the word list with dispose_words.
   NOTE(review): any guards on VALUE or on the list, and the return
   statement, are on lines missing from this listing. */
610 assign_array_var_from_string (var
, value
, flags
)
620 nlist
= expand_compound_array_assignment (var
, value
, flags
);
621 assign_compound_array_list (var
, nlist
, flags
);
624 dispose_words (nlist
);
628 /* Quote globbing chars and characters in $IFS before the `=' in an assignment
629 statement (usually a compound array assignment) to protect them from
630 unwanted filename expansion or word splitting. */
/* quote_assign (STRING)
   Build a quoted copy of STRING in a new buffer of
   2 * strlen (STRING) + 1 bytes, i.e. room for one extra byte per input
   byte plus the terminator.
   Visible per-character logic, applied only while saw_eq is 0:
     - an open bracket is taken as the start of a subscript, which is
       measured with skipsubscript and extracted with substring;
     - glob characters and IFS characters are singled out (the statement
       that emits the quoting character is on a missing line);
   characters are copied to the output with COPY_CHAR_P.
   NOTE(review): the handling of =, the use made of the extracted
   subscript, the terminator and the return statement are not visible in
   this listing. */
632 quote_assign (string
)
637 char *temp
, *t
, *subs
;
638 const char *s
, *send
;
642 slen
= strlen (string
);
643 send
= string
+ slen
;
645 t
= temp
= (char *)xmalloc (slen
* 2 + 1);
647 for (s
= string
; *s
; )
651 if (saw_eq
== 0 && *s
== '[') /* looks like a subscript */
654 se
= skipsubscript (string
, ss
, 0);
655 subs
= substring (s
, ss
, se
);
665 if (saw_eq
== 0 && (glob_char_p (s
) || isifs (*s
)))
668 COPY_CHAR_P (t
, s
, send
);
674 /* For each word in a compound array assignment, if the word looks like
675 [ind]=value, quote globbing chars and characters in $IFS before the `='. */
/* quote_array_assignment_chars (LIST)
   Walk LIST and, for each word:
     - skip it when the word, or its string, is null or empty;
     - test whether it starts with an open bracket and contains an =
       (what is done when it does not is on a missing line; per the
       comment below such words are left alone);
     - replace the word string with the result of quote_assign, freeing
       the old string. */
677 quote_array_assignment_chars (list
)
683 for (l
= list
; l
; l
= l
->next
)
685 if (l
->word
== 0 || l
->word
->word
== 0 || l
->word
->word
[0] == '\0')
686 continue; /* should not happen, but just in case... */
687 /* Don't bother if it doesn't look like [ind]=value */
688 if (l
->word
->word
[0] != '[' || mbschr (l
->word
->word
, '=') == 0) /* ] */
690 nword
= quote_assign (l
->word
->word
);
691 free (l
->word
->word
);
692 l
->word
->word
= nword
;
696 /* skipsubscript moved to subst.c to use private functions. 2009/02/24. */
698 /* This function is called with SUB pointing to just after the beginning
699 `[' of an array subscript and removes the array element to which SUB
700 expands from array VAR. A subscript of `*' or `@' unsets the array. */
/* unbind_array_element (VAR, SUB)
   SUB points just past the opening bracket of the subscript.
   Flow visible in this listing:
     - skipsubscript finds the closing bracket; a missing bracket or an
       empty subscript (len == 0) is reported with builtin_error;
     - a subscript that is exactly * or @ (SUB[1] == 0, so the closing
       bracket has presumably been overwritten with NUL on a missing
       line) removes the whole variable with unbind_variable;
     - on one path the subscript is expanded into a key; a null or empty
       key is reported, otherwise assoc_remove deletes the entry
       (presumably the associative case; its guard is not shown);
     - on the other path array_expand_index evaluates the subscript (an
       error path reports a bad subscript), then array_remove takes the
       element out and array_dispose_element releases it.
   NOTE(review): return values, the type tests and any null check on the
   removed element are on lines missing from this listing. */
702 unbind_array_element (var
, sub
)
711 len
= skipsubscript (sub
, 0, 0);
712 if (sub
[len
] != ']' || len
== 0)
714 builtin_error ("%s[%s: %s", var
->name
, sub
, _(bash_badsub_errmsg
));
719 if (ALL_ELEMENT_SUB (sub
[0]) && sub
[1] == 0)
721 unbind_variable (var
->name
);
727 akey
= expand_assignment_string_to_string (sub
, 0); /* [ */
728 if (akey
== 0 || *akey
== 0)
730 builtin_error ("[%s]: %s", sub
, _(bash_badsub_errmsg
));
734 assoc_remove (assoc_cell (var
), akey
);
739 ind
= array_expand_index (var
, sub
, len
+1);
742 builtin_error ("[%s]: %s", sub
, _(bash_badsub_errmsg
));
745 ae
= array_remove (array_cell (var
), ind
);
747 array_dispose_element (ae
);
753 /* Format and output an array assignment in compound form VAR=(VALUES),
754 suitable for re-use as input. */
/* print_array_assignment (VAR, QUOTED)
   Write one line of the form NAME=VALUE to standard output with printf.
   VALUE is the string returned by array_to_assign for the array in VAR.
   The other printf emits an empty pair of parentheses, wrapped in single
   quotes when QUOTED is nonzero.
   NOTE(review): the test choosing between the two printf calls
   (presumably a null vstr) and the release of vstr are on lines missing
   from this listing. */
756 print_array_assignment (var
, quoted
)
762 vstr
= array_to_assign (array_cell (var
), quoted
);
765 printf ("%s=%s\n", var
->name
, quoted
? "'()'" : "()");
768 printf ("%s=%s\n", var
->name
, vstr
);
773 /* Format and output an associative array assignment in compound form
774 VAR=(VALUES), suitable for re-use as input. */
/* print_assoc_assignment (VAR, QUOTED)
   Write one line of the form NAME=VALUE to standard output with printf.
   VALUE is the string returned by assoc_to_assign for the hash in VAR.
   The other printf emits an empty pair of parentheses, wrapped in single
   quotes when QUOTED is nonzero.
   NOTE(review): the test choosing between the two printf calls
   (presumably a null vstr) and the release of vstr are on lines missing
   from this listing. */
776 print_assoc_assignment (var
, quoted
)
782 vstr
= assoc_to_assign (assoc_cell (var
), quoted
);
785 printf ("%s=%s\n", var
->name
, quoted
? "'()'" : "()");
788 printf ("%s=%s\n", var
->name
, vstr
);
793 /***********************************************************************/
795 /* Utility functions to manage arrays and their contents for expansion */
797 /***********************************************************************/
799 /* Return 1 if NAME is a properly-formed array reference v[sub]. */
/* valid_array_reference (NAME)
   Checks visible in this listing:
     - mbschr locates the first open bracket in NAME;
     - legal_identifier is applied to NAME (presumably while NAME is
       temporarily cut at the bracket; that step is not shown);
     - skipsubscript measures the subscript starting at the bracket; a
       missing closing bracket or len == 1 (nothing between the brackets)
       fails the check;
     - the characters between the brackets are scanned for one that is
       not whitespace.
   NOTE(review): every return statement is on a line missing from this
   listing, so the exact results of each test cannot be stated here. */
801 valid_array_reference (name
)
807 t
= mbschr (name
, '['); /* ] */
811 r
= legal_identifier (name
);
815 /* Check for a properly-terminated non-blank subscript. */
816 len
= skipsubscript (t
, 0, 0);
817 if (t
[len
] != ']' || len
== 1)
819 for (r
= 1; r
< len
; r
++)
820 if (whitespace (t
[r
]) == 0)
827 /* Expand the array index beginning at S and extending LEN characters. */
/* array_expand_index (VAR, S, LEN)
   Evaluate a subscript as an arithmetic expression.
   Steps visible in this listing:
     - LEN bytes are allocated and LEN - 1 bytes of S are copied in with
       strncpy.  strncpy does not terminate the copy when S has at least
       LEN - 1 characters, so the terminator is presumably stored on
       line 840, which is missing here -- confirm;
     - expand_arith_string expands the copy;
     - this_command_name is cleared and evalexp computes the value,
       reporting success through expok;
     - the failure path sets last_command_exit_value to
       EXECUTION_FAILURE, calls top_level_cleanup and then
       jump_to_top_level (DISCARD).
   VAR is not referenced on any visible line.
   NOTE(review): the expok test, the frees and the return of the value
   are on lines missing from this listing. */
829 array_expand_index (var
, s
, len
)
838 exp
= (char *)xmalloc (len
);
839 strncpy (exp
, s
, len
- 1);
841 t
= expand_arith_string (exp
, 0);
842 this_command_name
= (char *)NULL
;
843 val
= evalexp (t
, &expok
);
848 last_command_exit_value
= EXECUTION_FAILURE
;
850 top_level_cleanup ();
851 jump_to_top_level (DISCARD
);
856 /* Return the name of the variable specified by S without any subscript.
857 If SUBP is non-null, return a pointer to the start of the subscript
858 in *SUBP. If LENP is non-null, the length of the subscript is returned
859 in *LENP. This returns newly-allocated memory. */
/* array_variable_name (S, SUBP, LENP)
   Visible in this listing:
     - a first NULL return whose condition is not shown (presumably no
       open bracket was found in S);
     - skipsubscript (S, ind, 0) gives ni, the position where the
       subscript ends; NULL is returned when ni <= ind + 1 (nothing
       inside the brackets) or when S[ni] is not a closing bracket;
     - the result starts as a copy of S made with savestring.
   NOTE(review): how ind is computed, the stores through SUBP and LENP,
   the trimming of the copy and the final return are on lines missing
   from this listing. */
861 array_variable_name (s
, subp
, lenp
)
875 return ((char *)NULL
);
878 ni
= skipsubscript (s
, ind
, 0);
879 if (ni
<= ind
+ 1 || s
[ni
] != ']')
886 return ((char *)NULL
);
890 ret
= savestring (s
);
901 /* Return the variable specified by S without any subscript. If SUBP is
902 non-null, return a pointer to the start of the subscript in *SUBP.
903 If LENP is non-null, the length of the subscript is returned in *LENP. */
/* array_variable_part (S, SUBP, LENP)
   Resolve the variable named in the array reference S.
   array_variable_name extracts the name and fills in SUBP and LENP; a
   NULL return follows (presumably when no name could be extracted; the
   test is not shown).  The name is then looked up with find_variable.
   The result is null when the variable does not exist or is invisible,
   and the variable otherwise.
   NOTE(review): the release of the extracted name is presumably on one
   of the missing lines 916-917 -- confirm. */
905 array_variable_part (s
, subp
, lenp
)
912 t
= array_variable_name (s
, subp
, lenp
);
914 return ((SHELL_VAR
*)NULL
);
915 var
= find_variable (t
);
918 return (var
== 0 || invisible_p (var
)) ? (SHELL_VAR
*)0 : var
;
/* INDEX_ERROR: error exit used inside a function that has var, s and t
   in scope and returns char *.  The visible lines report a bad subscript
   with err_badarraysub, naming either var->name or s, put the open
   bracket back at t[-1], and return NULL from the enclosing function.
   NOTE(review): the lines that choose between the two err_badarraysub
   calls and that open and close the macro body are missing from this
   listing. */
921 #define INDEX_ERROR() \
925 err_badarraysub (var->name); \
929 err_badarraysub (s); \
930 t[-1] = '['; /* ] */\
932 return ((char *)NULL); \
936 /* Return a string containing the elements in the array and subscript
937 described by S. If the subscript is * or @, obeys quoting rules akin
938 to the expansion of $* and $@ including double quoting. If RTYPE
939 is non-null it gets 1 if the array reference is name[*], 2 if the
940 reference is name[@], and 0 otherwise. */
/* array_value_internal (S, QUOTED, FLAGS, RTYPE, INDP)
   S is an array reference; array_variable_part yields the variable
   (possibly null), the subscript text t and its length len.

   Subscript * or @ followed by the closing bracket:
     - *RTYPE is set to 1 for * and 2 for @ (presumably only when RTYPE
       is non-null; the guard is not shown);
     - without AV_ALLOWALL in FLAGS the function returns NULL;
     - a null variable or a null value cell returns NULL;
     - a variable that is neither indexed nor associative contributes a
       one-word list holding its value; otherwise the list comes from
       assoc_to_word_list or array_to_word_list, and a null list returns
       NULL;
     - for * with QUOTED containing Q_HERE_DOCUMENT or Q_DOUBLE_QUOTES
       the words are joined with string_list_dollar_star and passed
       through quote_string; otherwise string_list_dollar_at is used.

   Any other subscript:
     - when the variable is null, indexed, or not associative, the index
       comes from array_expand_index unless FLAGS has AV_USEIND and INDP
       is non-null; for indexed arrays an index is rebased by adding
       array_max_index + 1 (per the comment, for negative subscripts;
       the sign test is not shown);
     - for an associative variable the key is expanded with
       expand_assignment_string_to_string and tested for null or empty;
     - a null variable or a null value cell returns NULL;
     - a plain variable returns its value cell for index 0 and NULL for
       any other index;
     - otherwise the element comes from assoc_reference or
       array_reference.

   NOTE(review): error reporting, stores through INDP, frees and the
   final return are on lines missing from this listing. */
942 array_value_internal (s
, quoted
, flags
, rtype
, indp
)
944 int quoted
, flags
, *rtype
;
950 char *retval
, *t
, *temp
;
954 var
= array_variable_part (s
, &t
, &len
);
956 /* Expand the index, even if the variable doesn't exist, in case side
957 effects are needed, like ${w[i++]} where w is unset. */
964 return ((char *)NULL
); /* error message already printed */
968 if (ALL_ELEMENT_SUB (t
[0]) && t
[1] == ']')
971 *rtype
= (t
[0] == '*') ? 1 : 2;
972 if ((flags
& AV_ALLOWALL
) == 0)
975 return ((char *)NULL
);
977 else if (var
== 0 || value_cell (var
) == 0) /* XXX - check for invisible_p(var) ? */
978 return ((char *)NULL
);
979 else if (array_p (var
) == 0 && assoc_p (var
) == 0)
980 l
= add_string_to_list (value_cell (var
), (WORD_LIST
*)NULL
);
981 else if (assoc_p (var
))
983 l
= assoc_to_word_list (assoc_cell (var
));
984 if (l
== (WORD_LIST
*)NULL
)
985 return ((char *)NULL
);
989 l
= array_to_word_list (array_cell (var
));
990 if (l
== (WORD_LIST
*)NULL
)
991 return ((char *) NULL
);
994 if (t
[0] == '*' && (quoted
& (Q_HERE_DOCUMENT
|Q_DOUBLE_QUOTES
)))
996 temp
= string_list_dollar_star (l
);
997 retval
= quote_string (temp
); /* XXX - leak here */
1000 else /* ${name[@]} or unquoted ${name[*]} */
1001 retval
= string_list_dollar_at (l
, quoted
); /* XXX - leak here */
1009 if (var
== 0 || array_p (var
) || assoc_p (var
) == 0)
1011 if ((flags
& AV_USEIND
) == 0 || indp
== 0)
1013 ind
= array_expand_index (var
, t
, len
);
1016 /* negative subscripts to indexed arrays count back from end */
1017 if (var
&& array_p (var
))
1018 ind
= array_max_index (array_cell (var
)) + 1 + ind
;
1028 else if (assoc_p (var
))
1031 akey
= expand_assignment_string_to_string (t
, 0); /* [ */
1033 if (akey
== 0 || *akey
== 0)
1040 if (var
== 0 || value_cell (var
) == 0) /* XXX - check invisible_p(var) ? */
1043 return ((char *)NULL
);
1045 if (array_p (var
) == 0 && assoc_p (var
) == 0)
1046 return (ind
== 0 ? value_cell (var
) : (char *)NULL
);
1047 else if (assoc_p (var
))
1049 retval
= assoc_reference (assoc_cell (var
), akey
);
1053 retval
= array_reference (array_cell (var
), ind
);
1059 /* Return a string containing the elements described by the array and
1060 subscript contained in S, obeying quoting for subscripts * and @. */
/* array_value (S, QUOTED, FLAGS, RTYPE, INDP)
   Thin wrapper around array_value_internal that always adds AV_ALLOWALL
   to FLAGS, so the * and @ subscripts are accepted.  All other arguments
   are passed through unchanged and the result is returned as is. */
1062 array_value (s
, quoted
, flags
, rtype
, indp
)
1064 int quoted
, flags
, *rtype
;
1067 return (array_value_internal (s
, quoted
, flags
|AV_ALLOWALL
, rtype
, indp
));
1070 /* Return the value of the array indexing expression S as a single string.
1071 If (FLAGS & AV_ALLOWALL) is 0, do not allow `@' and `*' subscripts. This
1072 is used by other parts of the shell such as the arithmetic expression
1073 evaluator in expr.c. */
/* get_array_value (S, FLAGS, RTYPE, INDP)
   Thin wrapper around array_value_internal with QUOTED fixed at 0.
   FLAGS is passed through unchanged, so the * and @ subscripts are only
   accepted when the caller sets AV_ALLOWALL itself. */
1075 get_array_value (s
, flags
, rtype
, indp
)
1080 return (array_value_internal (s
, 0, flags
, rtype
, indp
));
/* array_keys (S, QUOTED)
   Return the keys (indices) of the array named in S as one string.
   Flow visible in this listing:
     - array_variable_part resolves the variable and the subscript t;
     - NULL is returned when there is no variable or the subscript is
       not exactly * or @ followed by the closing bracket;
     - NULL is returned when the variable is unset or invisible;
     - a variable that is neither indexed nor associative yields the
       single key 0; otherwise the keys come from
       assoc_keys_to_word_list or array_keys_to_word_list;
     - a null key list returns NULL;
     - for * with QUOTED containing Q_HERE_DOCUMENT or Q_DOUBLE_QUOTES
       the keys are joined with string_list_dollar_star and passed
       through quote_string; otherwise string_list_dollar_at is used.
   NOTE(review): frees of the temporaries and the final return are on
   lines missing from this listing. */
1084 array_keys (s
, quoted
)
1089 char *retval
, *t
, *temp
;
1093 var
= array_variable_part (s
, &t
, &len
);
1096 if (var
== 0 || ALL_ELEMENT_SUB (t
[0]) == 0 || t
[1] != ']')
1097 return (char *)NULL
;
1099 if (var_isset (var
) == 0 || invisible_p (var
))
1100 return (char *)NULL
;
1102 if (array_p (var
) == 0 && assoc_p (var
) == 0)
1103 l
= add_string_to_list ("0", (WORD_LIST
*)NULL
);
1104 else if (assoc_p (var
))
1105 l
= assoc_keys_to_word_list (assoc_cell (var
));
1107 l
= array_keys_to_word_list (array_cell (var
));
1108 if (l
== (WORD_LIST
*)NULL
)
1109 return ((char *) NULL
);
1111 if (t
[0] == '*' && (quoted
& (Q_HERE_DOCUMENT
|Q_DOUBLE_QUOTES
)))
1113 temp
= string_list_dollar_star (l
);
1114 retval
= quote_string (temp
);
1117 else /* ${!name[@]} or unquoted ${!name[*]} */
1118 retval
= string_list_dollar_at (l
, quoted
);
1123 #endif /* ARRAY_VARS */