| /* subst.c -- The part of the shell that does parameter, command, arithmetic, |
| and globbing substitutions. */ |
| |
| /* ``Have a little faith, there's magic in the night. You ain't a |
| beauty, but, hey, you're alright.'' */ |
| |
| /* Copyright (C) 1987-2020 Free Software Foundation, Inc. |
| |
| This file is part of GNU Bash, the Bourne Again SHell. |
| |
| Bash is free software: you can redistribute it and/or modify |
| it under the terms of the GNU General Public License as published by |
| the Free Software Foundation, either version 3 of the License, or |
| (at your option) any later version. |
| |
| Bash is distributed in the hope that it will be useful, |
| but WITHOUT ANY WARRANTY; without even the implied warranty of |
| MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| GNU General Public License for more details. |
| |
| You should have received a copy of the GNU General Public License |
| along with Bash. If not, see <http://www.gnu.org/licenses/>. |
| */ |
| |
| #include "config.h" |
| |
| #include "bashtypes.h" |
| #include <stdio.h> |
| #include "chartypes.h" |
| #if defined (HAVE_PWD_H) |
| # include <pwd.h> |
| #endif |
| #include <signal.h> |
| #include <errno.h> |
| |
| #if defined (HAVE_UNISTD_H) |
| # include <unistd.h> |
| #endif |
| |
| #define NEED_FPURGE_DECL |
| |
| #include "bashansi.h" |
| #include "posixstat.h" |
| #include "bashintl.h" |
| |
| #include "shell.h" |
| #include "parser.h" |
| #include "flags.h" |
| #include "jobs.h" |
| #include "execute_cmd.h" |
| #include "filecntl.h" |
| #include "trap.h" |
| #include "pathexp.h" |
| #include "mailcheck.h" |
| |
| #include "shmbutil.h" |
| #if defined (HAVE_MBSTR_H) && defined (HAVE_MBSCHR) |
| # include <mbstr.h> /* mbschr */ |
| #endif |
| #include "typemax.h" |
| |
| #include "builtins/getopt.h" |
| #include "builtins/common.h" |
| |
| #include "builtins/builtext.h" |
| |
| #include <tilde/tilde.h> |
| #include <glob/strmatch.h> |
| |
| #if !defined (errno) |
| extern int errno; |
| #endif /* !errno */ |
| |
| /* The size that strings change by. */ |
| #define DEFAULT_INITIAL_ARRAY_SIZE 112 |
| #define DEFAULT_ARRAY_SIZE 128 |
| |
| /* Variable types. */ |
| #define VT_VARIABLE 0 |
| #define VT_POSPARMS 1 |
| #define VT_ARRAYVAR 2 |
| #define VT_ARRAYMEMBER 3 |
| #define VT_ASSOCVAR 4 |
| |
| #define VT_STARSUB 128 /* $* or ${array[*]} -- used to split */ |
| |
| /* Flags for quoted_strchr */ |
| #define ST_BACKSL 0x01 |
| #define ST_CTLESC 0x02 |
| #define ST_SQUOTE 0x04 /* unused yet */ |
| #define ST_DQUOTE 0x08 /* unused yet */ |
| |
| /* These defs make it easier to use the editor. */ |
| #define LBRACE '{' |
| #define RBRACE '}' |
| #define LPAREN '(' |
| #define RPAREN ')' |
| #define LBRACK '[' |
| #define RBRACK ']' |
| |
| #if defined (HANDLE_MULTIBYTE) |
| #define WLPAREN L'(' |
| #define WRPAREN L')' |
| #endif |
| |
| #define DOLLAR_AT_STAR(c) ((c) == '@' || (c) == '*') |
| #define STR_DOLLAR_AT_STAR(s) (DOLLAR_AT_STAR ((s)[0]) && (s)[1] == '\0') |
| |
| /* Evaluates to 1 if C is one of the shell's special parameters whose length |
| can be taken, but is also one of the special expansion characters. */ |
| #define VALID_SPECIAL_LENGTH_PARAM(c) \ |
| ((c) == '-' || (c) == '?' || (c) == '#' || (c) == '@') |
| |
| /* Evaluates to 1 if C is one of the shell's special parameters for which an |
| indirect variable reference may be made. */ |
| #define VALID_INDIR_PARAM(c) \ |
| ((posixly_correct == 0 && (c) == '#') || (posixly_correct == 0 && (c) == '?') || (c) == '@' || (c) == '*') |
| |
| /* Evaluates to 1 if C is one of the OP characters that follows the parameter |
| in ${parameter[:]OPword}. */ |
| #define VALID_PARAM_EXPAND_CHAR(c) (sh_syntaxtab[(unsigned char)c] & CSUBSTOP) |
| |
| /* Evaluates to 1 if this is one of the shell's special variables. */ |
| #define SPECIAL_VAR(name, wi) \ |
| (*name && ((DIGIT (*name) && all_digits (name)) || \ |
| (name[1] == '\0' && (sh_syntaxtab[(unsigned char)*name] & CSPECVAR)) || \ |
| (wi && name[2] == '\0' && VALID_INDIR_PARAM (name[1])))) |
| |
| /* This can be used by all of the *_extract_* functions that have a similar |
| structure. It can't just be wrapped in a do...while(0) loop because of |
| the embedded `break'. The dangling else accommodates a trailing semicolon; |
| we could also put in a do ; while (0) */ |
| |
| #define CHECK_STRING_OVERRUN(oind, ind, len, ch) \ |
| if (ind >= len) \ |
| { \ |
| oind = len; \ |
| ch = 0; \ |
| break; \ |
| } \ |
| else \ |
| |
| /* An expansion function that takes a string and a quoted flag and returns |
| a WORD_LIST *. Used as the type of the third argument to |
| expand_string_if_necessary(). */ |
| typedef WORD_LIST *EXPFUNC PARAMS((char *, int)); |
| |
| /* Process ID of the last command executed within command substitution. */ |
| pid_t last_command_subst_pid = NO_PID; |
| pid_t current_command_subst_pid = NO_PID; |
| |
| /* Variables used to keep track of the characters in IFS. */ |
| SHELL_VAR *ifs_var; |
| char *ifs_value; |
| unsigned char ifs_cmap[UCHAR_MAX + 1]; |
| int ifs_is_set, ifs_is_null; |
| |
| #if defined (HANDLE_MULTIBYTE) |
| unsigned char ifs_firstc[MB_LEN_MAX]; |
| size_t ifs_firstc_len; |
| #else |
| unsigned char ifs_firstc; |
| #endif |
| |
| /* If non-zero, command substitution inherits the value of errexit option */ |
| int inherit_errexit = 0; |
| |
| /* Sentinel to tell when we are performing variable assignments preceding a |
| command name and putting them into the environment. Used to make sure |
| we use the temporary environment when looking up variable values. */ |
| int assigning_in_environment; |
| |
| /* Used to hold a list of variable assignments preceding a command. Global |
| so the SIGCHLD handler in jobs.c can unwind-protect it when it runs a |
| SIGCHLD trap and so it can be saved and restored by the trap handlers. */ |
| WORD_LIST *subst_assign_varlist = (WORD_LIST *)NULL; |
| |
| /* Tell the expansion functions to not longjmp back to top_level on fatal |
| errors. Enabled when doing completion and prompt string expansion. */ |
| int no_longjmp_on_fatal_error = 0; |
| |
| /* Non-zero means to allow unmatched globbed filenames to expand to |
| a null file. */ |
| int allow_null_glob_expansion; |
| |
| /* Non-zero means to throw an error when globbing fails to match anything. */ |
| int fail_glob_expansion; |
| |
| /* Extern functions and variables from different files. */ |
| extern struct fd_bitmap *current_fds_to_close; |
| extern int wordexp_only; |
| |
| #if defined (JOB_CONTROL) && defined (PROCESS_SUBSTITUTION) |
| extern PROCESS *last_procsub_child; |
| #endif |
| |
| #if !defined (HAVE_WCSDUP) && defined (HANDLE_MULTIBYTE) |
| extern wchar_t *wcsdup PARAMS((const wchar_t *)); |
| #endif |
| |
| #if 0 |
| /* Variables to keep track of which words in an expanded word list (the |
| output of expand_word_list_internal) are the result of globbing |
| expansions. GLOB_ARGV_FLAGS is used by execute_cmd.c. |
| (CURRENTLY UNUSED). */ |
| char *glob_argv_flags; |
| static int glob_argv_flags_size; |
| #endif |
| |
| static WORD_LIST *cached_quoted_dollar_at = 0; |
| |
| /* Distinguished error values to return from expansion functions */ |
| static WORD_LIST expand_word_error, expand_word_fatal; |
| static WORD_DESC expand_wdesc_error, expand_wdesc_fatal; |
| static char expand_param_error, expand_param_fatal, expand_param_unset; |
| static char extract_string_error, extract_string_fatal; |
| |
| /* Set by expand_word_unsplit and several of the expand_string_XXX functions; |
| used to inhibit splitting and re-joining $* on $IFS, primarily when doing |
| assignment statements. The idea is that if we're in a context where this |
| is set, we're not going to be performing word splitting, so we use the same |
| rules to expand $* as we would if it appeared within double quotes. */ |
| static int expand_no_split_dollar_star = 0; |
| |
| /* A WORD_LIST of words to be expanded by expand_word_list_internal, |
| without any leading variable assignments. */ |
| static WORD_LIST *garglist = (WORD_LIST *)NULL; |
| |
| static char *quoted_substring PARAMS((char *, int, int)); |
| static int quoted_strlen PARAMS((char *)); |
| static char *quoted_strchr PARAMS((char *, int, int)); |
| |
| static char *expand_string_if_necessary PARAMS((char *, int, EXPFUNC *)); |
| static inline char *expand_string_to_string_internal PARAMS((char *, int, EXPFUNC *)); |
| static WORD_LIST *call_expand_word_internal PARAMS((WORD_DESC *, int, int, int *, int *)); |
| static WORD_LIST *expand_string_internal PARAMS((char *, int)); |
| static WORD_LIST *expand_string_leave_quoted PARAMS((char *, int)); |
| static WORD_LIST *expand_string_for_rhs PARAMS((char *, int, int, int, int *, int *)); |
| static WORD_LIST *expand_string_for_pat PARAMS((char *, int, int *, int *)); |
| |
| static char *quote_escapes_internal PARAMS((const char *, int)); |
| |
| static WORD_LIST *list_quote_escapes PARAMS((WORD_LIST *)); |
| static WORD_LIST *list_dequote_escapes PARAMS((WORD_LIST *)); |
| |
| static char *make_quoted_char PARAMS((int)); |
| static WORD_LIST *quote_list PARAMS((WORD_LIST *)); |
| |
| static int unquoted_substring PARAMS((char *, char *)); |
| static int unquoted_member PARAMS((int, char *)); |
| |
| #if defined (ARRAY_VARS) |
| static SHELL_VAR *do_compound_assignment PARAMS((char *, char *, int)); |
| #endif |
| static int do_assignment_internal PARAMS((const WORD_DESC *, int)); |
| |
| static char *string_extract_verbatim PARAMS((char *, size_t, int *, char *, int)); |
| static char *string_extract PARAMS((char *, int *, char *, int)); |
| static char *string_extract_double_quoted PARAMS((char *, int *, int)); |
| static inline char *string_extract_single_quoted PARAMS((char *, int *)); |
| static inline int skip_single_quoted PARAMS((const char *, size_t, int, int)); |
| static int skip_double_quoted PARAMS((char *, size_t, int, int)); |
| static char *extract_delimited_string PARAMS((char *, int *, char *, char *, char *, int)); |
| static char *extract_dollar_brace_string PARAMS((char *, int *, int, int)); |
| static int skip_matched_pair PARAMS((const char *, int, int, int, int)); |
| |
| static char *pos_params PARAMS((char *, int, int, int, int)); |
| |
| static unsigned char *mb_getcharlens PARAMS((char *, int)); |
| |
| static char *remove_upattern PARAMS((char *, char *, int)); |
| #if defined (HANDLE_MULTIBYTE) |
| static wchar_t *remove_wpattern PARAMS((wchar_t *, size_t, wchar_t *, int)); |
| #endif |
| static char *remove_pattern PARAMS((char *, char *, int)); |
| |
| static int match_upattern PARAMS((char *, char *, int, char **, char **)); |
| #if defined (HANDLE_MULTIBYTE) |
| static int match_wpattern PARAMS((wchar_t *, char **, size_t, wchar_t *, int, char **, char **)); |
| #endif |
| static int match_pattern PARAMS((char *, char *, int, char **, char **)); |
| static int getpatspec PARAMS((int, char *)); |
| static char *getpattern PARAMS((char *, int, int)); |
| static char *variable_remove_pattern PARAMS((char *, char *, int, int)); |
| static char *list_remove_pattern PARAMS((WORD_LIST *, char *, int, int, int)); |
| static char *parameter_list_remove_pattern PARAMS((int, char *, int, int)); |
| #ifdef ARRAY_VARS |
| static char *array_remove_pattern PARAMS((SHELL_VAR *, char *, int, int, int)); |
| #endif |
| static char *parameter_brace_remove_pattern PARAMS((char *, char *, int, char *, int, int, int)); |
| |
| static char *string_var_assignment PARAMS((SHELL_VAR *, char *)); |
| #if defined (ARRAY_VARS) |
| static char *array_var_assignment PARAMS((SHELL_VAR *, int, int, int)); |
| #endif |
| static char *pos_params_assignment PARAMS((WORD_LIST *, int, int)); |
| static char *string_transform PARAMS((int, SHELL_VAR *, char *)); |
| static char *list_transform PARAMS((int, SHELL_VAR *, WORD_LIST *, int, int)); |
| static char *parameter_list_transform PARAMS((int, int, int)); |
| #if defined ARRAY_VARS |
| static char *array_transform PARAMS((int, SHELL_VAR *, int, int)); |
| #endif |
| static char *parameter_brace_transform PARAMS((char *, char *, int, char *, int, int, int, int)); |
| static int valid_parameter_transform PARAMS((char *)); |
| |
| static char *process_substitute PARAMS((char *, int)); |
| |
| static char *read_comsub PARAMS((int, int, int, int *)); |
| |
| #ifdef ARRAY_VARS |
| static arrayind_t array_length_reference PARAMS((char *)); |
| #endif |
| |
| static int valid_brace_expansion_word PARAMS((char *, int)); |
| static int chk_atstar PARAMS((char *, int, int, int *, int *)); |
| static int chk_arithsub PARAMS((const char *, int)); |
| |
| static WORD_DESC *parameter_brace_expand_word PARAMS((char *, int, int, int, arrayind_t *)); |
| static char *parameter_brace_find_indir PARAMS((char *, int, int, int)); |
| static WORD_DESC *parameter_brace_expand_indir PARAMS((char *, int, int, int, int *, int *)); |
| static WORD_DESC *parameter_brace_expand_rhs PARAMS((char *, char *, int, int, int, int *, int *)); |
| static void parameter_brace_expand_error PARAMS((char *, char *, int)); |
| |
| static int valid_length_expression PARAMS((char *)); |
| static intmax_t parameter_brace_expand_length PARAMS((char *)); |
| |
| static char *skiparith PARAMS((char *, int)); |
| static int verify_substring_values PARAMS((SHELL_VAR *, char *, char *, int, intmax_t *, intmax_t *)); |
| static int get_var_and_type PARAMS((char *, char *, arrayind_t, int, int, SHELL_VAR **, char **)); |
| static char *mb_substring PARAMS((char *, int, int)); |
| static char *parameter_brace_substring PARAMS((char *, char *, int, char *, int, int, int)); |
| |
| static int shouldexp_replacement PARAMS((char *)); |
| |
| static char *pos_params_pat_subst PARAMS((char *, char *, char *, int)); |
| |
| static char *parameter_brace_patsub PARAMS((char *, char *, int, char *, int, int, int)); |
| |
| static char *pos_params_casemod PARAMS((char *, char *, int, int)); |
| static char *parameter_brace_casemod PARAMS((char *, char *, int, int, char *, int, int, int)); |
| |
| static WORD_DESC *parameter_brace_expand PARAMS((char *, int *, int, int, int *, int *)); |
| static WORD_DESC *param_expand PARAMS((char *, int *, int, int *, int *, int *, int *, int)); |
| |
| static WORD_LIST *expand_word_internal PARAMS((WORD_DESC *, int, int, int *, int *)); |
| |
| static WORD_LIST *word_list_split PARAMS((WORD_LIST *)); |
| |
| static void exp_jump_to_top_level PARAMS((int)); |
| |
| static WORD_LIST *separate_out_assignments PARAMS((WORD_LIST *)); |
| static WORD_LIST *glob_expand_word_list PARAMS((WORD_LIST *, int)); |
| #ifdef BRACE_EXPANSION |
| static WORD_LIST *brace_expand_word_list PARAMS((WORD_LIST *, int)); |
| #endif |
| #if defined (ARRAY_VARS) |
| static int make_internal_declare PARAMS((char *, char *, char *)); |
| static void expand_compound_assignment_word PARAMS((WORD_LIST *, int)); |
| static WORD_LIST *expand_declaration_argument PARAMS((WORD_LIST *, WORD_LIST *)); |
| #endif |
| static WORD_LIST *shell_expand_word_list PARAMS((WORD_LIST *, int)); |
| static WORD_LIST *expand_word_list_internal PARAMS((WORD_LIST *, int)); |
| |
| /* **************************************************************** */ |
| /* */ |
| /* Utility Functions */ |
| /* */ |
| /* **************************************************************** */ |
| |
| #if defined (DEBUG) |
| void |
| dump_word_flags (flags) |
| int flags; |
| { |
| int f; |
| |
| f = flags; |
| fprintf (stderr, "%d -> ", f); |
| if (f & W_ARRAYIND) |
| { |
| f &= ~W_ARRAYIND; |
| fprintf (stderr, "W_ARRAYIND%s", f ? "|" : ""); |
| } |
| if (f & W_ASSIGNASSOC) |
| { |
| f &= ~W_ASSIGNASSOC; |
| fprintf (stderr, "W_ASSIGNASSOC%s", f ? "|" : ""); |
| } |
| if (f & W_ASSIGNARRAY) |
| { |
| f &= ~W_ASSIGNARRAY; |
| fprintf (stderr, "W_ASSIGNARRAY%s", f ? "|" : ""); |
| } |
| if (f & W_SAWQUOTEDNULL) |
| { |
| f &= ~W_SAWQUOTEDNULL; |
| fprintf (stderr, "W_SAWQUOTEDNULL%s", f ? "|" : ""); |
| } |
| if (f & W_NOPROCSUB) |
| { |
| f &= ~W_NOPROCSUB; |
| fprintf (stderr, "W_NOPROCSUB%s", f ? "|" : ""); |
| } |
| if (f & W_DQUOTE) |
| { |
| f &= ~W_DQUOTE; |
| fprintf (stderr, "W_DQUOTE%s", f ? "|" : ""); |
| } |
| if (f & W_HASQUOTEDNULL) |
| { |
| f &= ~W_HASQUOTEDNULL; |
| fprintf (stderr, "W_HASQUOTEDNULL%s", f ? "|" : ""); |
| } |
| if (f & W_ASSIGNARG) |
| { |
| f &= ~W_ASSIGNARG; |
| fprintf (stderr, "W_ASSIGNARG%s", f ? "|" : ""); |
| } |
| if (f & W_ASSNBLTIN) |
| { |
| f &= ~W_ASSNBLTIN; |
| fprintf (stderr, "W_ASSNBLTIN%s", f ? "|" : ""); |
| } |
| if (f & W_ASSNGLOBAL) |
| { |
| f &= ~W_ASSNGLOBAL; |
| fprintf (stderr, "W_ASSNGLOBAL%s", f ? "|" : ""); |
| } |
| if (f & W_COMPASSIGN) |
| { |
| f &= ~W_COMPASSIGN; |
| fprintf (stderr, "W_COMPASSIGN%s", f ? "|" : ""); |
| } |
| if (f & W_EXPANDRHS) |
| { |
| f &= ~W_EXPANDRHS; |
| fprintf (stderr, "W_EXPANDRHS%s", f ? "|" : ""); |
| } |
| if (f & W_ITILDE) |
| { |
| f &= ~W_ITILDE; |
| fprintf (stderr, "W_ITILDE%s", f ? "|" : ""); |
| } |
| if (f & W_NOTILDE) |
| { |
| f &= ~W_NOTILDE; |
| fprintf (stderr, "W_NOTILDE%s", f ? "|" : ""); |
| } |
| if (f & W_ASSIGNRHS) |
| { |
| f &= ~W_ASSIGNRHS; |
| fprintf (stderr, "W_ASSIGNRHS%s", f ? "|" : ""); |
| } |
| if (f & W_NOASSNTILDE) |
| { |
| f &= ~W_NOASSNTILDE; |
| fprintf (stderr, "W_NOASSNTILDE%s", f ? "|" : ""); |
| } |
| if (f & W_NOCOMSUB) |
| { |
| f &= ~W_NOCOMSUB; |
| fprintf (stderr, "W_NOCOMSUB%s", f ? "|" : ""); |
| } |
| if (f & W_DOLLARSTAR) |
| { |
| f &= ~W_DOLLARSTAR; |
| fprintf (stderr, "W_DOLLARSTAR%s", f ? "|" : ""); |
| } |
| if (f & W_DOLLARAT) |
| { |
| f &= ~W_DOLLARAT; |
| fprintf (stderr, "W_DOLLARAT%s", f ? "|" : ""); |
| } |
| if (f & W_TILDEEXP) |
| { |
| f &= ~W_TILDEEXP; |
| fprintf (stderr, "W_TILDEEXP%s", f ? "|" : ""); |
| } |
| if (f & W_NOSPLIT2) |
| { |
| f &= ~W_NOSPLIT2; |
| fprintf (stderr, "W_NOSPLIT2%s", f ? "|" : ""); |
| } |
| if (f & W_NOSPLIT) |
| { |
| f &= ~W_NOSPLIT; |
| fprintf (stderr, "W_NOSPLIT%s", f ? "|" : ""); |
| } |
| if (f & W_NOBRACE) |
| { |
| f &= ~W_NOBRACE; |
| fprintf (stderr, "W_NOBRACE%s", f ? "|" : ""); |
| } |
| if (f & W_NOGLOB) |
| { |
| f &= ~W_NOGLOB; |
| fprintf (stderr, "W_NOGLOB%s", f ? "|" : ""); |
| } |
| if (f & W_SPLITSPACE) |
| { |
| f &= ~W_SPLITSPACE; |
| fprintf (stderr, "W_SPLITSPACE%s", f ? "|" : ""); |
| } |
| if (f & W_ASSIGNMENT) |
| { |
| f &= ~W_ASSIGNMENT; |
| fprintf (stderr, "W_ASSIGNMENT%s", f ? "|" : ""); |
| } |
| if (f & W_QUOTED) |
| { |
| f &= ~W_QUOTED; |
| fprintf (stderr, "W_QUOTED%s", f ? "|" : ""); |
| } |
| if (f & W_HASDOLLAR) |
| { |
| f &= ~W_HASDOLLAR; |
| fprintf (stderr, "W_HASDOLLAR%s", f ? "|" : ""); |
| } |
| if (f & W_COMPLETE) |
| { |
| f &= ~W_COMPLETE; |
| fprintf (stderr, "W_COMPLETE%s", f ? "|" : ""); |
| } |
| if (f & W_CHKLOCAL) |
| { |
| f &= ~W_CHKLOCAL; |
| fprintf (stderr, "W_CHKLOCAL%s", f ? "|" : ""); |
| } |
| if (f & W_FORCELOCAL) |
| { |
| f &= ~W_FORCELOCAL; |
| fprintf (stderr, "W_FORCELOCAL%s", f ? "|" : ""); |
| } |
| |
| fprintf (stderr, "\n"); |
| fflush (stderr); |
| } |
| #endif |
| |
| #ifdef INCLUDE_UNUSED |
| static char * |
| quoted_substring (string, start, end) |
| char *string; |
| int start, end; |
| { |
| register int len, l; |
| register char *result, *s, *r; |
| |
| len = end - start; |
| |
| /* Move to string[start], skipping quoted characters. */ |
| for (s = string, l = 0; *s && l < start; ) |
| { |
| if (*s == CTLESC) |
| { |
| s++; |
| continue; |
| } |
| l++; |
| if (*s == 0) |
| break; |
| } |
| |
| r = result = (char *)xmalloc (2*len + 1); /* save room for quotes */ |
| |
| /* Copy LEN characters, including quote characters. */ |
| s = string + l; |
| for (l = 0; l < len; s++) |
| { |
| if (*s == CTLESC) |
| *r++ = *s++; |
| *r++ = *s; |
| l++; |
| if (*s == 0) |
| break; |
| } |
| *r = '\0'; |
| return result; |
| } |
| #endif |
| |
| #ifdef INCLUDE_UNUSED |
| /* Return the length of S, skipping over quoted characters */ |
| static int |
| quoted_strlen (s) |
| char *s; |
| { |
| register char *p; |
| int i; |
| |
| i = 0; |
| for (p = s; *p; p++) |
| { |
| if (*p == CTLESC) |
| { |
| p++; |
| if (*p == 0) |
| return (i + 1); |
| } |
| i++; |
| } |
| |
| return i; |
| } |
| #endif |
| |
| #ifdef INCLUDE_UNUSED |
| /* Find the first occurrence of character C in string S, obeying shell |
| quoting rules. If (FLAGS & ST_BACKSL) is non-zero, backslash-escaped |
| characters are skipped. If (FLAGS & ST_CTLESC) is non-zero, characters |
| escaped with CTLESC are skipped. */ |
| static char * |
| quoted_strchr (s, c, flags) |
| char *s; |
| int c, flags; |
| { |
| register char *p; |
| |
| for (p = s; *p; p++) |
| { |
| if (((flags & ST_BACKSL) && *p == '\\') |
| || ((flags & ST_CTLESC) && *p == CTLESC)) |
| { |
| p++; |
| if (*p == '\0') |
| return ((char *)NULL); |
| continue; |
| } |
| else if (*p == c) |
| return p; |
| } |
| return ((char *)NULL); |
| } |
| |
| /* Return 1 if CHARACTER appears in an unquoted portion of |
| STRING. Return 0 otherwise. CHARACTER must be a single-byte character. */ |
| static int |
| unquoted_member (character, string) |
| int character; |
| char *string; |
| { |
| size_t slen; |
| int sindex, c; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| sindex = 0; |
| while (c = string[sindex]) |
| { |
| if (c == character) |
| return (1); |
| |
| switch (c) |
| { |
| default: |
| ADVANCE_CHAR (string, slen, sindex); |
| break; |
| |
| case '\\': |
| sindex++; |
| if (string[sindex]) |
| ADVANCE_CHAR (string, slen, sindex); |
| break; |
| |
| case '\'': |
| sindex = skip_single_quoted (string, slen, ++sindex, 0); |
| break; |
| |
| case '"': |
| sindex = skip_double_quoted (string, slen, ++sindex, 0); |
| break; |
| } |
| } |
| return (0); |
| } |
| |
| /* Return 1 if SUBSTR appears in an unquoted portion of STRING. */ |
| static int |
| unquoted_substring (substr, string) |
| char *substr, *string; |
| { |
| size_t slen; |
| int sindex, c, sublen; |
| DECLARE_MBSTATE; |
| |
| if (substr == 0 || *substr == '\0') |
| return (0); |
| |
| slen = strlen (string); |
| sublen = strlen (substr); |
| for (sindex = 0; c = string[sindex]; ) |
| { |
| if (STREQN (string + sindex, substr, sublen)) |
| return (1); |
| |
| switch (c) |
| { |
| case '\\': |
| sindex++; |
| if (string[sindex]) |
| ADVANCE_CHAR (string, slen, sindex); |
| break; |
| |
| case '\'': |
| sindex = skip_single_quoted (string, slen, ++sindex, 0); |
| break; |
| |
| case '"': |
| sindex = skip_double_quoted (string, slen, ++sindex, 0); |
| break; |
| |
| default: |
| ADVANCE_CHAR (string, slen, sindex); |
| break; |
| } |
| } |
| return (0); |
| } |
| #endif |
| |
| /* Most of the substitutions must be done in parallel. In order |
| to avoid using tons of unclear goto's, I have some functions |
| for manipulating malloc'ed strings. They all take INDX, a |
| pointer to an integer which is the offset into the string |
| where manipulation is taking place. They also take SIZE, a |
| pointer to an integer which is the current length of the |
| character array for this string. */ |
| |
| /* Append SOURCE to TARGET at INDEX. SIZE is the current amount |
| of space allocated to TARGET. SOURCE can be NULL, in which |
| case nothing happens. Gets rid of SOURCE by freeing it. |
| Returns TARGET in case the location has changed. */ |
| INLINE char * |
| sub_append_string (source, target, indx, size) |
| char *source, *target; |
| int *indx; |
| size_t *size; |
| { |
| if (source) |
| { |
| int n; |
| size_t srclen; |
| |
| srclen = STRLEN (source); |
| if (srclen >= (int)(*size - *indx)) |
| { |
| n = srclen + *indx; |
| n = (n + DEFAULT_ARRAY_SIZE) - (n % DEFAULT_ARRAY_SIZE); |
| target = (char *)xrealloc (target, (*size = n)); |
| } |
| |
| FASTCOPY (source, target + *indx, srclen); |
| *indx += srclen; |
| target[*indx] = '\0'; |
| |
| free (source); |
| } |
| return (target); |
| } |
| |
| #if 0 |
| /* UNUSED */ |
| /* Append the textual representation of NUMBER to TARGET. |
| INDX and SIZE are as in SUB_APPEND_STRING. */ |
| char * |
| sub_append_number (number, target, indx, size) |
| intmax_t number; |
| char *target; |
| int *indx; |
| size_t *size; |
| { |
| char *temp; |
| |
| temp = itos (number); |
| return (sub_append_string (temp, target, indx, size)); |
| } |
| #endif |
| |
| /* Extract a substring from STRING, starting at SINDEX and ending with |
| one of the characters in CHARLIST. Don't make the ending character |
| part of the string. Leave SINDEX pointing at the ending character. |
| Understand about backslashes in the string. If (flags & SX_VARNAME) |
| is non-zero, and array variables have been compiled into the shell, |
| everything between a `[' and a corresponding `]' is skipped over. |
| If (flags & SX_NOALLOC) is non-zero, don't return the substring, just |
| update SINDEX. If (flags & SX_REQMATCH) is non-zero, the string must |
| contain a closing character from CHARLIST. */ |
| static char * |
| string_extract (string, sindex, charlist, flags) |
| char *string; |
| int *sindex; |
| char *charlist; |
| int flags; |
| { |
| register int c, i; |
| int found; |
| size_t slen; |
| char *temp; |
| DECLARE_MBSTATE; |
| |
| slen = (MB_CUR_MAX > 1) ? strlen (string + *sindex) + *sindex : 0; |
| i = *sindex; |
| found = 0; |
| while (c = string[i]) |
| { |
| if (c == '\\') |
| { |
| if (string[i + 1]) |
| i++; |
| else |
| break; |
| } |
| #if defined (ARRAY_VARS) |
| else if ((flags & SX_VARNAME) && c == LBRACK) |
| { |
| int ni; |
| /* If this is an array subscript, skip over it and continue. */ |
| ni = skipsubscript (string, i, 0); |
| if (string[ni] == RBRACK) |
| i = ni; |
| } |
| #endif |
| else if (MEMBER (c, charlist)) |
| { |
| found = 1; |
| break; |
| } |
| |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| /* If we had to have a matching delimiter and didn't find one, return an |
| error and let the caller deal with it. */ |
| if ((flags & SX_REQMATCH) && found == 0) |
| { |
| *sindex = i; |
| return (&extract_string_error); |
| } |
| |
| temp = (flags & SX_NOALLOC) ? (char *)NULL : substring (string, *sindex, i); |
| *sindex = i; |
| |
| return (temp); |
| } |
| |
| /* Extract the contents of STRING as if it is enclosed in double quotes. |
| SINDEX, when passed in, is the offset of the character immediately |
| following the opening double quote; on exit, SINDEX is left pointing after |
| the closing double quote. If STRIPDQ is non-zero, unquoted double |
| quotes are stripped and the string is terminated by a null byte. |
| Backslashes between the embedded double quotes are processed. If STRIPDQ |
| is zero, an unquoted `"' terminates the string. */ |
| static char * |
| string_extract_double_quoted (string, sindex, flags) |
| char *string; |
| int *sindex, flags; |
| { |
| size_t slen; |
| char *send; |
| int j, i, t; |
| unsigned char c; |
| char *temp, *ret; /* The new string we return. */ |
| int pass_next, backquote, si; /* State variables for the machine. */ |
| int dquote; |
| int stripdq; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string + *sindex) + *sindex; |
| send = string + slen; |
| |
| stripdq = (flags & SX_STRIPDQ); |
| |
| pass_next = backquote = dquote = 0; |
| temp = (char *)xmalloc (1 + slen - *sindex); |
| |
| j = 0; |
| i = *sindex; |
| while (c = string[i]) |
| { |
| /* Process a character that was quoted by a backslash. */ |
| if (pass_next) |
| { |
| /* XXX - take another look at this in light of Interp 221 */ |
| /* Posix.2 sez: |
| |
| ``The backslash shall retain its special meaning as an escape |
| character only when followed by one of the characters: |
| $ ` " \ <newline>''. |
| |
| If STRIPDQ is zero, we handle the double quotes here and let |
| expand_word_internal handle the rest. If STRIPDQ is non-zero, |
| we have already been through one round of backslash stripping, |
| and want to strip these backslashes only if DQUOTE is non-zero, |
| indicating that we are inside an embedded double-quoted string. */ |
| |
| /* If we are in an embedded quoted string, then don't strip |
| backslashes before characters for which the backslash |
| retains its special meaning, but remove backslashes in |
| front of other characters. If we are not in an |
| embedded quoted string, don't strip backslashes at all. |
| This mess is necessary because the string was already |
| surrounded by double quotes (and sh has some really weird |
| quoting rules). |
| The returned string will be run through expansion as if |
| it were double-quoted. */ |
| if ((stripdq == 0 && c != '"') || |
| (stripdq && ((dquote && (sh_syntaxtab[c] & CBSDQUOTE)) || dquote == 0))) |
| temp[j++] = '\\'; |
| pass_next = 0; |
| |
| add_one_character: |
| COPY_CHAR_I (temp, j, string, send, i); |
| continue; |
| } |
| |
| /* A backslash protects the next character. The code just above |
| handles preserving the backslash in front of any character but |
| a double quote. */ |
| if (c == '\\') |
| { |
| pass_next++; |
| i++; |
| continue; |
| } |
| |
| /* Inside backquotes, ``the portion of the quoted string from the |
| initial backquote and the characters up to the next backquote |
| that is not preceded by a backslash, having escape characters |
| removed, defines that command''. */ |
| if (backquote) |
| { |
| if (c == '`') |
| backquote = 0; |
| temp[j++] = c; /* COPY_CHAR_I? */ |
| i++; |
| continue; |
| } |
| |
| if (c == '`') |
| { |
| temp[j++] = c; |
| backquote++; |
| i++; |
| continue; |
| } |
| |
| /* Pass everything between `$(' and the matching `)' or a quoted |
| ${ ... } pair through according to the Posix.2 specification. */ |
| if (c == '$' && ((string[i + 1] == LPAREN) || (string[i + 1] == LBRACE))) |
| { |
| int free_ret = 1; |
| |
| si = i + 2; |
| if (string[i + 1] == LPAREN) |
| ret = extract_command_subst (string, &si, (flags & SX_COMPLETE)); |
| else |
| ret = extract_dollar_brace_string (string, &si, Q_DOUBLE_QUOTES, 0); |
| |
| temp[j++] = '$'; |
| temp[j++] = string[i + 1]; |
| |
| /* Just paranoia; ret will not be 0 unless no_longjmp_on_fatal_error |
| is set. */ |
| if (ret == 0 && no_longjmp_on_fatal_error) |
| { |
| free_ret = 0; |
| ret = string + i + 2; |
| } |
| |
| /* XXX - CHECK_STRING_OVERRUN here? */ |
| for (t = 0; ret[t]; t++, j++) |
| temp[j] = ret[t]; |
| temp[j] = string[si]; |
| |
| if (si < i + 2) /* we went back? */ |
| i += 2; |
| else if (string[si]) |
| { |
| j++; |
| i = si + 1; |
| } |
| else |
| i = si; |
| |
| if (free_ret) |
| free (ret); |
| continue; |
| } |
| |
| /* Add any character but a double quote to the quoted string we're |
| accumulating. */ |
| if (c != '"') |
| goto add_one_character; |
| |
| /* c == '"' */ |
| if (stripdq) |
| { |
| dquote ^= 1; |
| i++; |
| continue; |
| } |
| |
| break; |
| } |
| temp[j] = '\0'; |
| |
| /* Point to after the closing quote. */ |
| if (c) |
| i++; |
| *sindex = i; |
| |
| return (temp); |
| } |
| |
| /* This should really be another option to string_extract_double_quoted. */ |
| static int |
| skip_double_quoted (string, slen, sind, flags) |
| char *string; |
| size_t slen; |
| int sind; |
| int flags; |
| { |
| int c, i; |
| char *ret; |
| int pass_next, backquote, si; |
| DECLARE_MBSTATE; |
| |
| pass_next = backquote = 0; |
| i = sind; |
| while (c = string[i]) |
| { |
| if (pass_next) |
| { |
| pass_next = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (c == '\\') |
| { |
| pass_next++; |
| i++; |
| continue; |
| } |
| else if (backquote) |
| { |
| if (c == '`') |
| backquote = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (c == '`') |
| { |
| backquote++; |
| i++; |
| continue; |
| } |
| else if (c == '$' && ((string[i + 1] == LPAREN) || (string[i + 1] == LBRACE))) |
| { |
| si = i + 2; |
| if (string[i + 1] == LPAREN) |
| ret = extract_command_subst (string, &si, SX_NOALLOC|(flags&SX_COMPLETE)); |
| else |
| ret = extract_dollar_brace_string (string, &si, Q_DOUBLE_QUOTES, SX_NOALLOC); |
| |
| /* These can consume the entire string if they are unterminated */ |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| |
| i = si + 1; |
| continue; |
| } |
| else if (c != '"') |
| { |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else |
| break; |
| } |
| |
| if (c) |
| i++; |
| |
| return (i); |
| } |
| |
| /* Extract the contents of STRING as if it is enclosed in single quotes. |
| SINDEX, when passed in, is the offset of the character immediately |
| following the opening single quote; on exit, SINDEX is left pointing after |
| the closing single quote. */ |
| static inline char * |
| string_extract_single_quoted (string, sindex) |
| char *string; |
| int *sindex; |
| { |
| register int i; |
| size_t slen; |
| char *t; |
| DECLARE_MBSTATE; |
| |
| /* Don't need slen for ADVANCE_CHAR unless multibyte chars possible. */ |
| slen = (MB_CUR_MAX > 1) ? strlen (string + *sindex) + *sindex : 0; |
| i = *sindex; |
| while (string[i] && string[i] != '\'') |
| ADVANCE_CHAR (string, slen, i); |
| |
| t = substring (string, *sindex, i); |
| |
| if (string[i]) |
| i++; |
| *sindex = i; |
| |
| return (t); |
| } |
| |
| /* Skip over a single-quoted string. We overload the SX_COMPLETE flag to mean |
| that we are splitting out words for completion and have encountered a $'...' |
| string, which allows backslash-escaped single quotes. */ |
| static inline int |
| skip_single_quoted (string, slen, sind, flags) |
| const char *string; |
| size_t slen; |
| int sind; |
| int flags; |
| { |
| register int c; |
| DECLARE_MBSTATE; |
| |
| c = sind; |
| while (string[c] && string[c] != '\'') |
| { |
| if ((flags & SX_COMPLETE) && string[c] == '\\' && string[c+1] == '\'' && string[c+2]) |
| ADVANCE_CHAR (string, slen, c); |
| ADVANCE_CHAR (string, slen, c); |
| } |
| |
| if (string[c]) |
| c++; |
| return c; |
| } |
| |
| /* Just like string_extract, but doesn't hack backslashes or any of |
| that other stuff. Obeys CTLESC quoting. Used to do splitting on $IFS. */ |
| static char * |
| string_extract_verbatim (string, slen, sindex, charlist, flags) |
| char *string; |
| size_t slen; |
| int *sindex; |
| char *charlist; |
| int flags; |
| { |
| register int i; |
| #if defined (HANDLE_MULTIBYTE) |
| wchar_t *wcharlist; |
| #endif |
| int c; |
| char *temp; |
| DECLARE_MBSTATE; |
| |
| if ((flags & SX_NOCTLESC) && charlist[0] == '\'' && charlist[1] == '\0') |
| { |
| temp = string_extract_single_quoted (string, sindex); |
| --*sindex; /* leave *sindex at separator character */ |
| return temp; |
| } |
| |
| /* This can never be called with charlist == NULL. If *charlist == NULL, |
| we can skip the loop and just return a copy of the string, updating |
| *sindex */ |
| if (*charlist == 0) |
| { |
| temp = string + *sindex; |
| c = (*sindex == 0) ? slen : STRLEN (temp); |
| temp = savestring (temp); |
| *sindex += c; |
| return temp; |
| } |
| |
| i = *sindex; |
| #if defined (HANDLE_MULTIBYTE) |
| wcharlist = 0; |
| #endif |
| while (c = string[i]) |
| { |
| #if defined (HANDLE_MULTIBYTE) |
| size_t mblength; |
| #endif |
| if ((flags & SX_NOCTLESC) == 0 && c == CTLESC) |
| { |
| i += 2; |
| CHECK_STRING_OVERRUN (i, i, slen, c); |
| continue; |
| } |
| /* Even if flags contains SX_NOCTLESC, we let CTLESC quoting CTLNUL |
| through, to protect the CTLNULs from later calls to |
| remove_quoted_nulls. */ |
| else if ((flags & SX_NOESCCTLNUL) == 0 && c == CTLESC && string[i+1] == CTLNUL) |
| { |
| i += 2; |
| CHECK_STRING_OVERRUN (i, i, slen, c); |
| continue; |
| } |
| |
| #if defined (HANDLE_MULTIBYTE) |
| if (locale_utf8locale && slen > i && UTF8_SINGLEBYTE (string[i])) |
| mblength = (string[i] != 0) ? 1 : 0; |
| else |
| mblength = MBLEN (string + i, slen - i); |
| if (mblength > 1) |
| { |
| wchar_t wc; |
| mblength = mbtowc (&wc, string + i, slen - i); |
| if (MB_INVALIDCH (mblength)) |
| { |
| if (MEMBER (c, charlist)) |
| break; |
| } |
| else |
| { |
| if (wcharlist == 0) |
| { |
| size_t len; |
| len = mbstowcs (wcharlist, charlist, 0); |
| if (len == -1) |
| len = 0; |
| wcharlist = (wchar_t *)xmalloc (sizeof (wchar_t) * (len + 1)); |
| mbstowcs (wcharlist, charlist, len + 1); |
| } |
| |
| if (wcschr (wcharlist, wc)) |
| break; |
| } |
| } |
| else |
| #endif |
| if (MEMBER (c, charlist)) |
| break; |
| |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| #if defined (HANDLE_MULTIBYTE) |
| FREE (wcharlist); |
| #endif |
| |
| temp = substring (string, *sindex, i); |
| *sindex = i; |
| |
| return (temp); |
| } |
| |
| /* Extract the $( construct in STRING, and return a new string. |
| Start extracting at (SINDEX) as if we had just seen "$(". |
| Make (SINDEX) get the position of the matching ")". ) |
| XFLAGS is additional flags to pass to other extraction functions. */ |
| char * |
| extract_command_subst (string, sindex, xflags) |
| char *string; |
| int *sindex; |
| int xflags; |
| { |
| char *ret; |
| |
| if (string[*sindex] == LPAREN || (xflags & SX_COMPLETE)) |
| return (extract_delimited_string (string, sindex, "$(", "(", ")", xflags|SX_COMMAND)); /*)*/ |
| else |
| { |
| xflags |= (no_longjmp_on_fatal_error ? SX_NOLONGJMP : 0); |
| ret = xparse_dolparen (string, string+*sindex, sindex, xflags); |
| return ret; |
| } |
| } |
| |
| /* Extract the $[ construct in STRING, and return a new string. (]) |
| Start extracting at (SINDEX) as if we had just seen "$[". |
| Make (SINDEX) get the position of the matching "]". */ |
| char * |
| extract_arithmetic_subst (string, sindex) |
| char *string; |
| int *sindex; |
| { |
| return (extract_delimited_string (string, sindex, "$[", "[", "]", 0)); /*]*/ |
| } |
| |
| #if defined (PROCESS_SUBSTITUTION) |
| /* Extract the <( or >( construct in STRING, and return a new string. |
| Start extracting at (SINDEX) as if we had just seen "<(". |
| Make (SINDEX) get the position of the matching ")". */ /*))*/ |
| char * |
| extract_process_subst (string, starter, sindex, xflags) |
| char *string; |
| char *starter; |
| int *sindex; |
| int xflags; |
| { |
| #if 0 |
| /* XXX - check xflags&SX_COMPLETE here? */ |
| return (extract_delimited_string (string, sindex, starter, "(", ")", SX_COMMAND)); |
| #else |
| xflags |= (no_longjmp_on_fatal_error ? SX_NOLONGJMP : 0); |
| return (xparse_dolparen (string, string+*sindex, sindex, xflags)); |
| #endif |
| } |
| #endif /* PROCESS_SUBSTITUTION */ |
| |
| #if defined (ARRAY_VARS) |
| /* This can be fooled by unquoted right parens in the passed string. If |
| each caller verifies that the last character in STRING is a right paren, |
| we don't even need to call extract_delimited_string. */ |
| char * |
| extract_array_assignment_list (string, sindex) |
| char *string; |
| int *sindex; |
| { |
| int slen; |
| char *ret; |
| |
| slen = strlen (string); |
| if (string[slen - 1] == RPAREN) |
| { |
| ret = substring (string, *sindex, slen - 1); |
| *sindex = slen - 1; |
| return ret; |
| } |
| return 0; |
| } |
| #endif |
| |
| /* Extract and create a new string from the contents of STRING, a |
| character string delimited with OPENER and CLOSER. SINDEX is |
| the address of an int describing the current offset in STRING; |
| it should point to just after the first OPENER found. On exit, |
| SINDEX gets the position of the last character of the matching CLOSER. |
| If OPENER is more than a single character, ALT_OPENER, if non-null, |
| contains a character string that can also match CLOSER and thus |
| needs to be skipped. */ |
| static char * |
| extract_delimited_string (string, sindex, opener, alt_opener, closer, flags) |
| char *string; |
| int *sindex; |
| char *opener, *alt_opener, *closer; |
| int flags; |
| { |
| int i, c, si; |
| size_t slen; |
| char *t, *result; |
| int pass_character, nesting_level, in_comment; |
| int len_closer, len_opener, len_alt_opener; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string + *sindex) + *sindex; |
| len_opener = STRLEN (opener); |
| len_alt_opener = STRLEN (alt_opener); |
| len_closer = STRLEN (closer); |
| |
| pass_character = in_comment = 0; |
| |
| nesting_level = 1; |
| i = *sindex; |
| |
| while (nesting_level) |
| { |
| c = string[i]; |
| |
| /* If a recursive call or a call to ADVANCE_CHAR leaves the index beyond |
| the end of the string, catch it and cut the loop. */ |
| if (i > slen) |
| { |
| i = slen; |
| c = string[i = slen]; |
| break; |
| } |
| |
| if (c == 0) |
| break; |
| |
| if (in_comment) |
| { |
| if (c == '\n') |
| in_comment = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| |
| if (pass_character) /* previous char was backslash */ |
| { |
| pass_character = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| |
| /* Not exactly right yet; should handle shell metacharacters and |
| multibyte characters, too. See COMMENT_BEGIN define in parse.y */ |
| if ((flags & SX_COMMAND) && c == '#' && (i == 0 || string[i - 1] == '\n' || shellblank (string[i - 1]))) |
| { |
| in_comment = 1; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| |
| if (c == CTLESC || c == '\\') |
| { |
| pass_character++; |
| i++; |
| continue; |
| } |
| |
| /* Process a nested command substitution, but only if we're parsing an |
| arithmetic substitution. */ |
| if ((flags & SX_COMMAND) && string[i] == '$' && string[i+1] == LPAREN) |
| { |
| si = i + 2; |
| t = extract_command_subst (string, &si, flags|SX_NOALLOC); |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si + 1; |
| continue; |
| } |
| |
| /* Process a nested OPENER. */ |
| if (STREQN (string + i, opener, len_opener)) |
| { |
| si = i + len_opener; |
| t = extract_delimited_string (string, &si, opener, alt_opener, closer, flags|SX_NOALLOC); |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si + 1; |
| continue; |
| } |
| |
| /* Process a nested ALT_OPENER */ |
| if (len_alt_opener && STREQN (string + i, alt_opener, len_alt_opener)) |
| { |
| si = i + len_alt_opener; |
| t = extract_delimited_string (string, &si, alt_opener, alt_opener, closer, flags|SX_NOALLOC); |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si + 1; |
| continue; |
| } |
| |
| /* If the current substring terminates the delimited string, decrement |
| the nesting level. */ |
| if (STREQN (string + i, closer, len_closer)) |
| { |
| i += len_closer - 1; /* move to last byte of the closer */ |
| nesting_level--; |
| if (nesting_level == 0) |
| break; |
| } |
| |
| /* Pass old-style command substitution through verbatim. */ |
| if (c == '`') |
| { |
| si = i + 1; |
| t = string_extract (string, &si, "`", flags|SX_NOALLOC); |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si + 1; |
| continue; |
| } |
| |
| /* Pass single-quoted and double-quoted strings through verbatim. */ |
| if (c == '\'' || c == '"') |
| { |
| si = i + 1; |
| i = (c == '\'') ? skip_single_quoted (string, slen, si, 0) |
| : skip_double_quoted (string, slen, si, 0); |
| continue; |
| } |
| |
| /* move past this character, which was not special. */ |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| if (c == 0 && nesting_level) |
| { |
| if (no_longjmp_on_fatal_error == 0) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| report_error (_("bad substitution: no closing `%s' in %s"), closer, string); |
| exp_jump_to_top_level (DISCARD); |
| } |
| else |
| { |
| *sindex = i; |
| return (char *)NULL; |
| } |
| } |
| |
| si = i - *sindex - len_closer + 1; |
| if (flags & SX_NOALLOC) |
| result = (char *)NULL; |
| else |
| { |
| result = (char *)xmalloc (1 + si); |
| strncpy (result, string + *sindex, si); |
| result[si] = '\0'; |
| } |
| *sindex = i; |
| |
| return (result); |
| } |
| |
| /* Extract a parameter expansion expression within ${ and } from STRING. |
| Obey the Posix.2 rules for finding the ending `}': count braces while |
| skipping over enclosed quoted strings and command substitutions. |
| SINDEX is the address of an int describing the current offset in STRING; |
| it should point to just after the first `{' found. On exit, SINDEX |
| gets the position of the matching `}'. QUOTED is non-zero if this |
| occurs inside double quotes. */ |
| /* XXX -- this is very similar to extract_delimited_string -- XXX */ |
| static char * |
| extract_dollar_brace_string (string, sindex, quoted, flags) |
| char *string; |
| int *sindex, quoted, flags; |
| { |
| register int i, c; |
| size_t slen; |
| int pass_character, nesting_level, si, dolbrace_state; |
| char *result, *t; |
| DECLARE_MBSTATE; |
| |
| pass_character = 0; |
| nesting_level = 1; |
| slen = strlen (string + *sindex) + *sindex; |
| |
| /* The handling of dolbrace_state needs to agree with the code in parse.y: |
| parse_matched_pair(). The different initial value is to handle the |
| case where this function is called to parse the word in |
| ${param op word} (SX_WORD). */ |
| dolbrace_state = (flags & SX_WORD) ? DOLBRACE_WORD : DOLBRACE_PARAM; |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && (flags & SX_POSIXEXP)) |
| dolbrace_state = DOLBRACE_QUOTE; |
| |
| i = *sindex; |
| while (c = string[i]) |
| { |
| if (pass_character) |
| { |
| pass_character = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| |
| /* CTLESCs and backslashes quote the next character. */ |
| if (c == CTLESC || c == '\\') |
| { |
| pass_character++; |
| i++; |
| continue; |
| } |
| |
| if (string[i] == '$' && string[i+1] == LBRACE) |
| { |
| nesting_level++; |
| i += 2; |
| continue; |
| } |
| |
| if (c == RBRACE) |
| { |
| nesting_level--; |
| if (nesting_level == 0) |
| break; |
| i++; |
| continue; |
| } |
| |
| /* Pass the contents of old-style command substitutions through |
| verbatim. */ |
| if (c == '`') |
| { |
| si = i + 1; |
| t = string_extract (string, &si, "`", flags|SX_NOALLOC); |
| |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| |
| i = si + 1; |
| continue; |
| } |
| |
| /* Pass the contents of new-style command substitutions and |
| arithmetic substitutions through verbatim. */ |
| if (string[i] == '$' && string[i+1] == LPAREN) |
| { |
| si = i + 2; |
| t = extract_command_subst (string, &si, flags|SX_NOALLOC); |
| |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| |
| i = si + 1; |
| continue; |
| } |
| |
| #if defined (PROCESS_SUBSTITUTION) |
| /* Technically this should only work at the start of a word */ |
| if ((string[i] == '<' || string[i] == '>') && string[i+1] == LPAREN) |
| { |
| si = i + 2; |
| t = extract_process_subst (string, (string[i] == '<' ? "<(" : ">)"), &si, flags|SX_NOALLOC); |
| |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| |
| i = si + 1; |
| continue; |
| } |
| #endif |
| |
| /* Pass the contents of double-quoted strings through verbatim. */ |
| if (c == '"') |
| { |
| si = i + 1; |
| i = skip_double_quoted (string, slen, si, 0); |
| /* skip_XXX_quoted leaves index one past close quote */ |
| continue; |
| } |
| |
| if (c == '\'') |
| { |
| /*itrace("extract_dollar_brace_string: c == single quote flags = %d quoted = %d dolbrace_state = %d", flags, quoted, dolbrace_state);*/ |
| if (posixly_correct && shell_compatibility_level > 42 && dolbrace_state != DOLBRACE_QUOTE && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ADVANCE_CHAR (string, slen, i); |
| else |
| { |
| si = i + 1; |
| i = skip_single_quoted (string, slen, si, 0); |
| } |
| |
| continue; |
| } |
| |
| #if defined (ARRAY_VARS) |
| if (c == LBRACK && dolbrace_state == DOLBRACE_PARAM) |
| { |
| si = skipsubscript (string, i, 0); |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| if (string[si] == RBRACK) |
| c = string[i = si]; |
| } |
| #endif |
| |
| /* move past this character, which was not special. */ |
| ADVANCE_CHAR (string, slen, i); |
| |
| /* This logic must agree with parse.y:parse_matched_pair, since they |
| share the same defines. */ |
| if (dolbrace_state == DOLBRACE_PARAM && c == '%' && (i - *sindex) > 1) |
| dolbrace_state = DOLBRACE_QUOTE; |
| else if (dolbrace_state == DOLBRACE_PARAM && c == '#' && (i - *sindex) > 1) |
| dolbrace_state = DOLBRACE_QUOTE; |
| else if (dolbrace_state == DOLBRACE_PARAM && c == '/' && (i - *sindex) > 1) |
| dolbrace_state = DOLBRACE_QUOTE2; /* XXX */ |
| else if (dolbrace_state == DOLBRACE_PARAM && c == '^' && (i - *sindex) > 1) |
| dolbrace_state = DOLBRACE_QUOTE; |
| else if (dolbrace_state == DOLBRACE_PARAM && c == ',' && (i - *sindex) > 1) |
| dolbrace_state = DOLBRACE_QUOTE; |
| /* This is intended to handle all of the [:]op expansions and the substring/ |
| length/pattern removal/pattern substitution expansions. */ |
| else if (dolbrace_state == DOLBRACE_PARAM && strchr ("#%^,~:-=?+/", c) != 0) |
| dolbrace_state = DOLBRACE_OP; |
| else if (dolbrace_state == DOLBRACE_OP && strchr ("#%^,~:-=?+/", c) == 0) |
| dolbrace_state = DOLBRACE_WORD; |
| } |
| |
| if (c == 0 && nesting_level) |
| { |
| if (no_longjmp_on_fatal_error == 0) |
| { /* { */ |
| last_command_exit_value = EXECUTION_FAILURE; |
| report_error (_("bad substitution: no closing `%s' in %s"), "}", string); |
| exp_jump_to_top_level (DISCARD); |
| } |
| else |
| { |
| *sindex = i; |
| return ((char *)NULL); |
| } |
| } |
| |
| result = (flags & SX_NOALLOC) ? (char *)NULL : substring (string, *sindex, i); |
| *sindex = i; |
| |
| return (result); |
| } |
| |
| /* Remove backslashes which are quoting backquotes from STRING. Modifies |
| STRING, and returns a pointer to it. */ |
| char * |
| de_backslash (string) |
| char *string; |
| { |
| register size_t slen; |
| register int i, j, prev_i; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| i = j = 0; |
| |
| /* Loop copying string[i] to string[j], i >= j. */ |
| while (i < slen) |
| { |
| if (string[i] == '\\' && (string[i + 1] == '`' || string[i + 1] == '\\' || |
| string[i + 1] == '$')) |
| i++; |
| prev_i = i; |
| ADVANCE_CHAR (string, slen, i); |
| if (j < prev_i) |
| do string[j++] = string[prev_i++]; while (prev_i < i); |
| else |
| j = i; |
| } |
| string[j] = '\0'; |
| |
| return (string); |
| } |
| |
| #if 0 |
| /*UNUSED*/ |
| /* Replace instances of \! in a string with !. */ |
| void |
| unquote_bang (string) |
| char *string; |
| { |
| register int i, j; |
| register char *temp; |
| |
| temp = (char *)xmalloc (1 + strlen (string)); |
| |
| for (i = 0, j = 0; (temp[j] = string[i]); i++, j++) |
| { |
| if (string[i] == '\\' && string[i + 1] == '!') |
| { |
| temp[j] = '!'; |
| i++; |
| } |
| } |
| strcpy (string, temp); |
| free (temp); |
| } |
| #endif |
| |
| #define CQ_RETURN(x) do { no_longjmp_on_fatal_error = oldjmp; return (x); } while (0) |
| |
| /* This function assumes s[i] == open; returns with s[ret] == close; used to |
| parse array subscripts. FLAGS & 1 means to not attempt to skip over |
| matched pairs of quotes or backquotes, or skip word expansions; it is |
| intended to be used after expansion has been performed and during final |
| assignment parsing (see arrayfunc.c:assign_compound_array_list()) or |
| during execution by a builtin which has already undergone word expansion. */ |
| static int |
| skip_matched_pair (string, start, open, close, flags) |
| const char *string; |
| int start, open, close, flags; |
| { |
| int i, pass_next, backq, si, c, count, oldjmp; |
| size_t slen; |
| char *temp, *ss; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string + start) + start; |
| oldjmp = no_longjmp_on_fatal_error; |
| no_longjmp_on_fatal_error = 1; |
| |
| i = start + 1; /* skip over leading bracket */ |
| count = 1; |
| pass_next = backq = 0; |
| ss = (char *)string; |
| while (c = string[i]) |
| { |
| if (pass_next) |
| { |
| pass_next = 0; |
| if (c == 0) |
| CQ_RETURN(i); |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if ((flags & 1) == 0 && c == '\\') |
| { |
| pass_next = 1; |
| i++; |
| continue; |
| } |
| else if (backq) |
| { |
| if (c == '`') |
| backq = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if ((flags & 1) == 0 && c == '`') |
| { |
| backq = 1; |
| i++; |
| continue; |
| } |
| else if ((flags & 1) == 0 && c == open) |
| { |
| count++; |
| i++; |
| continue; |
| } |
| else if (c == close) |
| { |
| count--; |
| if (count == 0) |
| break; |
| i++; |
| continue; |
| } |
| else if ((flags & 1) == 0 && (c == '\'' || c == '"')) |
| { |
| i = (c == '\'') ? skip_single_quoted (ss, slen, ++i, 0) |
| : skip_double_quoted (ss, slen, ++i, 0); |
| /* no increment, the skip functions increment past the closing quote. */ |
| } |
| else if ((flags&1) == 0 && c == '$' && (string[i+1] == LPAREN || string[i+1] == LBRACE)) |
| { |
| si = i + 2; |
| if (string[si] == '\0') |
| CQ_RETURN(si); |
| |
| /* XXX - extract_command_subst here? */ |
| if (string[i+1] == LPAREN) |
| temp = extract_delimited_string (ss, &si, "$(", "(", ")", SX_NOALLOC|SX_COMMAND); /* ) */ |
| else |
| temp = extract_dollar_brace_string (ss, &si, 0, SX_NOALLOC); |
| |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| |
| i = si; |
| if (string[i] == '\0') /* don't increment i past EOS in loop */ |
| break; |
| i++; |
| continue; |
| } |
| else |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| CQ_RETURN(i); |
| } |
| |
| #if defined (ARRAY_VARS) |
| /* Flags has 1 as a reserved value, since skip_matched_pair uses it for |
| skipping over quoted strings and taking the first instance of the |
| closing character. */ |
| int |
| skipsubscript (string, start, flags) |
| const char *string; |
| int start, flags; |
| { |
| return (skip_matched_pair (string, start, '[', ']', flags)); |
| } |
| #endif |
| |
| /* Skip characters in STRING until we find a character in DELIMS, and return |
| the index of that character. START is the index into string at which we |
| begin. This is similar in spirit to strpbrk, but it returns an index into |
| STRING and takes a starting index. This little piece of code knows quite |
| a lot of shell syntax. It's very similar to skip_double_quoted and other |
| functions of that ilk. */ |
| int |
| skip_to_delim (string, start, delims, flags) |
| char *string; |
| int start; |
| char *delims; |
| int flags; |
| { |
| int i, pass_next, backq, dquote, si, c, oldjmp; |
| int invert, skipquote, skipcmd, noprocsub, completeflag; |
| int arithexp, skipcol; |
| size_t slen; |
| char *temp, open[3]; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string + start) + start; |
| oldjmp = no_longjmp_on_fatal_error; |
| if (flags & SD_NOJMP) |
| no_longjmp_on_fatal_error = 1; |
| invert = (flags & SD_INVERT); |
| skipcmd = (flags & SD_NOSKIPCMD) == 0; |
| noprocsub = (flags & SD_NOPROCSUB); |
| completeflag = (flags & SD_COMPLETE) ? SX_COMPLETE : 0; |
| |
| arithexp = (flags & SD_ARITHEXP); |
| skipcol = 0; |
| |
| i = start; |
| pass_next = backq = dquote = 0; |
| while (c = string[i]) |
| { |
| /* If this is non-zero, we should not let quote characters be delimiters |
| and the current character is a single or double quote. We should not |
| test whether or not it's a delimiter until after we skip single- or |
| double-quoted strings. */ |
| skipquote = ((flags & SD_NOQUOTEDELIM) && (c == '\'' || c =='"')); |
| if (pass_next) |
| { |
| pass_next = 0; |
| if (c == 0) |
| CQ_RETURN(i); |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (c == '\\') |
| { |
| pass_next = 1; |
| i++; |
| continue; |
| } |
| else if (backq) |
| { |
| if (c == '`') |
| backq = 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (c == '`') |
| { |
| backq = 1; |
| i++; |
| continue; |
| } |
| else if (arithexp && skipcol && c == ':') |
| { |
| skipcol--; |
| i++; |
| continue; |
| } |
| else if (arithexp && c == '?') |
| { |
| skipcol++; |
| i++; |
| continue; |
| } |
| else if (skipquote == 0 && invert == 0 && member (c, delims)) |
| break; |
| /* the usual case is to use skip_xxx_quoted, but we don't skip over double |
| quoted strings when looking for the history expansion character as a |
| delimiter. */ |
| /* special case for programmable completion which takes place before |
| parser converts backslash-escaped single quotes between $'...' to |
| `regular' single-quoted strings. */ |
| else if (completeflag && i > 0 && string[i-1] == '$' && c == '\'') |
| i = skip_single_quoted (string, slen, ++i, SX_COMPLETE); |
| else if (c == '\'') |
| i = skip_single_quoted (string, slen, ++i, 0); |
| else if (c == '"') |
| i = skip_double_quoted (string, slen, ++i, completeflag); |
| else if (c == LPAREN && arithexp) |
| { |
| si = i + 1; |
| if (string[si] == '\0') |
| CQ_RETURN(si); |
| |
| temp = extract_delimited_string (string, &si, "(", "(", ")", SX_NOALLOC); /* ) */ |
| i = si; |
| if (string[i] == '\0') /* don't increment i past EOS in loop */ |
| break; |
| i++; |
| continue; |
| } |
| else if (c == '$' && ((skipcmd && string[i+1] == LPAREN) || string[i+1] == LBRACE)) |
| { |
| si = i + 2; |
| if (string[si] == '\0') |
| CQ_RETURN(si); |
| |
| if (string[i+1] == LPAREN) |
| temp = extract_delimited_string (string, &si, "$(", "(", ")", SX_NOALLOC|SX_COMMAND); /* ) */ |
| else |
| temp = extract_dollar_brace_string (string, &si, 0, SX_NOALLOC); |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si; |
| if (string[i] == '\0') /* don't increment i past EOS in loop */ |
| break; |
| i++; |
| continue; |
| } |
| #if defined (PROCESS_SUBSTITUTION) |
| else if (skipcmd && noprocsub == 0 && (c == '<' || c == '>') && string[i+1] == LPAREN) |
| { |
| si = i + 2; |
| if (string[si] == '\0') |
| CQ_RETURN(si); |
| |
| temp = extract_delimited_string (string, &si, (c == '<') ? "<(" : ">(", "(", ")", SX_COMMAND|SX_NOALLOC); /* )) */ |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si; |
| if (string[i] == '\0') |
| break; |
| i++; |
| continue; |
| } |
| #endif /* PROCESS_SUBSTITUTION */ |
| #if defined (EXTENDED_GLOB) |
| else if ((flags & SD_EXTGLOB) && extended_glob && string[i+1] == LPAREN && member (c, "?*+!@")) |
| { |
| si = i + 2; |
| if (string[si] == '\0') |
| CQ_RETURN(si); |
| |
| open[0] = c; |
| open[1] = LPAREN; |
| open[2] = '\0'; |
| temp = extract_delimited_string (string, &si, open, "(", ")", SX_NOALLOC); /* ) */ |
| |
| CHECK_STRING_OVERRUN (i, si, slen, c); |
| i = si; |
| if (string[i] == '\0') /* don't increment i past EOS in loop */ |
| break; |
| i++; |
| continue; |
| } |
| #endif |
| else if ((flags & SD_GLOB) && c == LBRACK) |
| { |
| si = i + 1; |
| if (string[si] == '\0') |
| CQ_RETURN(si); |
| |
| temp = extract_delimited_string (string, &si, "[", "[", "]", SX_NOALLOC); /* ] */ |
| |
| i = si; |
| if (string[i] == '\0') /* don't increment i past EOS in loop */ |
| break; |
| i++; |
| continue; |
| } |
| else if ((skipquote || invert) && (member (c, delims) == 0)) |
| break; |
| else |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| CQ_RETURN(i); |
| } |
| |
| #if defined (BANG_HISTORY) |
| /* Skip to the history expansion character (delims[0]), paying attention to |
| quoted strings and command and process substitution. This is a stripped- |
| down version of skip_to_delims. The essential difference is that this |
| resets the quoting state when starting a command substitution */ |
| int |
| skip_to_histexp (string, start, delims, flags) |
| char *string; |
| int start; |
| char *delims; |
| int flags; |
| { |
| int i, pass_next, backq, dquote, c, oldjmp; |
| int histexp_comsub, histexp_backq, old_dquote; |
| size_t slen; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string + start) + start; |
| oldjmp = no_longjmp_on_fatal_error; |
| if (flags & SD_NOJMP) |
| no_longjmp_on_fatal_error = 1; |
| |
| histexp_comsub = histexp_backq = old_dquote = 0; |
| |
| i = start; |
| pass_next = backq = dquote = 0; |
| while (c = string[i]) |
| { |
| if (pass_next) |
| { |
| pass_next = 0; |
| if (c == 0) |
| CQ_RETURN(i); |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (c == '\\') |
| { |
| pass_next = 1; |
| i++; |
| continue; |
| } |
| else if (backq && c == '`') |
| { |
| backq = 0; |
| histexp_backq--; |
| dquote = old_dquote; |
| i++; |
| continue; |
| } |
| else if (c == '`') |
| { |
| backq = 1; |
| histexp_backq++; |
| old_dquote = dquote; /* simple - one level for now */ |
| dquote = 0; |
| i++; |
| continue; |
| } |
| /* When in double quotes, act as if the double quote is a member of |
| history_no_expand_chars, like the history library does */ |
| else if (dquote && c == delims[0] && string[i+1] == '"') |
| { |
| i++; |
| continue; |
| } |
| else if (c == delims[0]) |
| break; |
| /* the usual case is to use skip_xxx_quoted, but we don't skip over double |
| quoted strings when looking for the history expansion character as a |
| delimiter. */ |
| else if (dquote && c == '\'') |
| { |
| i++; |
| continue; |
| } |
| else if (c == '\'') |
| i = skip_single_quoted (string, slen, ++i, 0); |
| /* The posixly_correct test makes posix-mode shells allow double quotes |
| to quote the history expansion character */ |
| else if (posixly_correct == 0 && c == '"') |
| { |
| dquote = 1 - dquote; |
| i++; |
| continue; |
| } |
| else if (c == '"') |
| i = skip_double_quoted (string, slen, ++i, 0); |
| #if defined (PROCESS_SUBSTITUTION) |
| else if ((c == '$' || c == '<' || c == '>') && string[i+1] == LPAREN && string[i+2] != LPAREN) |
| #else |
| else if (c == '$' && string[i+1] == LPAREN && string[i+2] != LPAREN) |
| #endif |
| { |
| if (string[i+2] == '\0') |
| CQ_RETURN(i+2); |
| i += 2; |
| histexp_comsub++; |
| old_dquote = dquote; |
| dquote = 0; |
| } |
| else if (histexp_comsub && c == RPAREN) |
| { |
| histexp_comsub--; |
| dquote = old_dquote; |
| i++; |
| continue; |
| } |
| else if (backq) /* placeholder */ |
| { |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| CQ_RETURN(i); |
| } |
| #endif /* BANG_HISTORY */ |
| |
| #if defined (READLINE) |
| /* Return 1 if the portion of STRING ending at EINDEX is quoted (there is |
| an unclosed quoted string), or if the character at EINDEX is quoted |
| by a backslash. NO_LONGJMP_ON_FATAL_ERROR is used to flag that the various |
| single and double-quoted string parsing functions should not return an |
| error if there are unclosed quotes or braces. The characters that this |
| recognizes need to be the same as the contents of |
| rl_completer_quote_characters. */ |
| |
| int |
| char_is_quoted (string, eindex) |
| char *string; |
| int eindex; |
| { |
| int i, pass_next, c, oldjmp; |
| size_t slen; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| oldjmp = no_longjmp_on_fatal_error; |
| no_longjmp_on_fatal_error = 1; |
| i = pass_next = 0; |
| while (i <= eindex) |
| { |
| c = string[i]; |
| |
| if (pass_next) |
| { |
| pass_next = 0; |
| if (i >= eindex) /* XXX was if (i >= eindex - 1) */ |
| CQ_RETURN(1); |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (c == '\\') |
| { |
| pass_next = 1; |
| i++; |
| continue; |
| } |
| else if (c == '$' && string[i+1] == '\'' && string[i+2]) |
| { |
| i += 2; |
| i = skip_single_quoted (string, slen, i, SX_COMPLETE); |
| if (i > eindex) |
| CQ_RETURN (i); |
| } |
| else if (c == '\'' || c == '"') |
| { |
| i = (c == '\'') ? skip_single_quoted (string, slen, ++i, 0) |
| : skip_double_quoted (string, slen, ++i, SX_COMPLETE); |
| if (i > eindex) |
| CQ_RETURN(1); |
| /* no increment, the skip_xxx functions go one past end */ |
| } |
| else |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| CQ_RETURN(0); |
| } |
| |
| int |
| unclosed_pair (string, eindex, openstr) |
| char *string; |
| int eindex; |
| char *openstr; |
| { |
| int i, pass_next, openc, olen; |
| size_t slen; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| olen = strlen (openstr); |
| i = pass_next = openc = 0; |
| while (i <= eindex) |
| { |
| if (pass_next) |
| { |
| pass_next = 0; |
| if (i >= eindex) /* XXX was if (i >= eindex - 1) */ |
| return 0; |
| ADVANCE_CHAR (string, slen, i); |
| continue; |
| } |
| else if (string[i] == '\\') |
| { |
| pass_next = 1; |
| i++; |
| continue; |
| } |
| else if (STREQN (string + i, openstr, olen)) |
| { |
| openc = 1 - openc; |
| i += olen; |
| } |
| /* XXX - may want to handle $'...' specially here */ |
| else if (string[i] == '\'' || string[i] == '"') |
| { |
| i = (string[i] == '\'') ? skip_single_quoted (string, slen, i, 0) |
| : skip_double_quoted (string, slen, i, SX_COMPLETE); |
| if (i > eindex) |
| return 0; |
| } |
| else |
| ADVANCE_CHAR (string, slen, i); |
| } |
| return (openc); |
| } |
| |
| /* Split STRING (length SLEN) at DELIMS, and return a WORD_LIST with the |
| individual words. If DELIMS is NULL, the current value of $IFS is used |
| to split the string, and the function follows the shell field splitting |
| rules. SENTINEL is an index to look for. NWP, if non-NULL, |
| gets the number of words in the returned list. CWP, if non-NULL, gets |
| the index of the word containing SENTINEL. Non-whitespace chars in |
| DELIMS delimit separate fields. This is used by programmable completion. */ |
| WORD_LIST * |
| split_at_delims (string, slen, delims, sentinel, flags, nwp, cwp) |
| char *string; |
| int slen; |
| char *delims; |
| int sentinel, flags; |
| int *nwp, *cwp; |
| { |
| int ts, te, i, nw, cw, ifs_split, dflags; |
| char *token, *d, *d2; |
| WORD_LIST *ret, *tl; |
| |
| if (string == 0 || *string == '\0') |
| { |
| if (nwp) |
| *nwp = 0; |
| if (cwp) |
| *cwp = 0; |
| return ((WORD_LIST *)NULL); |
| } |
| |
| d = (delims == 0) ? ifs_value : delims; |
| ifs_split = delims == 0; |
| |
| /* Make d2 the non-whitespace characters in delims */ |
| d2 = 0; |
| if (delims) |
| { |
| size_t slength; |
| #if defined (HANDLE_MULTIBYTE) |
| size_t mblength = 1; |
| #endif |
| DECLARE_MBSTATE; |
| |
| slength = strlen (delims); |
| d2 = (char *)xmalloc (slength + 1); |
| i = ts = 0; |
| while (delims[i]) |
| { |
| #if defined (HANDLE_MULTIBYTE) |
| mbstate_t state_bak; |
| state_bak = state; |
| mblength = MBRLEN (delims + i, slength, &state); |
| if (MB_INVALIDCH (mblength)) |
| state = state_bak; |
| else if (mblength > 1) |
| { |
| memcpy (d2 + ts, delims + i, mblength); |
| ts += mblength; |
| i += mblength; |
| slength -= mblength; |
| continue; |
| } |
| #endif |
| if (whitespace (delims[i]) == 0) |
| d2[ts++] = delims[i]; |
| |
| i++; |
| slength--; |
| } |
| d2[ts] = '\0'; |
| } |
| |
| ret = (WORD_LIST *)NULL; |
| |
| /* Remove sequences of whitespace characters at the start of the string, as |
| long as those characters are delimiters. */ |
| for (i = 0; member (string[i], d) && spctabnl (string[i]); i++) |
| ; |
| if (string[i] == '\0') |
| { |
| FREE (d2); |
| return (ret); |
| } |
| |
| ts = i; |
| nw = 0; |
| cw = -1; |
| dflags = flags|SD_NOJMP; |
| while (1) |
| { |
| te = skip_to_delim (string, ts, d, dflags); |
| |
| /* If we have a non-whitespace delimiter character, use it to make a |
| separate field. This is just about what $IFS splitting does and |
| is closer to the behavior of the shell parser. */ |
| if (ts == te && d2 && member (string[ts], d2)) |
| { |
| te = ts + 1; |
| /* If we're using IFS splitting, the non-whitespace delimiter char |
| and any additional IFS whitespace delimits a field. */ |
| if (ifs_split) |
| while (member (string[te], d) && spctabnl (string[te]) && ((flags&SD_NOQUOTEDELIM) == 0 || (string[te] != '\'' && string[te] != '"'))) |
| te++; |
| else |
| while (member (string[te], d2) && ((flags&SD_NOQUOTEDELIM) == 0 || (string[te] != '\'' && string[te] != '"'))) |
| te++; |
| } |
| |
| token = substring (string, ts, te); |
| |
| ret = add_string_to_list (token, ret); /* XXX */ |
| free (token); |
| nw++; |
| |
| if (sentinel >= ts && sentinel <= te) |
| cw = nw; |
| |
| /* If the cursor is at whitespace just before word start, set the |
| sentinel word to the current word. */ |
| if (cwp && cw == -1 && sentinel == ts-1) |
| cw = nw; |
| |
| /* If the cursor is at whitespace between two words, make a new, empty |
| word, add it before (well, after, since the list is in reverse order) |
| the word we just added, and set the current word to that one. */ |
| if (cwp && cw == -1 && sentinel < ts) |
| { |
| tl = make_word_list (make_word (""), ret->next); |
| ret->next = tl; |
| cw = nw; |
| nw++; |
| } |
| |
| if (string[te] == 0) |
| break; |
| |
| i = te; |
| /* XXX - honor SD_NOQUOTEDELIM here */ |
| while (member (string[i], d) && (ifs_split || spctabnl(string[i])) && ((flags&SD_NOQUOTEDELIM) == 0 || (string[te] != '\'' && string[te] != '"'))) |
| i++; |
| |
| if (string[i]) |
| ts = i; |
| else |
| break; |
| } |
| |
| /* Special case for SENTINEL at the end of STRING. If we haven't found |
| the word containing SENTINEL yet, and the index we're looking for is at |
| the end of STRING (or past the end of the previously-found token, |
| possible if the end of the line is composed solely of IFS whitespace) |
| add an additional null argument and set the current word pointer to that. */ |
| if (cwp && cw == -1 && (sentinel >= slen || sentinel >= te)) |
| { |
| if (whitespace (string[sentinel - 1])) |
| { |
| token = ""; |
| ret = add_string_to_list (token, ret); |
| nw++; |
| } |
| cw = nw; |
| } |
| |
| if (nwp) |
| *nwp = nw; |
| if (cwp) |
| *cwp = cw; |
| |
| FREE (d2); |
| |
| return (REVERSE_LIST (ret, WORD_LIST *)); |
| } |
| #endif /* READLINE */ |
| |
| #if 0 |
| /* UNUSED */ |
| /* Extract the name of the variable to bind to from the assignment string. */ |
| char * |
| assignment_name (string) |
| char *string; |
| { |
| int offset; |
| char *temp; |
| |
| offset = assignment (string, 0); |
| if (offset == 0) |
| return (char *)NULL; |
| temp = substring (string, 0, offset); |
| return (temp); |
| } |
| #endif |
| |
| /* **************************************************************** */ |
| /* */ |
| /* Functions to convert strings to WORD_LISTs and vice versa */ |
| /* */ |
| /* **************************************************************** */ |
| |
| /* Return a single string of all the words in LIST. SEP is the separator |
| to put between individual elements of LIST in the output string. */ |
| char * |
| string_list_internal (list, sep) |
| WORD_LIST *list; |
| char *sep; |
| { |
| register WORD_LIST *t; |
| char *result, *r; |
| size_t word_len, sep_len, result_size; |
| |
| if (list == 0) |
| return ((char *)NULL); |
| |
| /* Short-circuit quickly if we don't need to separate anything. */ |
| if (list->next == 0) |
| return (savestring (list->word->word)); |
| |
| /* This is nearly always called with either sep[0] == 0 or sep[1] == 0. */ |
| sep_len = STRLEN (sep); |
| result_size = 0; |
| |
| for (t = list; t; t = t->next) |
| { |
| if (t != list) |
| result_size += sep_len; |
| result_size += strlen (t->word->word); |
| } |
| |
| r = result = (char *)xmalloc (result_size + 1); |
| |
| for (t = list; t; t = t->next) |
| { |
| if (t != list && sep_len) |
| { |
| if (sep_len > 1) |
| { |
| FASTCOPY (sep, r, sep_len); |
| r += sep_len; |
| } |
| else |
| *r++ = sep[0]; |
| } |
| |
| word_len = strlen (t->word->word); |
| FASTCOPY (t->word->word, r, word_len); |
| r += word_len; |
| } |
| |
| *r = '\0'; |
| return (result); |
| } |
| |
| /* Return a single string of all the words present in LIST, separating |
| each word with a space. */ |
| char * |
| string_list (list) |
| WORD_LIST *list; |
| { |
| return (string_list_internal (list, " ")); |
| } |
| |
| /* An external interface that can be used by the rest of the shell to |
| obtain a string containing the first character in $IFS. Handles all |
| the multibyte complications. If LENP is non-null, it is set to the |
| length of the returned string. */ |
| char * |
| ifs_firstchar (lenp) |
| int *lenp; |
| { |
| char *ret; |
| int len; |
| |
| ret = xmalloc (MB_LEN_MAX + 1); |
| #if defined (HANDLE_MULTIBYTE) |
| if (ifs_firstc_len == 1) |
| { |
| ret[0] = ifs_firstc[0]; |
| ret[1] = '\0'; |
| len = ret[0] ? 1 : 0; |
| } |
| else |
| { |
| memcpy (ret, ifs_firstc, ifs_firstc_len); |
| ret[len = ifs_firstc_len] = '\0'; |
| } |
| #else |
| ret[0] = ifs_firstc; |
| ret[1] = '\0'; |
| len = ret[0] ? 0 : 1; |
| #endif |
| |
| if (lenp) |
| *lenp = len; |
| |
| return ret; |
| } |
| |
| /* Return a single string of all the words present in LIST, obeying the |
| quoting rules for "$*", to wit: (P1003.2, draft 11, 3.5.2) "If the |
| expansion [of $*] appears within a double quoted string, it expands |
| to a single field with the value of each parameter separated by the |
| first character of the IFS variable, or by a <space> if IFS is unset." */ |
| /* Posix interpretation 888 changes this when IFS is null by specifying |
| that when unquoted, this expands to separate arguments */ |
| char * |
| string_list_dollar_star (list, quoted, flags) |
| WORD_LIST *list; |
| int quoted, flags; |
| { |
| char *ret; |
| #if defined (HANDLE_MULTIBYTE) |
| # if defined (__GNUC__) |
| char sep[MB_CUR_MAX + 1]; |
| # else |
| char *sep = 0; |
| # endif |
| #else |
| char sep[2]; |
| #endif |
| |
| #if defined (HANDLE_MULTIBYTE) |
| # if !defined (__GNUC__) |
| sep = (char *)xmalloc (MB_CUR_MAX + 1); |
| # endif /* !__GNUC__ */ |
| if (ifs_firstc_len == 1) |
| { |
| sep[0] = ifs_firstc[0]; |
| sep[1] = '\0'; |
| } |
| else |
| { |
| memcpy (sep, ifs_firstc, ifs_firstc_len); |
| sep[ifs_firstc_len] = '\0'; |
| } |
| #else |
| sep[0] = ifs_firstc; |
| sep[1] = '\0'; |
| #endif |
| |
| ret = string_list_internal (list, sep); |
| #if defined (HANDLE_MULTIBYTE) && !defined (__GNUC__) |
| free (sep); |
| #endif |
| return ret; |
| } |
| |
| /* Turn $@ into a string. If (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| is non-zero, the $@ appears within double quotes, and we should quote |
| the list before converting it into a string. If IFS is unset, and the |
| word is not quoted, we just need to quote CTLESC and CTLNUL characters |
| in the words in the list, because the default value of $IFS is |
| <space><tab><newline>, IFS characters in the words in the list should |
| also be split. If IFS is null, and the word is not quoted, we need |
| to quote the words in the list to preserve the positional parameters |
| exactly. |
| Valid values for the FLAGS argument are the PF_ flags in command.h, |
| the only one we care about is PF_ASSIGNRHS. $@ is supposed to expand |
| to the positional parameters separated by spaces no matter what IFS is |
| set to if in a context where word splitting is not performed. The only |
| one that we didn't handle before is assignment statement arguments to |
| declaration builtins like `declare'. */ |
| char * |
| string_list_dollar_at (list, quoted, flags) |
| WORD_LIST *list; |
| int quoted; |
| int flags; |
| { |
| char *ifs, *ret; |
| #if defined (HANDLE_MULTIBYTE) |
| # if defined (__GNUC__) |
| char sep[MB_CUR_MAX + 1]; |
| # else |
| char *sep = 0; |
| # endif /* !__GNUC__ */ |
| #else |
| char sep[2]; |
| #endif |
| WORD_LIST *tlist; |
| |
| /* XXX this could just be ifs = ifs_value; */ |
| ifs = ifs_var ? value_cell (ifs_var) : (char *)0; |
| |
| #if defined (HANDLE_MULTIBYTE) |
| # if !defined (__GNUC__) |
| sep = (char *)xmalloc (MB_CUR_MAX + 1); |
| # endif /* !__GNUC__ */ |
| /* XXX - testing PF_ASSIGNRHS to make sure positional parameters are |
| separated with a space even when word splitting will not occur. */ |
| if (flags & PF_ASSIGNRHS) |
| { |
| sep[0] = ' '; |
| sep[1] = '\0'; |
| } |
| else if (ifs && *ifs) |
| { |
| if (ifs_firstc_len == 1) |
| { |
| sep[0] = ifs_firstc[0]; |
| sep[1] = '\0'; |
| } |
| else |
| { |
| memcpy (sep, ifs_firstc, ifs_firstc_len); |
| sep[ifs_firstc_len] = '\0'; |
| } |
| } |
| else |
| { |
| sep[0] = ' '; |
| sep[1] = '\0'; |
| } |
| #else /* !HANDLE_MULTIBYTE */ |
| /* XXX - PF_ASSIGNRHS means no word splitting, so we want positional |
| parameters separated by a space. */ |
| sep[0] = ((flags & PF_ASSIGNRHS) || ifs == 0 || *ifs == 0) ? ' ' : *ifs; |
| sep[1] = '\0'; |
| #endif /* !HANDLE_MULTIBYTE */ |
| |
| /* XXX -- why call quote_list if ifs == 0? we can get away without doing |
| it now that quote_escapes quotes spaces */ |
| tlist = (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES|Q_PATQUOTE)) |
| ? quote_list (list) |
| : list_quote_escapes (list); |
| |
| ret = string_list_internal (tlist, sep); |
| #if defined (HANDLE_MULTIBYTE) && !defined (__GNUC__) |
| free (sep); |
| #endif |
| return ret; |
| } |
| |
| /* Turn the positional parameters into a string, understanding quoting and |
| the various subtleties of using the first character of $IFS as the |
| separator. Calls string_list_dollar_at, string_list_dollar_star, and |
| string_list as appropriate. */ |
| /* This needs to fully understand the additional contexts where word |
| splitting does not occur (W_ASSIGNRHS, etc.) */ |
| char * |
| string_list_pos_params (pchar, list, quoted, pflags) |
| int pchar; |
| WORD_LIST *list; |
| int quoted, pflags; |
| { |
| char *ret; |
| WORD_LIST *tlist; |
| |
| if (pchar == '*' && (quoted & Q_DOUBLE_QUOTES)) |
| { |
| tlist = quote_list (list); |
| word_list_remove_quoted_nulls (tlist); |
| ret = string_list_dollar_star (tlist, 0, 0); |
| } |
| else if (pchar == '*' && (quoted & Q_HERE_DOCUMENT)) |
| { |
| tlist = quote_list (list); |
| word_list_remove_quoted_nulls (tlist); |
| ret = string_list (tlist); |
| } |
| else if (pchar == '*' && quoted == 0 && ifs_is_null) /* XXX */ |
| ret = expand_no_split_dollar_star ? string_list_dollar_star (list, quoted, 0) : string_list_dollar_at (list, quoted, 0); /* Posix interp 888 */ |
| else if (pchar == '*' && quoted == 0 && (pflags & PF_ASSIGNRHS)) /* XXX */ |
| ret = expand_no_split_dollar_star ? string_list_dollar_star (list, quoted, 0) : string_list_dollar_at (list, quoted, 0); /* Posix interp 888 */ |
| else if (pchar == '*') |
| { |
| /* Even when unquoted, string_list_dollar_star does the right thing |
| making sure that the first character of $IFS is used as the |
| separator. */ |
| ret = string_list_dollar_star (list, quoted, 0); |
| } |
| else if (pchar == '@' && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| /* We use string_list_dollar_at, but only if the string is quoted, since |
| that quotes the escapes if it's not, which we don't want. We could |
| use string_list (the old code did), but that doesn't do the right |
| thing if the first character of $IFS is not a space. We use |
| string_list_dollar_star if the string is unquoted so we make sure that |
| the elements of $@ are separated by the first character of $IFS for |
| later splitting. */ |
| ret = string_list_dollar_at (list, quoted, 0); |
| else if (pchar == '@' && quoted == 0 && ifs_is_null) /* XXX */ |
| ret = string_list_dollar_at (list, quoted, 0); /* Posix interp 888 */ |
| else if (pchar == '@' && quoted == 0 && (pflags & PF_ASSIGNRHS)) |
| ret = string_list_dollar_at (list, quoted, pflags); /* Posix interp 888 */ |
| else if (pchar == '@') |
| ret = string_list_dollar_star (list, quoted, 0); |
| else |
| ret = string_list ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) ? quote_list (list) : list); |
| |
| return ret; |
| } |
| |
| /* Return the list of words present in STRING. Separate the string into |
| words at any of the characters found in SEPARATORS. If QUOTED is |
| non-zero then word in the list will have its quoted flag set, otherwise |
| the quoted flag is left as make_word () deemed fit. |
| |
| This obeys the P1003.2 word splitting semantics. If `separators' is |
| exactly <space><tab><newline>, then the splitting algorithm is that of |
| the Bourne shell, which treats any sequence of characters from `separators' |
| as a delimiter. If IFS is unset, which results in `separators' being set |
| to "", no splitting occurs. If separators has some other value, the |
| following rules are applied (`IFS white space' means zero or more |
| occurrences of <space>, <tab>, or <newline>, as long as those characters |
| are in `separators'): |
| |
| 1) IFS white space is ignored at the start and the end of the |
| string. |
| 2) Each occurrence of a character in `separators' that is not |
| IFS white space, along with any adjacent occurrences of |
| IFS white space delimits a field. |
| 3) Any nonzero-length sequence of IFS white space delimits a field. |
| */ |
| |
| /* BEWARE! list_string strips null arguments. Don't call it twice and |
| expect to have "" preserved! */ |
| |
| /* This performs word splitting and quoted null character removal on |
| STRING. */ |
| #define issep(c) \ |
| (((separators)[0]) ? ((separators)[1] ? isifs(c) \ |
| : (c) == (separators)[0]) \ |
| : 0) |
| |
| /* member of the space character class in the current locale */ |
| #define ifs_whitespace(c) ISSPACE(c) |
| |
| /* "adjacent IFS white space" */ |
| #define ifs_whitesep(c) ((sh_style_split || separators == 0) ? spctabnl (c) \ |
| : ifs_whitespace (c)) |
| |
| WORD_LIST * |
| list_string (string, separators, quoted) |
| register char *string, *separators; |
| int quoted; |
| { |
| WORD_LIST *result; |
| WORD_DESC *t; |
| char *current_word, *s; |
| int sindex, sh_style_split, whitesep, xflags, free_word; |
| size_t slen; |
| |
| if (!string || !*string) |
| return ((WORD_LIST *)NULL); |
| |
| sh_style_split = separators && separators[0] == ' ' && |
| separators[1] == '\t' && |
| separators[2] == '\n' && |
| separators[3] == '\0'; |
| for (xflags = 0, s = ifs_value; s && *s; s++) |
| { |
| if (*s == CTLESC) xflags |= SX_NOCTLESC; |
| else if (*s == CTLNUL) xflags |= SX_NOESCCTLNUL; |
| } |
| |
| slen = 0; |
| /* Remove sequences of whitespace at the beginning of STRING, as |
| long as those characters appear in IFS. Do not do this if |
| STRING is quoted or if there are no separator characters. We use the |
| Posix definition of whitespace as a member of the space character |
| class in the current locale. */ |
| #if 0 |
| if (!quoted || !separators || !*separators) |
| #else |
| /* issep() requires that separators be non-null, and always returns 0 if |
| separator is the empty string, so don't bother if we get an empty string |
| for separators. We already returned NULL above if STRING is empty. */ |
| if (!quoted && separators && *separators) |
| #endif |
| { |
| for (s = string; *s && issep (*s) && ifs_whitespace (*s); s++); |
| |
| if (!*s) |
| return ((WORD_LIST *)NULL); |
| |
| string = s; |
| } |
| |
| /* OK, now STRING points to a word that does not begin with white space. |
| The splitting algorithm is: |
| extract a word, stopping at a separator |
| skip sequences of whitespace characters as long as they are separators |
| This obeys the field splitting rules in Posix.2. */ |
| slen = STRLEN (string); |
| for (result = (WORD_LIST *)NULL, sindex = 0; string[sindex]; ) |
| { |
| /* Don't need string length in ADVANCE_CHAR unless multibyte chars are |
| possible, but need it in string_extract_verbatim for bounds checking */ |
| current_word = string_extract_verbatim (string, slen, &sindex, separators, xflags); |
| if (current_word == 0) |
| break; |
| |
| free_word = 1; /* If non-zero, we free current_word */ |
| |
| /* If we have a quoted empty string, add a quoted null argument. We |
| want to preserve the quoted null character iff this is a quoted |
| empty string; otherwise the quoted null characters are removed |
| below. */ |
| if (QUOTED_NULL (current_word)) |
| { |
| t = alloc_word_desc (); |
| t->word = make_quoted_char ('\0'); |
| t->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| result = make_word_list (t, result); |
| } |
| else if (current_word[0] != '\0') |
| { |
| /* If we have something, then add it regardless. However, |
| perform quoted null character removal on the current word. */ |
| remove_quoted_nulls (current_word); |
| |
| /* We don't want to set the word flags based on the string contents |
| here -- that's mostly for the parser -- so we just allocate a |
| WORD_DESC *, assign current_word (noting that we don't want to |
| free it), and skip all of make_word. */ |
| t = alloc_word_desc (); |
| t->word = current_word; |
| result = make_word_list (t, result); |
| free_word = 0; |
| result->word->flags &= ~W_HASQUOTEDNULL; /* just to be sure */ |
| if (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) |
| result->word->flags |= W_QUOTED; |
| /* If removing quoted null characters leaves an empty word, note |
| that we saw this for the caller to act on. */ |
| if (current_word == 0 || current_word[0] == '\0') |
| result->word->flags |= W_SAWQUOTEDNULL; |
| } |
| |
| /* If we're not doing sequences of separators in the traditional |
| Bourne shell style, then add a quoted null argument. */ |
| else if (!sh_style_split && !ifs_whitespace (string[sindex])) |
| { |
| t = alloc_word_desc (); |
| t->word = make_quoted_char ('\0'); |
| t->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| result = make_word_list (t, result); |
| } |
| |
| if (free_word) |
| free (current_word); |
| |
| /* Note whether or not the separator is IFS whitespace, used later. */ |
| whitesep = string[sindex] && ifs_whitesep (string[sindex]); |
| |
| /* Move past the current separator character. */ |
| if (string[sindex]) |
| { |
| DECLARE_MBSTATE; |
| ADVANCE_CHAR (string, slen, sindex); |
| } |
| |
| /* Now skip sequences of whitespace characters if they are |
| in the list of separators. */ |
| while (string[sindex] && ifs_whitesep (string[sindex]) && issep (string[sindex])) |
| sindex++; |
| |
| /* If the first separator was IFS whitespace and the current character |
| is a non-whitespace IFS character, it should be part of the current |
| field delimiter, not a separate delimiter that would result in an |
| empty field. Look at POSIX.2, 3.6.5, (3)(b). */ |
| if (string[sindex] && whitesep && issep (string[sindex]) && !ifs_whitesep (string[sindex])) |
| { |
| sindex++; |
| /* An IFS character that is not IFS white space, along with any |
| adjacent IFS white space, shall delimit a field. (SUSv3) */ |
| while (string[sindex] && ifs_whitesep (string[sindex]) && isifs (string[sindex])) |
| sindex++; |
| } |
| } |
| return (REVERSE_LIST (result, WORD_LIST *)); |
| } |
| |
| /* Parse a single word from STRING, using SEPARATORS to separate fields. |
| ENDPTR is set to the first character after the word. This is used by |
| the `read' builtin. |
| |
| This is never called with SEPARATORS != $IFS, and takes advantage of that. |
| |
| XXX - this function is very similar to list_string; they should be |
| combined - XXX */ |
| |
| /* character is in $IFS */ |
| #define islocalsep(c) (local_cmap[(unsigned char)(c)] != 0) |
| |
| char * |
| get_word_from_string (stringp, separators, endptr) |
| char **stringp, *separators, **endptr; |
| { |
| register char *s; |
| char *current_word; |
| int sindex, sh_style_split, whitesep, xflags; |
| unsigned char local_cmap[UCHAR_MAX+1]; /* really only need single-byte chars here */ |
| size_t slen; |
| |
| if (!stringp || !*stringp || !**stringp) |
| return ((char *)NULL); |
| |
| sh_style_split = separators && separators[0] == ' ' && |
| separators[1] == '\t' && |
| separators[2] == '\n' && |
| separators[3] == '\0'; |
| memset (local_cmap, '\0', sizeof (local_cmap)); |
| for (xflags = 0, s = separators; s && *s; s++) |
| { |
| if (*s == CTLESC) xflags |= SX_NOCTLESC; |
| if (*s == CTLNUL) xflags |= SX_NOESCCTLNUL; |
| local_cmap[(unsigned char)*s] = 1; /* local charmap of separators */ |
| } |
| |
| s = *stringp; |
| slen = 0; |
| |
| /* Remove sequences of whitespace at the beginning of STRING, as |
| long as those characters appear in SEPARATORS. This happens if |
| SEPARATORS == $' \t\n' or if IFS is unset. */ |
| if (sh_style_split || separators == 0) |
| for (; *s && spctabnl (*s) && islocalsep (*s); s++); |
| else |
| for (; *s && ifs_whitespace (*s) && islocalsep (*s); s++); |
| |
| /* If the string is nothing but whitespace, update it and return. */ |
| if (!*s) |
| { |
| *stringp = s; |
| if (endptr) |
| *endptr = s; |
| return ((char *)NULL); |
| } |
| |
| /* OK, S points to a word that does not begin with white space. |
| Now extract a word, stopping at a separator, save a pointer to |
| the first character after the word, then skip sequences of spc, |
| tab, or nl as long as they are separators. |
| |
| This obeys the field splitting rules in Posix.2. */ |
| sindex = 0; |
| /* Don't need string length in ADVANCE_CHAR unless multibyte chars are |
| possible, but need it in string_extract_verbatim for bounds checking */ |
| slen = STRLEN (s); |
| current_word = string_extract_verbatim (s, slen, &sindex, separators, xflags); |
| |
| /* Set ENDPTR to the first character after the end of the word. */ |
| if (endptr) |
| *endptr = s + sindex; |
| |
| /* Note whether or not the separator is IFS whitespace, used later. */ |
| whitesep = s[sindex] && ifs_whitesep (s[sindex]); |
| |
| /* Move past the current separator character. */ |
| if (s[sindex]) |
| { |
| DECLARE_MBSTATE; |
| ADVANCE_CHAR (s, slen, sindex); |
| } |
| |
| /* Now skip sequences of space, tab, or newline characters if they are |
| in the list of separators. */ |
| while (s[sindex] && spctabnl (s[sindex]) && islocalsep (s[sindex])) |
| sindex++; |
| |
| /* If the first separator was IFS whitespace and the current character is |
| a non-whitespace IFS character, it should be part of the current field |
| delimiter, not a separate delimiter that would result in an empty field. |
| Look at POSIX.2, 3.6.5, (3)(b). */ |
| if (s[sindex] && whitesep && islocalsep (s[sindex]) && !ifs_whitesep (s[sindex])) |
| { |
| sindex++; |
| /* An IFS character that is not IFS white space, along with any adjacent |
| IFS white space, shall delimit a field. */ |
| while (s[sindex] && ifs_whitesep (s[sindex]) && islocalsep(s[sindex])) |
| sindex++; |
| } |
| |
| /* Update STRING to point to the next field. */ |
| *stringp = s + sindex; |
| return (current_word); |
| } |
| |
| /* Remove IFS white space at the end of STRING. Start at the end |
| of the string and walk backwards until the beginning of the string |
| or we find a character that's not IFS white space and not CTLESC. |
| Only let CTLESC escape a white space character if SAW_ESCAPE is |
| non-zero. */ |
| char * |
| strip_trailing_ifs_whitespace (string, separators, saw_escape) |
| char *string, *separators; |
| int saw_escape; |
| { |
| char *s; |
| |
| s = string + STRLEN (string) - 1; |
| while (s > string && ((spctabnl (*s) && isifs (*s)) || |
| (saw_escape && *s == CTLESC && spctabnl (s[1])))) |
| s--; |
| *++s = '\0'; |
| return string; |
| } |
| |
| #if 0 |
| /* UNUSED */ |
| /* Split STRING into words at whitespace. Obeys shell-style quoting with |
| backslashes, single and double quotes. */ |
| WORD_LIST * |
| list_string_with_quotes (string) |
| char *string; |
| { |
| WORD_LIST *list; |
| char *token, *s; |
| size_t s_len; |
| int c, i, tokstart, len; |
| |
| for (s = string; s && *s && spctabnl (*s); s++) |
| ; |
| if (s == 0 || *s == 0) |
| return ((WORD_LIST *)NULL); |
| |
| s_len = strlen (s); |
| tokstart = i = 0; |
| list = (WORD_LIST *)NULL; |
| while (1) |
| { |
| c = s[i]; |
| if (c == '\\') |
| { |
| i++; |
| if (s[i]) |
| i++; |
| } |
| else if (c == '\'') |
| i = skip_single_quoted (s, s_len, ++i, 0); |
| else if (c == '"') |
| i = skip_double_quoted (s, s_len, ++i, 0); |
| else if (c == 0 || spctabnl (c)) |
| { |
| /* We have found the end of a token. Make a word out of it and |
| add it to the word list. */ |
| token = substring (s, tokstart, i); |
| list = add_string_to_list (token, list); |
| free (token); |
| while (spctabnl (s[i])) |
| i++; |
| if (s[i]) |
| tokstart = i; |
| else |
| break; |
| } |
| else |
| i++; /* normal character */ |
| } |
| return (REVERSE_LIST (list, WORD_LIST *)); |
| } |
| #endif |
| |
| /********************************************************/ |
| /* */ |
| /* Functions to perform assignment statements */ |
| /* */ |
| /********************************************************/ |
| |
| #if defined (ARRAY_VARS) |
| static SHELL_VAR * |
| do_compound_assignment (name, value, flags) |
| char *name, *value; |
| int flags; |
| { |
| SHELL_VAR *v; |
| int mklocal, mkassoc, mkglobal, chklocal; |
| WORD_LIST *list; |
| char *newname; /* used for local nameref references */ |
| |
| mklocal = flags & ASS_MKLOCAL; |
| mkassoc = flags & ASS_MKASSOC; |
| mkglobal = flags & ASS_MKGLOBAL; |
| chklocal = flags & ASS_CHKLOCAL; |
| |
| if (mklocal && variable_context) |
| { |
| v = find_variable (name); /* follows namerefs */ |
| newname = (v == 0) ? nameref_transform_name (name, flags) : v->name; |
| if (v && ((readonly_p (v) && (flags & ASS_FORCE) == 0) || noassign_p (v))) |
| { |
| if (readonly_p (v)) |
| err_readonly (name); |
| return (v); /* XXX */ |
| } |
| list = expand_compound_array_assignment (v, value, flags); |
| if (mkassoc) |
| v = make_local_assoc_variable (newname, 0); |
| else if (v == 0 || (array_p (v) == 0 && assoc_p (v) == 0) || v->context != variable_context) |
| v = make_local_array_variable (newname, 0); |
| if (v) |
| assign_compound_array_list (v, list, flags); |
| if (list) |
| dispose_words (list); |
| } |
| /* In a function but forcing assignment in global context. CHKLOCAL means to |
| check for an existing local variable first. */ |
| else if (mkglobal && variable_context) |
| { |
| v = chklocal ? find_variable (name) : 0; |
| if (v && (local_p (v) == 0 || v->context != variable_context)) |
| v = 0; |
| if (v == 0) |
| v = find_global_variable (name); |
| if (v && ((readonly_p (v) && (flags & ASS_FORCE) == 0) || noassign_p (v))) |
| { |
| if (readonly_p (v)) |
| err_readonly (name); |
| return (v); /* XXX */ |
| } |
| /* sanity check */ |
| newname = (v == 0) ? nameref_transform_name (name, flags) : name; |
| list = expand_compound_array_assignment (v, value, flags); |
| if (v == 0 && mkassoc) |
| v = make_new_assoc_variable (newname); |
| else if (v && mkassoc && assoc_p (v) == 0) |
| v = convert_var_to_assoc (v); |
| else if (v == 0) |
| v = make_new_array_variable (newname); |
| else if (v && mkassoc == 0 && array_p (v) == 0) |
| v = convert_var_to_array (v); |
| if (v) |
| assign_compound_array_list (v, list, flags); |
| if (list) |
| dispose_words (list); |
| } |
| else |
| { |
| v = assign_array_from_string (name, value, flags); |
| if (v && ((readonly_p (v) && (flags & ASS_FORCE) == 0) || noassign_p (v))) |
| { |
| if (readonly_p (v)) |
| err_readonly (name); |
| return (v); /* XXX */ |
| } |
| } |
| |
| return (v); |
| } |
| #endif |
| |
| /* Given STRING, an assignment string, get the value of the right side |
| of the `=', and bind it to the left side. If EXPAND is true, then |
| perform parameter expansion, command substitution, and arithmetic |
| expansion on the right-hand side. Perform tilde expansion in any |
| case. Do not perform word splitting on the result of expansion. */ |
| static int |
| do_assignment_internal (word, expand) |
| const WORD_DESC *word; |
| int expand; |
| { |
| int offset, appendop, assign_list, aflags, retval; |
| char *name, *value, *temp; |
| SHELL_VAR *entry; |
| #if defined (ARRAY_VARS) |
| char *t; |
| int ni; |
| #endif |
| const char *string; |
| |
| if (word == 0 || word->word == 0) |
| return 0; |
| |
| appendop = assign_list = aflags = 0; |
| string = word->word; |
| offset = assignment (string, 0); |
| name = savestring (string); |
| value = (char *)NULL; |
| |
| if (name[offset] == '=') |
| { |
| if (name[offset - 1] == '+') |
| { |
| appendop = 1; |
| name[offset - 1] = '\0'; |
| } |
| |
| name[offset] = 0; /* might need this set later */ |
| temp = name + offset + 1; |
| |
| #if defined (ARRAY_VARS) |
| if (expand && (word->flags & W_COMPASSIGN)) |
| { |
| assign_list = ni = 1; |
| value = extract_array_assignment_list (temp, &ni); |
| } |
| else |
| #endif |
| if (expand && temp[0]) |
| value = expand_string_if_necessary (temp, 0, expand_string_assignment); |
| else |
| value = savestring (temp); |
| } |
| |
| if (value == 0) |
| { |
| value = (char *)xmalloc (1); |
| value[0] = '\0'; |
| } |
| |
| if (echo_command_at_execute) |
| { |
| if (appendop) |
| name[offset - 1] = '+'; |
| xtrace_print_assignment (name, value, assign_list, 1); |
| if (appendop) |
| name[offset - 1] = '\0'; |
| } |
| |
| #define ASSIGN_RETURN(r) do { FREE (value); free (name); return (r); } while (0) |
| |
| if (appendop) |
| aflags |= ASS_APPEND; |
| |
| #if defined (ARRAY_VARS) |
| if (t = mbschr (name, LBRACK)) |
| { |
| if (assign_list) |
| { |
| report_error (_("%s: cannot assign list to array member"), name); |
| ASSIGN_RETURN (0); |
| } |
| entry = assign_array_element (name, value, aflags); |
| if (entry == 0) |
| ASSIGN_RETURN (0); |
| } |
| else if (assign_list) |
| { |
| if ((word->flags & W_ASSIGNARG) && (word->flags & W_CHKLOCAL)) |
| aflags |= ASS_CHKLOCAL; |
| if ((word->flags & W_ASSIGNARG) && (word->flags & W_ASSNGLOBAL) == 0) |
| aflags |= ASS_MKLOCAL; |
| if ((word->flags & W_ASSIGNARG) && (word->flags & W_ASSNGLOBAL)) |
| aflags |= ASS_MKGLOBAL; |
| if (word->flags & W_ASSIGNASSOC) |
| aflags |= ASS_MKASSOC; |
| entry = do_compound_assignment (name, value, aflags); |
| } |
| else |
| #endif /* ARRAY_VARS */ |
| entry = bind_variable (name, value, aflags); |
| |
| if (entry) |
| stupidly_hack_special_variables (entry->name); /* might be a nameref */ |
| else |
| stupidly_hack_special_variables (name); |
| |
| /* Return 1 if the assignment seems to have been performed correctly. */ |
| if (entry == 0 || readonly_p (entry)) |
| retval = 0; /* assignment failure */ |
| else if (noassign_p (entry)) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| retval = 1; /* error status, but not assignment failure */ |
| } |
| else |
| retval = 1; |
| |
| if (entry && retval != 0 && noassign_p (entry) == 0) |
| VUNSETATTR (entry, att_invisible); |
| |
| ASSIGN_RETURN (retval); |
| } |
| |
| /* Perform the assignment statement in STRING, and expand the |
| right side by doing tilde, command and parameter expansion. */ |
| int |
| do_assignment (string) |
| char *string; |
| { |
| WORD_DESC td; |
| |
| td.flags = W_ASSIGNMENT; |
| td.word = string; |
| |
| return do_assignment_internal (&td, 1); |
| } |
| |
| int |
| do_word_assignment (word, flags) |
| WORD_DESC *word; |
| int flags; |
| { |
| return do_assignment_internal (word, 1); |
| } |
| |
| /* Given STRING, an assignment string, get the value of the right side |
| of the `=', and bind it to the left side. Do not perform any word |
| expansions on the right hand side. */ |
| int |
| do_assignment_no_expand (string) |
| char *string; |
| { |
| WORD_DESC td; |
| |
| td.flags = W_ASSIGNMENT; |
| td.word = string; |
| |
| return (do_assignment_internal (&td, 0)); |
| } |
| |
| /*************************************************** |
| * * |
| * Functions to manage the positional parameters * |
| * * |
| ***************************************************/ |
| |
| /* Return the word list that corresponds to `$*'. */ |
| WORD_LIST * |
| list_rest_of_args () |
| { |
| register WORD_LIST *list, *args; |
| int i; |
| |
| /* Break out of the loop as soon as one of the dollar variables is null. */ |
| for (i = 1, list = (WORD_LIST *)NULL; i < 10 && dollar_vars[i]; i++) |
| list = make_word_list (make_bare_word (dollar_vars[i]), list); |
| |
| for (args = rest_of_args; args; args = args->next) |
| list = make_word_list (make_bare_word (args->word->word), list); |
| |
| return (REVERSE_LIST (list, WORD_LIST *)); |
| } |
| |
| /* Return the value of a positional parameter. This handles values > 10. */ |
| char * |
| get_dollar_var_value (ind) |
| intmax_t ind; |
| { |
| char *temp; |
| WORD_LIST *p; |
| |
| if (ind < 10) |
| temp = dollar_vars[ind] ? savestring (dollar_vars[ind]) : (char *)NULL; |
| else /* We want something like ${11} */ |
| { |
| ind -= 10; |
| for (p = rest_of_args; p && ind--; p = p->next) |
| ; |
| temp = p ? savestring (p->word->word) : (char *)NULL; |
| } |
| return (temp); |
| } |
| |
| /* Make a single large string out of the dollar digit variables, |
| and the rest_of_args. If DOLLAR_STAR is 1, then obey the special |
| case of "$*" with respect to IFS. */ |
| char * |
| string_rest_of_args (dollar_star) |
| int dollar_star; |
| { |
| register WORD_LIST *list; |
| char *string; |
| |
| list = list_rest_of_args (); |
| string = dollar_star ? string_list_dollar_star (list, 0, 0) : string_list (list); |
| dispose_words (list); |
| return (string); |
| } |
| |
| /* Return a string containing the positional parameters from START to |
| END, inclusive. If STRING[0] == '*', we obey the rules for $*, |
| which only makes a difference if QUOTED is non-zero. If QUOTED includes |
| Q_HERE_DOCUMENT or Q_DOUBLE_QUOTES, this returns a quoted list, otherwise |
| no quoting chars are added. */ |
| static char * |
| pos_params (string, start, end, quoted, pflags) |
| char *string; |
| int start, end, quoted, pflags; |
| { |
| WORD_LIST *save, *params, *h, *t; |
| char *ret; |
| int i; |
| |
| /* see if we can short-circuit. if start == end, we want 0 parameters. */ |
| if (start == end) |
| return ((char *)NULL); |
| |
| save = params = list_rest_of_args (); |
| if (save == 0 && start > 0) |
| return ((char *)NULL); |
| |
| if (start == 0) /* handle ${@:0[:x]} specially */ |
| { |
| t = make_word_list (make_word (dollar_vars[0]), params); |
| save = params = t; |
| } |
| |
| for (i = start ? 1 : 0; params && i < start; i++) |
| params = params->next; |
| if (params == 0) |
| { |
| dispose_words (save); |
| return ((char *)NULL); |
| } |
| for (h = t = params; params && i < end; i++) |
| { |
| t = params; |
| params = params->next; |
| } |
| t->next = (WORD_LIST *)NULL; |
| |
| ret = string_list_pos_params (string[0], h, quoted, pflags); |
| |
| if (t != params) |
| t->next = params; |
| |
| dispose_words (save); |
| return (ret); |
| } |
| |
| /******************************************************************/ |
| /* */ |
| /* Functions to expand strings to strings or WORD_LISTs */ |
| /* */ |
| /******************************************************************/ |
| |
| #if defined (PROCESS_SUBSTITUTION) |
| #define EXP_CHAR(s) (s == '$' || s == '`' || s == '<' || s == '>' || s == CTLESC || s == '~') |
| #else |
| #define EXP_CHAR(s) (s == '$' || s == '`' || s == CTLESC || s == '~') |
| #endif |
| |
| /* If there are any characters in STRING that require full expansion, |
| then call FUNC to expand STRING; otherwise just perform quote |
| removal if necessary. This returns a new string. */ |
| static char * |
| expand_string_if_necessary (string, quoted, func) |
| char *string; |
| int quoted; |
| EXPFUNC *func; |
| { |
| WORD_LIST *list; |
| size_t slen; |
| int i, saw_quote; |
| char *ret; |
| DECLARE_MBSTATE; |
| |
| /* Don't need string length for ADVANCE_CHAR unless multibyte chars possible. */ |
| slen = (MB_CUR_MAX > 1) ? strlen (string) : 0; |
| i = saw_quote = 0; |
| while (string[i]) |
| { |
| if (EXP_CHAR (string[i])) |
| break; |
| else if (string[i] == '\'' || string[i] == '\\' || string[i] == '"') |
| saw_quote = 1; |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| if (string[i]) |
| { |
| list = (*func) (string, quoted); |
| if (list) |
| { |
| ret = string_list (list); |
| dispose_words (list); |
| } |
| else |
| ret = (char *)NULL; |
| } |
| else if (saw_quote && ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0)) |
| ret = string_quote_removal (string, quoted); |
| else |
| ret = savestring (string); |
| |
| return ret; |
| } |
| |
| static inline char * |
| expand_string_to_string_internal (string, quoted, func) |
| char *string; |
| int quoted; |
| EXPFUNC *func; |
| { |
| WORD_LIST *list; |
| char *ret; |
| |
| if (string == 0 || *string == '\0') |
| return ((char *)NULL); |
| |
| list = (*func) (string, quoted); |
| if (list) |
| { |
| ret = string_list (list); |
| dispose_words (list); |
| } |
| else |
| ret = (char *)NULL; |
| |
| return (ret); |
| } |
| |
| char * |
| expand_string_to_string (string, quoted) |
| char *string; |
| int quoted; |
| { |
| return (expand_string_to_string_internal (string, quoted, expand_string)); |
| } |
| |
| char * |
| expand_string_unsplit_to_string (string, quoted) |
| char *string; |
| int quoted; |
| { |
| return (expand_string_to_string_internal (string, quoted, expand_string_unsplit)); |
| } |
| |
| char * |
| expand_assignment_string_to_string (string, quoted) |
| char *string; |
| int quoted; |
| { |
| return (expand_string_to_string_internal (string, quoted, expand_string_assignment)); |
| } |
| |
| char * |
| expand_arith_string (string, quoted) |
| char *string; |
| int quoted; |
| { |
| WORD_DESC td; |
| WORD_LIST *list, *tlist; |
| size_t slen; |
| int i, saw_quote; |
| char *ret; |
| DECLARE_MBSTATE; |
| |
| /* Don't need string length for ADVANCE_CHAR unless multibyte chars possible. */ |
| slen = (MB_CUR_MAX > 1) ? strlen (string) : 0; |
| i = saw_quote = 0; |
| while (string[i]) |
| { |
| if (EXP_CHAR (string[i])) |
| break; |
| else if (string[i] == '\'' || string[i] == '\\' || string[i] == '"') |
| saw_quote = 1; |
| ADVANCE_CHAR (string, slen, i); |
| } |
| |
| if (string[i]) |
| { |
| /* This is expanded version of expand_string_internal as it's called by |
| expand_string_leave_quoted */ |
| td.flags = W_NOPROCSUB|W_NOTILDE; /* don't want process substitution or tilde expansion */ |
| #if 0 /* TAG: bash-5.2 */ |
| if (quoted & Q_ARRAYSUB) |
| td.flags |= W_NOCOMSUB; |
| #endif |
| td.word = savestring (string); |
| list = call_expand_word_internal (&td, quoted, 0, (int *)NULL, (int *)NULL); |
| /* This takes care of the calls from expand_string_leave_quoted and |
| expand_string */ |
| if (list) |
| { |
| tlist = word_list_split (list); |
| dispose_words (list); |
| list = tlist; |
| if (list) |
| dequote_list (list); |
| } |
| /* This comes from expand_string_if_necessary */ |
| if (list) |
| { |
| ret = string_list (list); |
| dispose_words (list); |
| } |
| else |
| ret = (char *)NULL; |
| FREE (td.word); |
| } |
| else if (saw_quote && (quoted & Q_ARITH)) |
| ret = string_quote_removal (string, quoted); |
| else if (saw_quote && ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0)) |
| ret = string_quote_removal (string, quoted); |
| else |
| ret = savestring (string); |
| |
| return ret; |
| } |
| |
| #if defined (COND_COMMAND) |
| /* Just remove backslashes in STRING. Returns a new string. */ |
| char * |
| remove_backslashes (string) |
| char *string; |
| { |
| char *r, *ret, *s; |
| |
| r = ret = (char *)xmalloc (strlen (string) + 1); |
| for (s = string; s && *s; ) |
| { |
| if (*s == '\\') |
| s++; |
| if (*s == 0) |
| break; |
| *r++ = *s++; |
| } |
| *r = '\0'; |
| return ret; |
| } |
| |
| /* This needs better error handling. */ |
| /* Expand W for use as an argument to a unary or binary operator in a |
| [[...]] expression. If SPECIAL is 1, this is the rhs argument |
| to the != or == operator, and should be treated as a pattern. In |
| this case, we quote the string specially for the globbing code. If |
| SPECIAL is 2, this is an rhs argument for the =~ operator, and should |
| be quoted appropriately for regcomp/regexec. The caller is responsible |
| for removing the backslashes if the unquoted word is needed later. In |
| any case, since we don't perform word splitting, we need to do quoted |
| null character removal. */ |
| char * |
| cond_expand_word (w, special) |
| WORD_DESC *w; |
| int special; |
| { |
| char *r, *p; |
| WORD_LIST *l; |
| int qflags; |
| |
| if (w->word == 0 || w->word[0] == '\0') |
| return ((char *)NULL); |
| |
| expand_no_split_dollar_star = 1; |
| w->flags |= W_NOSPLIT2; |
| l = call_expand_word_internal (w, 0, 0, (int *)0, (int *)0); |
| expand_no_split_dollar_star = 0; |
| if (l) |
| { |
| if (special == 0) /* LHS */ |
| { |
| if (l->word) |
| word_list_remove_quoted_nulls (l); |
| dequote_list (l); |
| r = string_list (l); |
| } |
| else |
| { |
| /* Need to figure out whether or not we should call dequote_escapes |
| or a new dequote_ctlnul function here, and under what |
| circumstances. */ |
| qflags = QGLOB_CVTNULL|QGLOB_CTLESC; |
| if (special == 2) |
| qflags |= QGLOB_REGEXP; |
| word_list_remove_quoted_nulls (l); |
| p = string_list (l); |
| r = quote_string_for_globbing (p, qflags); |
| free (p); |
| } |
| dispose_words (l); |
| } |
| else |
| r = (char *)NULL; |
| |
| return r; |
| } |
| #endif |
| |
| /* Call expand_word_internal to expand W and handle error returns. |
| A convenience function for functions that don't want to handle |
| any errors or free any memory before aborting. */ |
| static WORD_LIST * |
| call_expand_word_internal (w, q, i, c, e) |
| WORD_DESC *w; |
| int q, i, *c, *e; |
| { |
| WORD_LIST *result; |
| |
| result = expand_word_internal (w, q, i, c, e); |
| if (result == &expand_word_error || result == &expand_word_fatal) |
| { |
| /* By convention, each time this error is returned, w->word has |
| already been freed (it sometimes may not be in the fatal case, |
| but that doesn't result in a memory leak because we're going |
| to exit in most cases). */ |
| w->word = (char *)NULL; |
| last_command_exit_value = EXECUTION_FAILURE; |
| exp_jump_to_top_level ((result == &expand_word_error) ? DISCARD : FORCE_EOF); |
| /* NOTREACHED */ |
| return (NULL); |
| } |
| else |
| return (result); |
| } |
| |
| /* Perform parameter expansion, command substitution, and arithmetic |
| expansion on STRING, as if it were a word. Leave the result quoted. |
| Since this does not perform word splitting, it leaves quoted nulls |
| in the result. */ |
| static WORD_LIST * |
| expand_string_internal (string, quoted) |
| char *string; |
| int quoted; |
| { |
| WORD_DESC td; |
| WORD_LIST *tresult; |
| |
| if (string == 0 || *string == 0) |
| return ((WORD_LIST *)NULL); |
| |
| td.flags = 0; |
| td.word = savestring (string); |
| |
| tresult = call_expand_word_internal (&td, quoted, 0, (int *)NULL, (int *)NULL); |
| |
| FREE (td.word); |
| return (tresult); |
| } |
| |
| /* Expand STRING by performing parameter expansion, command substitution, |
| and arithmetic expansion. Dequote the resulting WORD_LIST before |
| returning it, but do not perform word splitting. The call to |
| remove_quoted_nulls () is in here because word splitting normally |
| takes care of quote removal. */ |
| WORD_LIST * |
| expand_string_unsplit (string, quoted) |
| char *string; |
| int quoted; |
| { |
| WORD_LIST *value; |
| |
| if (string == 0 || *string == '\0') |
| return ((WORD_LIST *)NULL); |
| |
| expand_no_split_dollar_star = 1; |
| value = expand_string_internal (string, quoted); |
| expand_no_split_dollar_star = 0; |
| |
| if (value) |
| { |
| if (value->word) |
| { |
| remove_quoted_nulls (value->word->word); /* XXX */ |
| value->word->flags &= ~W_HASQUOTEDNULL; |
| } |
| dequote_list (value); |
| } |
| return (value); |
| } |
| |
| /* Expand the rhs of an assignment statement */ |
| WORD_LIST * |
| expand_string_assignment (string, quoted) |
| char *string; |
| int quoted; |
| { |
| WORD_DESC td; |
| WORD_LIST *value; |
| |
| if (string == 0 || *string == '\0') |
| return ((WORD_LIST *)NULL); |
| |
| expand_no_split_dollar_star = 1; |
| |
| #if 0 |
| /* Other shells (ksh93) do it this way, which affects how $@ is expanded |
| in constructs like bar=${@#0} (preserves the spaces resulting from the |
| expansion of $@ in a context where you don't do word splitting); Posix |
| interp 888 makes the expansion of $@ in contexts where word splitting |
| is not performed unspecified. */ |
| td.flags = W_ASSIGNRHS|W_NOSPLIT2; /* Posix interp 888 */ |
| #else |
| td.flags = W_ASSIGNRHS; |
| #endif |
| td.word = savestring (string); |
| value = call_expand_word_internal (&td, quoted, 0, (int *)NULL, (int *)NULL); |
| FREE (td.word); |
| |
| expand_no_split_dollar_star = 0; |
| |
| if (value) |
| { |
| if (value->word) |
| { |
| remove_quoted_nulls (value->word->word); /* XXX */ |
| value->word->flags &= ~W_HASQUOTEDNULL; |
| } |
| dequote_list (value); |
| } |
| return (value); |
| } |
| |
| |
| /* Expand one of the PS? prompt strings. This is a sort of combination of |
| expand_string_unsplit and expand_string_internal, but returns the |
| passed string when an error occurs. Might want to trap other calls |
| to jump_to_top_level here so we don't endlessly loop. */ |
| WORD_LIST * |
| expand_prompt_string (string, quoted, wflags) |
| char *string; |
| int quoted; |
| int wflags; |
| { |
| WORD_LIST *value; |
| WORD_DESC td; |
| |
| if (string == 0 || *string == 0) |
| return ((WORD_LIST *)NULL); |
| |
| td.flags = wflags; |
| td.word = savestring (string); |
| |
| no_longjmp_on_fatal_error = 1; |
| value = expand_word_internal (&td, quoted, 0, (int *)NULL, (int *)NULL); |
| no_longjmp_on_fatal_error = 0; |
| |
| if (value == &expand_word_error || value == &expand_word_fatal) |
| { |
| value = make_word_list (make_bare_word (string), (WORD_LIST *)NULL); |
| return value; |
| } |
| FREE (td.word); |
| if (value) |
| { |
| if (value->word) |
| { |
| remove_quoted_nulls (value->word->word); /* XXX */ |
| value->word->flags &= ~W_HASQUOTEDNULL; |
| } |
| dequote_list (value); |
| } |
| return (value); |
| } |
| |
| /* Expand STRING just as if you were expanding a word, but do not dequote |
| the resultant WORD_LIST. This is called only from within this file, |
| and is used to correctly preserve quoted characters when expanding |
| things like ${1+"$@"}. This does parameter expansion, command |
| substitution, arithmetic expansion, and word splitting. */ |
| static WORD_LIST * |
| expand_string_leave_quoted (string, quoted) |
| char *string; |
| int quoted; |
| { |
| WORD_LIST *tlist; |
| WORD_LIST *tresult; |
| |
| if (string == 0 || *string == '\0') |
| return ((WORD_LIST *)NULL); |
| |
| tlist = expand_string_internal (string, quoted); |
| |
| if (tlist) |
| { |
| tresult = word_list_split (tlist); |
| dispose_words (tlist); |
| return (tresult); |
| } |
| return ((WORD_LIST *)NULL); |
| } |
| |
| /* This does not perform word splitting or dequote the WORD_LIST |
| it returns. */ |
| static WORD_LIST * |
| expand_string_for_rhs (string, quoted, op, pflags, dollar_at_p, expanded_p) |
| char *string; |
| int quoted, op, pflags; |
| int *dollar_at_p, *expanded_p; |
| { |
| WORD_DESC td; |
| WORD_LIST *tresult; |
| int old_nosplit; |
| |
| if (string == 0 || *string == '\0') |
| return (WORD_LIST *)NULL; |
| |
| /* We want field splitting to be determined by what is going to be done with |
| the entire ${parameterOPword} expansion, so we don't want to split the RHS |
| we expand here. However, the expansion of $* is determined by whether we |
| are going to eventually perform word splitting, so we want to set this |
| depending on whether or not are are going to be splitting: if the expansion |
| is quoted, if the OP is `=', or if IFS is set to the empty string, we |
| are not going to be splitting, so we set expand_no_split_dollar_star to |
| note this to callees. |
| We pass through PF_ASSIGNRHS as W_ASSIGNRHS if this is on the RHS of an |
| assignment statement. */ |
| /* The updated treatment of $* is the result of Posix interp 888 */ |
| /* This was further clarified on the austin-group list in March, 2017 and |
| in Posix bug 1129 */ |
| old_nosplit = expand_no_split_dollar_star; |
| expand_no_split_dollar_star = (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) || op == '=' || ifs_is_null == 0; /* XXX - was 1 */ |
| td.flags = W_EXPANDRHS; /* expanding RHS of ${paramOPword} */ |
| td.flags |= W_NOSPLIT2; /* no splitting, remove "" and '' */ |
| if (pflags & PF_ASSIGNRHS) /* pass through */ |
| td.flags |= W_ASSIGNRHS; |
| if (op == '=') |
| #if 0 |
| td.flags |= W_ASSIGNRHS; /* expand b in ${a=b} like assignment */ |
| #else |
| td.flags |= W_ASSIGNRHS|W_NOASSNTILDE; /* expand b in ${a=b} like assignment */ |
| #endif |
| td.word = string; |
| tresult = call_expand_word_internal (&td, quoted, 1, dollar_at_p, expanded_p); |
| expand_no_split_dollar_star = old_nosplit; |
| |
| return (tresult); |
| } |
| |
| /* This does not perform word splitting or dequote the WORD_LIST |
| it returns and it treats $* as if it were quoted. */ |
| static WORD_LIST * |
| expand_string_for_pat (string, quoted, dollar_at_p, expanded_p) |
| char *string; |
| int quoted, *dollar_at_p, *expanded_p; |
| { |
| WORD_DESC td; |
| WORD_LIST *tresult; |
| int oexp; |
| |
| if (string == 0 || *string == '\0') |
| return (WORD_LIST *)NULL; |
| |
| oexp = expand_no_split_dollar_star; |
| expand_no_split_dollar_star = 1; |
| td.flags = W_NOSPLIT2; /* no splitting, remove "" and '' */ |
| td.word = string; |
| tresult = call_expand_word_internal (&td, quoted, 1, dollar_at_p, expanded_p); |
| expand_no_split_dollar_star = oexp; |
| |
| return (tresult); |
| } |
| |
| /* Expand STRING just as if you were expanding a word. This also returns |
| a list of words. Note that filename globbing is *NOT* done for word |
| or string expansion, just when the shell is expanding a command. This |
| does parameter expansion, command substitution, arithmetic expansion, |
| and word splitting. Dequote the resultant WORD_LIST before returning. */ |
| WORD_LIST * |
| expand_string (string, quoted) |
| char *string; |
| int quoted; |
| { |
| WORD_LIST *result; |
| |
| if (string == 0 || *string == '\0') |
| return ((WORD_LIST *)NULL); |
| |
| result = expand_string_leave_quoted (string, quoted); |
| return (result ? dequote_list (result) : result); |
| } |
| |
| /******************************************* |
| * * |
| * Functions to expand WORD_DESCs * |
| * * |
| *******************************************/ |
| |
| /* Expand WORD, performing word splitting on the result. This does |
| parameter expansion, command substitution, arithmetic expansion, |
| word splitting, and quote removal. */ |
| |
| WORD_LIST * |
| expand_word (word, quoted) |
| WORD_DESC *word; |
| int quoted; |
| { |
| WORD_LIST *result, *tresult; |
| |
| tresult = call_expand_word_internal (word, quoted, 0, (int *)NULL, (int *)NULL); |
| result = word_list_split (tresult); |
| dispose_words (tresult); |
| return (result ? dequote_list (result) : result); |
| } |
| |
| /* Expand WORD, but do not perform word splitting on the result. This |
| does parameter expansion, command substitution, arithmetic expansion, |
| and quote removal. */ |
| WORD_LIST * |
| expand_word_unsplit (word, quoted) |
| WORD_DESC *word; |
| int quoted; |
| { |
| WORD_LIST *result; |
| |
| result = expand_word_leave_quoted (word, quoted); |
| return (result ? dequote_list (result) : result); |
| } |
| |
| /* Perform shell expansions on WORD, but do not perform word splitting or |
| quote removal on the result. Virtually identical to expand_word_unsplit; |
| could be combined if implementations don't diverge. */ |
| WORD_LIST * |
| expand_word_leave_quoted (word, quoted) |
| WORD_DESC *word; |
| int quoted; |
| { |
| WORD_LIST *result; |
| |
| expand_no_split_dollar_star = 1; |
| if (ifs_is_null) |
| word->flags |= W_NOSPLIT; |
| word->flags |= W_NOSPLIT2; |
| result = call_expand_word_internal (word, quoted, 0, (int *)NULL, (int *)NULL); |
| expand_no_split_dollar_star = 0; |
| |
| return result; |
| } |
| |
| /*************************************************** |
| * * |
| * Functions to handle quoting chars * |
| * * |
| ***************************************************/ |
| |
| /* Conventions: |
| |
| A string with s[0] == CTLNUL && s[1] == 0 is a quoted null string. |
| The parser passes CTLNUL as CTLESC CTLNUL. */ |
| |
| /* Quote escape characters in string s, but no other characters. This is |
| used to protect CTLESC and CTLNUL in variable values from the rest of |
| the word expansion process after the variable is expanded (word splitting |
| and filename generation). If IFS is null, we quote spaces as well, just |
| in case we split on spaces later (in the case of unquoted $@, we will |
| eventually attempt to split the entire word on spaces). Corresponding |
| code exists in dequote_escapes. Even if we don't end up splitting on |
| spaces, quoting spaces is not a problem. This should never be called on |
| a string that is quoted with single or double quotes or part of a here |
| document (effectively double-quoted). |
| FLAGS says whether or not we are going to split the result. If we are not, |
| and there is a CTLESC or CTLNUL in IFS, we need to quote CTLESC and CTLNUL, |
| respectively, to prevent them from being removed as part of dequoting. */ |
| static char * |
| quote_escapes_internal (string, flags) |
| const char *string; |
| int flags; |
| { |
| const char *s, *send; |
| char *t, *result; |
| size_t slen; |
| int quote_spaces, skip_ctlesc, skip_ctlnul, nosplit; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| send = string + slen; |
| |
| quote_spaces = (ifs_value && *ifs_value == 0); |
| nosplit = (flags & PF_NOSPLIT2); |
| |
| for (skip_ctlesc = skip_ctlnul = 0, s = ifs_value; s && *s; s++) |
| { |
| skip_ctlesc |= (nosplit == 0 && *s == CTLESC); |
| skip_ctlnul |= (nosplit == 0 && *s == CTLNUL); |
| } |
| |
| t = result = (char *)xmalloc ((slen * 2) + 1); |
| s = string; |
| |
| while (*s) |
| { |
| if ((skip_ctlesc == 0 && *s == CTLESC) || (skip_ctlnul == 0 && *s == CTLNUL) || (quote_spaces && *s == ' ')) |
| *t++ = CTLESC; |
| COPY_CHAR_P (t, s, send); |
| } |
| *t = '\0'; |
| |
| return (result); |
| } |
| |
| char * |
| quote_escapes (string) |
| const char *string; |
| { |
| return (quote_escapes_internal (string, 0)); |
| } |
| |
| char * |
| quote_rhs (string) |
| const char *string; |
| { |
| return (quote_escapes_internal (string, PF_NOSPLIT2)); |
| } |
| |
| static WORD_LIST * |
| list_quote_escapes (list) |
| WORD_LIST *list; |
| { |
| register WORD_LIST *w; |
| char *t; |
| |
| for (w = list; w; w = w->next) |
| { |
| t = w->word->word; |
| w->word->word = quote_escapes (t); |
| free (t); |
| } |
| return list; |
| } |
| |
| /* Inverse of quote_escapes; remove CTLESC protecting CTLESC or CTLNUL. |
| |
| The parser passes us CTLESC as CTLESC CTLESC and CTLNUL as CTLESC CTLNUL. |
| This is necessary to make unquoted CTLESC and CTLNUL characters in the |
| data stream pass through properly. |
| |
| We need to remove doubled CTLESC characters inside quoted strings before |
| quoting the entire string, so we do not double the number of CTLESC |
| characters. |
| |
| Also used by parts of the pattern substitution code. */ |
| char * |
| dequote_escapes (string) |
| const char *string; |
| { |
| const char *s, *send; |
| char *t, *result; |
| size_t slen; |
| int quote_spaces; |
| DECLARE_MBSTATE; |
| |
| if (string == 0) |
| return (char *)0; |
| |
| slen = strlen (string); |
| send = string + slen; |
| |
| t = result = (char *)xmalloc (slen + 1); |
| |
| if (strchr (string, CTLESC) == 0) |
| return (strcpy (result, string)); |
| |
| quote_spaces = (ifs_value && *ifs_value == 0); |
| |
| s = string; |
| while (*s) |
| { |
| if (*s == CTLESC && (s[1] == CTLESC || s[1] == CTLNUL || (quote_spaces && s[1] == ' '))) |
| { |
| s++; |
| if (*s == '\0') |
| break; |
| } |
| COPY_CHAR_P (t, s, send); |
| } |
| *t = '\0'; |
| |
| return result; |
| } |
| |
| #if defined (INCLUDE_UNUSED) |
| static WORD_LIST * |
| list_dequote_escapes (list) |
| WORD_LIST *list; |
| { |
| register WORD_LIST *w; |
| char *t; |
| |
| for (w = list; w; w = w->next) |
| { |
| t = w->word->word; |
| w->word->word = dequote_escapes (t); |
| free (t); |
| } |
| return list; |
| } |
| #endif |
| |
| /* Return a new string with the quoted representation of character C. |
| This turns "" into QUOTED_NULL, so the W_HASQUOTEDNULL flag needs to be |
| set in any resultant WORD_DESC where this value is the word. */ |
| static char * |
| make_quoted_char (c) |
| int c; |
| { |
| char *temp; |
| |
| temp = (char *)xmalloc (3); |
| if (c == 0) |
| { |
| temp[0] = CTLNUL; |
| temp[1] = '\0'; |
| } |
| else |
| { |
| temp[0] = CTLESC; |
| temp[1] = c; |
| temp[2] = '\0'; |
| } |
| return (temp); |
| } |
| |
| /* Quote STRING, returning a new string. This turns "" into QUOTED_NULL, so |
| the W_HASQUOTEDNULL flag needs to be set in any resultant WORD_DESC where |
| this value is the word. */ |
| char * |
| quote_string (string) |
| char *string; |
| { |
| register char *t; |
| size_t slen; |
| char *result, *send; |
| |
| if (*string == 0) |
| { |
| result = (char *)xmalloc (2); |
| result[0] = CTLNUL; |
| result[1] = '\0'; |
| } |
| else |
| { |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| send = string + slen; |
| |
| result = (char *)xmalloc ((slen * 2) + 1); |
| |
| for (t = result; string < send; ) |
| { |
| *t++ = CTLESC; |
| COPY_CHAR_P (t, string, send); |
| } |
| *t = '\0'; |
| } |
| return (result); |
| } |
| |
| /* De-quote quoted characters in STRING. */ |
| char * |
| dequote_string (string) |
| char *string; |
| { |
| register char *s, *t; |
| size_t slen; |
| char *result, *send; |
| DECLARE_MBSTATE; |
| |
| #if defined (DEBUG) |
| if (string[0] == CTLESC && string[1] == 0) |
| internal_inform ("dequote_string: string with bare CTLESC"); |
| #endif |
| |
| slen = STRLEN (string); |
| |
| t = result = (char *)xmalloc (slen + 1); |
| |
| if (QUOTED_NULL (string)) |
| { |
| result[0] = '\0'; |
| return (result); |
| } |
| |
| /* A string consisting of only a single CTLESC should pass through unchanged */ |
| if (string[0] == CTLESC && string[1] == 0) |
| { |
| result[0] = CTLESC; |
| result[1] = '\0'; |
| return (result); |
| } |
| |
| /* If no character in the string can be quoted, don't bother examining |
| each character. Just return a copy of the string passed to us. */ |
| if (strchr (string, CTLESC) == NULL) |
| return (strcpy (result, string)); |
| |
| send = string + slen; |
| s = string; |
| while (*s) |
| { |
| if (*s == CTLESC) |
| { |
| s++; |
| if (*s == '\0') |
| break; |
| } |
| COPY_CHAR_P (t, s, send); |
| } |
| |
| *t = '\0'; |
| return (result); |
| } |
| |
| /* Quote the entire WORD_LIST list. */ |
| static WORD_LIST * |
| quote_list (list) |
| WORD_LIST *list; |
| { |
| register WORD_LIST *w; |
| char *t; |
| |
| for (w = list; w; w = w->next) |
| { |
| t = w->word->word; |
| w->word->word = quote_string (t); |
| if (*t == 0) |
| w->word->flags |= W_HASQUOTEDNULL; /* XXX - turn on W_HASQUOTEDNULL here? */ |
| w->word->flags |= W_QUOTED; |
| free (t); |
| } |
| return list; |
| } |
| |
| WORD_DESC * |
| dequote_word (word) |
| WORD_DESC *word; |
| { |
| register char *s; |
| |
| s = dequote_string (word->word); |
| if (QUOTED_NULL (word->word)) |
| word->flags &= ~W_HASQUOTEDNULL; |
| free (word->word); |
| word->word = s; |
| |
| return word; |
| } |
| |
| /* De-quote quoted characters in each word in LIST. */ |
| WORD_LIST * |
| dequote_list (list) |
| WORD_LIST *list; |
| { |
| register char *s; |
| register WORD_LIST *tlist; |
| |
| for (tlist = list; tlist; tlist = tlist->next) |
| { |
| s = dequote_string (tlist->word->word); |
| if (QUOTED_NULL (tlist->word->word)) |
| tlist->word->flags &= ~W_HASQUOTEDNULL; |
| free (tlist->word->word); |
| tlist->word->word = s; |
| } |
| return list; |
| } |
| |
| /* Remove CTLESC protecting a CTLESC or CTLNUL in place. Return the passed |
| string. */ |
| char * |
| remove_quoted_escapes (string) |
| char *string; |
| { |
| char *t; |
| |
| if (string) |
| { |
| t = dequote_escapes (string); |
| strcpy (string, t); |
| free (t); |
| } |
| |
| return (string); |
| } |
| |
| /* Remove quoted $IFS characters from STRING. Quoted IFS characters are |
| added to protect them from word splitting, but we need to remove them |
| if no word splitting takes place. This returns newly-allocated memory, |
| so callers can use it to replace savestring(). */ |
| char * |
| remove_quoted_ifs (string) |
| char *string; |
| { |
| register size_t slen; |
| register int i, j; |
| char *ret, *send; |
| DECLARE_MBSTATE; |
| |
| slen = strlen (string); |
| send = string + slen; |
| |
| i = j = 0; |
| ret = (char *)xmalloc (slen + 1); |
| |
| while (i < slen) |
| { |
| if (string[i] == CTLESC) |
| { |
| i++; |
| if (string[i] == 0 || isifs (string[i]) == 0) |
| ret[j++] = CTLESC; |
| if (i == slen) |
| break; |
| } |
| |
| COPY_CHAR_I (ret, j, string, send, i); |
| } |
| ret[j] = '\0'; |
| |
| return (ret); |
| } |
| |
| char * |
| remove_quoted_nulls (string) |
| char *string; |
| { |
| register size_t slen; |
| register int i, j, prev_i; |
| DECLARE_MBSTATE; |
| |
| if (strchr (string, CTLNUL) == 0) /* XXX */ |
| return string; /* XXX */ |
| |
| slen = strlen (string); |
| i = j = 0; |
| |
| while (i < slen) |
| { |
| if (string[i] == CTLESC) |
| { |
| /* Old code had j++, but we cannot assume that i == j at this |
| point -- what if a CTLNUL has already been removed from the |
| string? We don't want to drop the CTLESC or recopy characters |
| that we've already copied down. */ |
| i++; |
| string[j++] = CTLESC; |
| if (i == slen) |
| break; |
| } |
| else if (string[i] == CTLNUL) |
| { |
| i++; |
| continue; |
| } |
| |
| prev_i = i; |
| ADVANCE_CHAR (string, slen, i); /* COPY_CHAR_I? */ |
| if (j < prev_i) |
| { |
| do string[j++] = string[prev_i++]; while (prev_i < i); |
| } |
| else |
| j = i; |
| } |
| string[j] = '\0'; |
| |
| return (string); |
| } |
| |
| /* Perform quoted null character removal on each element of LIST. |
| This modifies LIST. */ |
| void |
| word_list_remove_quoted_nulls (list) |
| WORD_LIST *list; |
| { |
| register WORD_LIST *t; |
| |
| for (t = list; t; t = t->next) |
| { |
| remove_quoted_nulls (t->word->word); |
| t->word->flags &= ~W_HASQUOTEDNULL; |
| } |
| } |
| |
| /* **************************************************************** */ |
| /* */ |
| /* Functions for Matching and Removing Patterns */ |
| /* */ |
| /* **************************************************************** */ |
| |
| #if defined (HANDLE_MULTIBYTE) |
| # ifdef INCLUDE_UNUSED |
| static unsigned char * |
| mb_getcharlens (string, len) |
| char *string; |
| int len; |
| { |
| int i, offset, last; |
| unsigned char *ret; |
| char *p; |
| DECLARE_MBSTATE; |
| |
| i = offset = 0; |
| last = 0; |
| ret = (unsigned char *)xmalloc (len); |
| memset (ret, 0, len); |
| while (string[last]) |
| { |
| ADVANCE_CHAR (string, len, offset); |
| ret[last] = offset - last; |
| last = offset; |
| } |
| return ret; |
| } |
| # endif |
| #endif |
| |
| /* Remove the portion of PARAM matched by PATTERN according to OP, where OP |
| can have one of 4 values: |
| RP_LONG_LEFT remove longest matching portion at start of PARAM |
| RP_SHORT_LEFT remove shortest matching portion at start of PARAM |
| RP_LONG_RIGHT remove longest matching portion at end of PARAM |
| RP_SHORT_RIGHT remove shortest matching portion at end of PARAM |
| */ |
| |
| #define RP_LONG_LEFT 1 |
| #define RP_SHORT_LEFT 2 |
| #define RP_LONG_RIGHT 3 |
| #define RP_SHORT_RIGHT 4 |
| |
| /* Returns its first argument if nothing matched; new memory otherwise */ |
| static char * |
| remove_upattern (param, pattern, op) |
| char *param, *pattern; |
| int op; |
| { |
| register size_t len; |
| register char *end; |
| register char *p, *ret, c; |
| |
| len = STRLEN (param); |
| end = param + len; |
| |
| switch (op) |
| { |
| case RP_LONG_LEFT: /* remove longest match at start */ |
| for (p = end; p >= param; p--) |
| { |
| c = *p; *p = '\0'; |
| if (strmatch (pattern, param, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| *p = c; |
| return (savestring (p)); |
| } |
| *p = c; |
| |
| } |
| break; |
| |
| case RP_SHORT_LEFT: /* remove shortest match at start */ |
| for (p = param; p <= end; p++) |
| { |
| c = *p; *p = '\0'; |
| if (strmatch (pattern, param, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| *p = c; |
| return (savestring (p)); |
| } |
| *p = c; |
| } |
| break; |
| |
| case RP_LONG_RIGHT: /* remove longest match at end */ |
| for (p = param; p <= end; p++) |
| { |
| if (strmatch (pattern, p, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| c = *p; *p = '\0'; |
| ret = savestring (param); |
| *p = c; |
| return (ret); |
| } |
| } |
| break; |
| |
| case RP_SHORT_RIGHT: /* remove shortest match at end */ |
| for (p = end; p >= param; p--) |
| { |
| if (strmatch (pattern, p, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| c = *p; *p = '\0'; |
| ret = savestring (param); |
| *p = c; |
| return (ret); |
| } |
| } |
| break; |
| } |
| |
| return (param); /* no match, return original string */ |
| } |
| |
| #if defined (HANDLE_MULTIBYTE) |
| /* Returns its first argument if nothing matched; new memory otherwise */ |
| static wchar_t * |
| remove_wpattern (wparam, wstrlen, wpattern, op) |
| wchar_t *wparam; |
| size_t wstrlen; |
| wchar_t *wpattern; |
| int op; |
| { |
| wchar_t wc, *ret; |
| int n; |
| |
| switch (op) |
| { |
| case RP_LONG_LEFT: /* remove longest match at start */ |
| for (n = wstrlen; n >= 0; n--) |
| { |
| wc = wparam[n]; wparam[n] = L'\0'; |
| if (wcsmatch (wpattern, wparam, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| wparam[n] = wc; |
| return (wcsdup (wparam + n)); |
| } |
| wparam[n] = wc; |
| } |
| break; |
| |
| case RP_SHORT_LEFT: /* remove shortest match at start */ |
| for (n = 0; n <= wstrlen; n++) |
| { |
| wc = wparam[n]; wparam[n] = L'\0'; |
| if (wcsmatch (wpattern, wparam, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| wparam[n] = wc; |
| return (wcsdup (wparam + n)); |
| } |
| wparam[n] = wc; |
| } |
| break; |
| |
| case RP_LONG_RIGHT: /* remove longest match at end */ |
| for (n = 0; n <= wstrlen; n++) |
| { |
| if (wcsmatch (wpattern, wparam + n, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| wc = wparam[n]; wparam[n] = L'\0'; |
| ret = wcsdup (wparam); |
| wparam[n] = wc; |
| return (ret); |
| } |
| } |
| break; |
| |
| case RP_SHORT_RIGHT: /* remove shortest match at end */ |
| for (n = wstrlen; n >= 0; n--) |
| { |
| if (wcsmatch (wpattern, wparam + n, FNMATCH_EXTFLAG) != FNM_NOMATCH) |
| { |
| wc = wparam[n]; wparam[n] = L'\0'; |
| ret = wcsdup (wparam); |
| wparam[n] = wc; |
| return (ret); |
| } |
| } |
| break; |
| } |
| |
| return (wparam); /* no match, return original string */ |
| } |
| #endif /* HANDLE_MULTIBYTE */ |
| |
| static char * |
| remove_pattern (param, pattern, op) |
| char *param, *pattern; |
| int op; |
| { |
| char *xret; |
| |
| if (param == NULL) |
| return (param); |
| if (*param == '\0' || pattern == NULL || *pattern == '\0') /* minor optimization */ |
| return (savestring (param)); |
| |
| #if defined (HANDLE_MULTIBYTE) |
| if (MB_CUR_MAX > 1) |
| { |
| wchar_t *ret, *oret; |
| size_t n; |
| wchar_t *wparam, *wpattern; |
| mbstate_t ps; |
| |
| /* XXX - could optimize here by checking param and pattern for multibyte |
| chars with mbsmbchar and calling remove_upattern. */ |
| |
| n = xdupmbstowcs (&wpattern, NULL, pattern); |
| if (n == (size_t)-1) |
| { |
| xret = remove_upattern (param, pattern, op); |
| return ((xret == param) ? savestring (param) : xret); |
| } |
| n = xdupmbstowcs (&wparam, NULL, param); |
| |
| if (n == (size_t)-1) |
| { |
| free (wpattern); |
| xret = remove_upattern (param, pattern, op); |
| return ((xret == param) ? savestring (param) : xret); |
| } |
| oret = ret = remove_wpattern (wparam, n, wpattern, op); |
| /* Don't bother to convert wparam back to multibyte string if nothing |
| matched; just return copy of original string */ |
| if (ret == wparam) |
| { |
| free (wparam); |
| free (wpattern); |
| return (savestring (param)); |
| } |
| |
| free (wparam); |
| free (wpattern); |
| |
| n = strlen (param); |
| xret = (char *)xmalloc (n + 1); |
| memset (&ps, '\0', sizeof (mbstate_t)); |
| n = wcsrtombs (xret, (const wchar_t **)&ret, n, &ps); |
| xret[n] = '\0'; /* just to make sure */ |
| free (oret); |
| return xret; |
| } |
| else |
| #endif |
| { |
| xret = remove_upattern (param, pattern, op); |
| return ((xret == param) ? savestring (param) : xret); |
| } |
| } |
| |
| /* Match PAT anywhere in STRING and return the match boundaries. |
| This returns 1 in case of a successful match, 0 otherwise. SP |
| and EP are pointers into the string where the match begins and |
| ends, respectively. MTYPE controls what kind of match is attempted. |
| MATCH_BEG and MATCH_END anchor the match at the beginning and end |
| of the string, respectively. The longest match is returned. */ |
| static int |
| match_upattern (string, pat, mtype, sp, ep) |
| char *string, *pat; |
| int mtype; |
| char **sp, **ep; |
| { |
| int c, mlen; |
| size_t len; |
| register char *p, *p1, *npat; |
| char *end; |
| |
| /* If the pattern doesn't match anywhere in the string, go ahead and |
| short-circuit right away. A minor optimization, saves a bunch of |
| unnecessary calls to strmatch (up to N calls for a string of N |
| characters) if the match is unsuccessful. To preserve the semantics |
| of the substring matches below, we make sure that the pattern has |
| `*' as first and last character, making a new pattern if necessary. */ |
| /* XXX - check this later if I ever implement `**' with special meaning, |
| since this will potentially result in `**' at the beginning or end */ |
| len = STRLEN (pat); |
| if (pat[0] != '*' || (pat[0] == '*' && pat[1] == LPAREN && extended_glob) || pat[len - 1] != '*') |
| { |
| int unescaped_backslash; |
| char *pp; |
| |
| p = npat = (char *)xmalloc (len + 3); |
| p1 = pat; |
| if ((mtype != MATCH_BEG) && (*p1 != '*' || (*p1 == '*' && p1[1] == LPAREN && extended_glob))) |
| *p++ = '*'; |
| while (*p1) |
| *p++ = *p1++; |
| #if 1 |
| /* Need to also handle a pattern that ends with an unescaped backslash. |
| For right now, we ignore it because the pattern matching code will |
| fail the match anyway */ |
| /* If the pattern ends with a `*' we leave it alone if it's preceded by |
| an even number of backslashes, but if it's escaped by a backslash |
| we need to add another `*'. */ |
| if ((mtype != MATCH_END) && (p1[-1] == '*' && (unescaped_backslash = p1[-2] == '\\'))) |
| { |
| pp = p1 - 3; |
| while (pp >= pat && *pp-- == '\\') |
| unescaped_backslash = 1 - unescaped_backslash; |
| if (unescaped_backslash) |
| *p++ = '*'; |
| } |
| else if (mtype != MATCH_END && p1[-1] != '*') |
| *p++ = '*'; |
| #else |
| if (p1[-1] != '*' || p1[-2] == '\\') |
| *p++ = '*'; |
| #endif |
| *p = '\0'; |
| } |
| else |
| npat = pat; |
| c = strmatch (npat, string, FNMATCH_EXTFLAG | FNMATCH_IGNCASE); |
| if (npat != pat) |
| free (npat); |
| if (c == FNM_NOMATCH) |
| return (0); |
| |
| len = STRLEN (string); |
| end = string + len; |
| |
| mlen = umatchlen (pat, len); |
| if (mlen > (int)len) |
| return (0); |
| |
| switch (mtype) |
| { |
| case MATCH_ANY: |
| for (p = string; p <= end; p++) |
| { |
| if (match_pattern_char (pat, p, FNMATCH_IGNCASE)) |
| { |
| p1 = (mlen == -1) ? end : p + mlen; |
| /* p1 - p = length of portion of string to be considered |
| p = current position in string |
| mlen = number of characters consumed by match (-1 for entire string) |
| end = end of string |
| we want to break immediately if the potential match len |
| is greater than the number of characters remaining in the |
| string |
| */ |
| if (p1 > end) |
| break; |
| for ( ; p1 >= p; p1--) |
| { |
| c = *p1; *p1 = '\0'; |
| if (strmatch (pat, p, FNMATCH_EXTFLAG | FNMATCH_IGNCASE) == 0) |
| { |
| *p1 = c; |
| *sp = p; |
| *ep = p1; |
| return 1; |
| } |
| *p1 = c; |
| #if 1 |
| /* If MLEN != -1, we have a fixed length pattern. */ |
| if (mlen != -1) |
| break; |
| #endif |
| } |
| } |
| } |
| |
| return (0); |
| |
| case MATCH_BEG: |
| if (match_pattern_char (pat, string, FNMATCH_IGNCASE) == 0) |
| return (0); |
| |
| for (p = (mlen == -1) ? end : string + mlen; p >= string; p--) |
| { |
| c = *p; *p = '\0'; |
| if (strmatch (pat, string, FNMATCH_EXTFLAG | FNMATCH_IGNCASE) == 0) |
| { |
| *p = c; |
| *sp = string; |
| *ep = p; |
| return 1; |
| } |
| *p = c; |
| /* If MLEN != -1, we have a fixed length pattern. */ |
| if (mlen != -1) |
| break; |
| } |
| |
| return (0); |
| |
| case MATCH_END: |
| for (p = end - ((mlen == -1) ? len : mlen); p <= end; p++) |
| { |
| if (strmatch (pat, p, FNMATCH_EXTFLAG | FNMATCH_IGNCASE) == 0) |
| { |
| *sp = p; |
| *ep = end; |
| return 1; |
| } |
| /* If MLEN != -1, we have a fixed length pattern. */ |
| if (mlen != -1) |
| break; |
| } |
| |
| return (0); |
| } |
| |
| return (0); |
| } |
| |
| #if defined (HANDLE_MULTIBYTE) |
| |
| #define WFOLD(c) (match_ignore_case && iswupper (c) ? towlower (c) : (c)) |
| |
| /* Match WPAT anywhere in WSTRING and return the match boundaries. |
| This returns 1 in case of a successful match, 0 otherwise. Wide |
| character version. */ |
| static int |
| match_wpattern (wstring, indices, wstrlen, wpat, mtype, sp, ep) |
| wchar_t *wstring; |
| char **indices; |
| size_t wstrlen; |
| wchar_t *wpat; |
| int mtype; |
| char **sp, **ep; |
| { |
| wchar_t wc, *wp, *nwpat, *wp1; |
| size_t len; |
| int mlen; |
| int n, n1, n2, simple; |
| |
| simple = (wpat[0] != L'\\' && wpat[0] != L'*' && wpat[0] != L'?' && wpat[0] != L'['); |
| #if defined (EXTENDED_GLOB) |
| if (extended_glob) |
| simple &= (wpat[1] != L'(' || (wpat[0] != L'*' && wpat[0] != L'?' && wpat[0] != L'+' && wpat[0] != L'!' && wpat[0] != L'@')); /*)*/ |
| #endif |
| |
| /* If the pattern doesn't match anywhere in the string, go ahead and |
| short-circuit right away. A minor optimization, saves a bunch of |
| unnecessary calls to strmatch (up to N calls for a string of N |
| characters) if the match is unsuccessful. To preserve the semantics |
| of the substring matches below, we make sure that the pattern has |
| `*' as first and last character, making a new pattern if necessary. */ |
| len = wcslen (wpat); |
| if (wpat[0] != L'*' || (wpat[0] == L'*' && wpat[1] == WLPAREN && extended_glob) || wpat[len - 1] != L'*') |
| { |
| int unescaped_backslash; |
| wchar_t *wpp; |
| |
| wp = nwpat = (wchar_t *)xmalloc ((len + 3) * sizeof (wchar_t)); |
| wp1 = wpat; |
| if (*wp1 != L'*' || (*wp1 == '*' && wp1[1] == WLPAREN && extended_glob)) |
| *wp++ = L'*'; |
| while (*wp1 != L'\0') |
| *wp++ = *wp1++; |
| #if 1 |
| /* See comments above in match_upattern. */ |
| if (wp1[-1] == L'*' && (unescaped_backslash = wp1[-2] == L'\\')) |
| { |
| wpp = wp1 - 3; |
| while (wpp >= wpat && *wpp-- == L'\\') |
| unescaped_backslash = 1 - unescaped_backslash; |
| if (unescaped_backslash) |
| *wp++ = L'*'; |
| } |
| else if (wp1[-1] != L'*') |
| *wp++ = L'*'; |
| #else |
| if (wp1[-1] != L'*' || wp1[-2] == L'\\') |
| *wp++ = L'*'; |
| #endif |
| *wp = '\0'; |
| } |
| else |
| nwpat = wpat; |
| len = wcsmatch (nwpat, wstring, FNMATCH_EXTFLAG | FNMATCH_IGNCASE); |
| if (nwpat != wpat) |
| free (nwpat); |
| if (len == FNM_NOMATCH) |
| return (0); |
| |
| mlen = wmatchlen (wpat, wstrlen); |
| if (mlen > (int)wstrlen) |
| return (0); |
| |
| /* itrace("wmatchlen (%ls) -> %d", wpat, mlen); */ |
| switch (mtype) |
| { |
| case MATCH_ANY: |
| for (n = 0; n <= wstrlen; n++) |
| { |
| n2 = simple ? (WFOLD(*wpat) == WFOLD(wstring[n])) : match_pattern_wchar (wpat, wstring + n, FNMATCH_IGNCASE); |
| if (n2) |
| { |
| n1 = (mlen == -1) ? wstrlen : n + mlen; |
| if (n1 > wstrlen) |
| break; |
| |
| for ( ; n1 >= n; n1--) |
| { |
| wc = wstring[n1]; wstring[n1] = L'\0'; |
| if (wcsmatch (wpat, wstring + n, FNMATCH_EXTFLAG | FNMATCH_IGNCASE) == 0) |
| { |
| wstring[n1] = wc; |
| *sp = indices[n]; |
| *ep = indices[n1]; |
| return 1; |
| } |
| wstring[n1] = wc; |
| /* If MLEN != -1, we have a fixed length pattern. */ |
| if (mlen != -1) |
| break; |
| } |
| } |
| } |
| |
| return (0); |
| |
| case MATCH_BEG: |
| if (match_pattern_wchar (wpat, wstring, FNMATCH_IGNCASE) == 0) |
| return (0); |
| |
| for (n = (mlen == -1) ? wstrlen : mlen; n >= 0; n--) |
| { |
| wc = wstring[n]; wstring[n] = L'\0'; |
| if (wcsmatch (wpat, wstring, FNMATCH_EXTFLAG | FNMATCH_IGNCASE) == 0) |
| { |
| wstring[n] = wc; |
| *sp = indices[0]; |
| *ep = indices[n]; |
| return 1; |
| } |
| wstring[n] = wc; |
| /* If MLEN != -1, we have a fixed length pattern. */ |
| if (mlen != -1) |
| break; |
| } |
| |
| return (0); |
| |
| case MATCH_END: |
| for (n = wstrlen - ((mlen == -1) ? wstrlen : mlen); n <= wstrlen; n++) |
| { |
| if (wcsmatch (wpat, wstring + n, FNMATCH_EXTFLAG | FNMATCH_IGNCASE) == 0) |
| { |
| *sp = indices[n]; |
| *ep = indices[wstrlen]; |
| return 1; |
| } |
| /* If MLEN != -1, we have a fixed length pattern. */ |
| if (mlen != -1) |
| break; |
| } |
| |
| return (0); |
| } |
| |
| return (0); |
| } |
| #undef WFOLD |
| #endif /* HANDLE_MULTIBYTE */ |
| |
| static int |
| match_pattern (string, pat, mtype, sp, ep) |
| char *string, *pat; |
| int mtype; |
| char **sp, **ep; |
| { |
| #if defined (HANDLE_MULTIBYTE) |
| int ret; |
| size_t n; |
| wchar_t *wstring, *wpat; |
| char **indices; |
| #endif |
| |
| if (string == 0 || pat == 0 || *pat == 0) |
| return (0); |
| |
| #if defined (HANDLE_MULTIBYTE) |
| if (MB_CUR_MAX > 1) |
| { |
| if (mbsmbchar (string) == 0 && mbsmbchar (pat) == 0) |
| return (match_upattern (string, pat, mtype, sp, ep)); |
| |
| n = xdupmbstowcs (&wpat, NULL, pat); |
| if (n == (size_t)-1) |
| return (match_upattern (string, pat, mtype, sp, ep)); |
| n = xdupmbstowcs (&wstring, &indices, string); |
| if (n == (size_t)-1) |
| { |
| free (wpat); |
| return (match_upattern (string, pat, mtype, sp, ep)); |
| } |
| ret = match_wpattern (wstring, indices, n, wpat, mtype, sp, ep); |
| |
| free (wpat); |
| free (wstring); |
| free (indices); |
| |
| return (ret); |
| } |
| else |
| #endif |
| return (match_upattern (string, pat, mtype, sp, ep)); |
| } |
| |
| static int |
| getpatspec (c, value) |
| int c; |
| char *value; |
| { |
| if (c == '#') |
| return ((*value == '#') ? RP_LONG_LEFT : RP_SHORT_LEFT); |
| else /* c == '%' */ |
| return ((*value == '%') ? RP_LONG_RIGHT : RP_SHORT_RIGHT); |
| } |
| |
| /* Posix.2 says that the WORD should be run through tilde expansion, |
| parameter expansion, command substitution and arithmetic expansion. |
| This leaves the result quoted, so quote_string_for_globbing () has |
| to be called to fix it up for strmatch (). If QUOTED is non-zero, |
| it means that the entire expression was enclosed in double quotes. |
| This means that quoting characters in the pattern do not make any |
| special pattern characters quoted. For example, the `*' in the |
| following retains its special meaning: "${foo#'*'}". */ |
| static char * |
| getpattern (value, quoted, expandpat) |
| char *value; |
| int quoted, expandpat; |
| { |
| char *pat, *tword; |
| WORD_LIST *l; |
| #if 0 |
| int i; |
| #endif |
| /* There is a problem here: how to handle single or double quotes in the |
| pattern string when the whole expression is between double quotes? |
| POSIX.2 says that enclosing double quotes do not cause the pattern to |
| be quoted, but does that leave us a problem with @ and array[@] and their |
| expansions inside a pattern? */ |
| #if 0 |
| if (expandpat && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && *tword) |
| { |
| i = 0; |
| pat = string_extract_double_quoted (tword, &i, SX_STRIPDQ); |
| free (tword); |
| tword = pat; |
| } |
| #endif |
| |
| /* expand_string_for_pat () leaves WORD quoted and does not perform |
| word splitting. */ |
| l = *value ? expand_string_for_pat (value, |
| (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) ? Q_PATQUOTE : quoted, |
| (int *)NULL, (int *)NULL) |
| : (WORD_LIST *)0; |
| if (l) |
| word_list_remove_quoted_nulls (l); |
| pat = string_list (l); |
| dispose_words (l); |
| if (pat) |
| { |
| tword = quote_string_for_globbing (pat, QGLOB_CVTNULL); |
| free (pat); |
| pat = tword; |
| } |
| return (pat); |
| } |
| |
| #if 0 |
| /* Handle removing a pattern from a string as a result of ${name%[%]value} |
| or ${name#[#]value}. */ |
| static char * |
| variable_remove_pattern (value, pattern, patspec, quoted) |
| char *value, *pattern; |
| int patspec, quoted; |
| { |
| char *tword; |
| |
| tword = remove_pattern (value, pattern, patspec); |
| |
| return (tword); |
| } |
| #endif |
| |
| static char * |
| list_remove_pattern (list, pattern, patspec, itype, quoted) |
| WORD_LIST *list; |
| char *pattern; |
| int patspec, itype, quoted; |
| { |
| WORD_LIST *new, *l; |
| WORD_DESC *w; |
| char *tword; |
| |
| for (new = (WORD_LIST *)NULL, l = list; l; l = l->next) |
| { |
| tword = remove_pattern (l->word->word, pattern, patspec); |
| w = alloc_word_desc (); |
| w->word = tword ? tword : savestring (""); |
| new = make_word_list (w, new); |
| } |
| |
| l = REVERSE_LIST (new, WORD_LIST *); |
| tword = string_list_pos_params (itype, l, quoted, 0); |
| dispose_words (l); |
| |
| return (tword); |
| } |
| |
| static char * |
| parameter_list_remove_pattern (itype, pattern, patspec, quoted) |
| int itype; |
| char *pattern; |
| int patspec, quoted; |
| { |
| char *ret; |
| WORD_LIST *list; |
| |
| list = list_rest_of_args (); |
| if (list == 0) |
| return ((char *)NULL); |
| ret = list_remove_pattern (list, pattern, patspec, itype, quoted); |
| dispose_words (list); |
| return (ret); |
| } |
| |
| #if defined (ARRAY_VARS) |
| static char * |
| array_remove_pattern (var, pattern, patspec, starsub, quoted) |
| SHELL_VAR *var; |
| char *pattern; |
| int patspec; |
| int starsub; /* so we can figure out how it's indexed */ |
| int quoted; |
| { |
| ARRAY *a; |
| HASH_TABLE *h; |
| int itype; |
| char *ret; |
| WORD_LIST *list; |
| SHELL_VAR *v; |
| |
| v = var; /* XXX - for now */ |
| |
| itype = starsub ? '*' : '@'; |
| |
| a = (v && array_p (v)) ? array_cell (v) : 0; |
| h = (v && assoc_p (v)) ? assoc_cell (v) : 0; |
| |
| list = a ? array_to_word_list (a) : (h ? assoc_to_word_list (h) : 0); |
| if (list == 0) |
| return ((char *)NULL); |
| ret = list_remove_pattern (list, pattern, patspec, itype, quoted); |
| dispose_words (list); |
| |
| return ret; |
| } |
| #endif /* ARRAY_VARS */ |
| |
| static char * |
| parameter_brace_remove_pattern (varname, value, ind, patstr, rtype, quoted, flags) |
| char *varname, *value; |
| int ind; |
| char *patstr; |
| int rtype, quoted, flags; |
| { |
| int vtype, patspec, starsub; |
| char *temp1, *val, *pattern, *oname; |
| SHELL_VAR *v; |
| |
| if (value == 0) |
| return ((char *)NULL); |
| |
| oname = this_command_name; |
| this_command_name = varname; |
| |
| vtype = get_var_and_type (varname, value, ind, quoted, flags, &v, &val); |
| if (vtype == -1) |
| { |
| this_command_name = oname; |
| return ((char *)NULL); |
| } |
| |
| starsub = vtype & VT_STARSUB; |
| vtype &= ~VT_STARSUB; |
| |
| patspec = getpatspec (rtype, patstr); |
| if (patspec == RP_LONG_LEFT || patspec == RP_LONG_RIGHT) |
| patstr++; |
| |
| /* Need to pass getpattern newly-allocated memory in case of expansion -- |
| the expansion code will free the passed string on an error. */ |
| temp1 = savestring (patstr); |
| pattern = getpattern (temp1, quoted, 1); |
| free (temp1); |
| |
| temp1 = (char *)NULL; /* shut up gcc */ |
| switch (vtype) |
| { |
| case VT_VARIABLE: |
| case VT_ARRAYMEMBER: |
| temp1 = remove_pattern (val, pattern, patspec); |
| if (vtype == VT_VARIABLE) |
| FREE (val); |
| if (temp1) |
| { |
| val = (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| ? quote_string (temp1) |
| : quote_escapes (temp1); |
| free (temp1); |
| temp1 = val; |
| } |
| break; |
| #if defined (ARRAY_VARS) |
| case VT_ARRAYVAR: |
| temp1 = array_remove_pattern (v, pattern, patspec, starsub, quoted); |
| if (temp1 && ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0)) |
| { |
| val = quote_escapes (temp1); |
| free (temp1); |
| temp1 = val; |
| } |
| break; |
| #endif |
| case VT_POSPARMS: |
| temp1 = parameter_list_remove_pattern (varname[0], pattern, patspec, quoted); |
| if (temp1 && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp1 && ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0)) |
| { |
| val = quote_escapes (temp1); |
| free (temp1); |
| temp1 = val; |
| } |
| break; |
| } |
| |
| this_command_name = oname; |
| |
| FREE (pattern); |
| return temp1; |
| } |
| |
| #if defined (PROCESS_SUBSTITUTION) |
| |
| static void reap_some_procsubs PARAMS((int)); |
| |
| /*****************************************************************/ |
| /* */ |
| /* Hacking Process Substitution */ |
| /* */ |
| /*****************************************************************/ |
| |
| #if !defined (HAVE_DEV_FD) |
| /* Named pipes must be removed explicitly with `unlink'. This keeps a list |
| of FIFOs the shell has open. unlink_fifo_list will walk the list and |
| unlink the ones that don't have a living process on the other end. |
| unlink_all_fifos will walk the list and unconditionally unlink them, trying |
| to open and close the FIFO first to release any child processes sleeping on |
| the FIFO. add_fifo_list adds the name of an open FIFO to the list. |
| NFIFO is a count of the number of FIFOs in the list. */ |
| #define FIFO_INCR 20 |
| |
| /* PROC value of -1 means the process has been reaped and the FIFO needs to |
| be removed. PROC value of 0 means the slot is unused. */ |
| struct temp_fifo { |
| char *file; |
| pid_t proc; |
| }; |
| |
| static struct temp_fifo *fifo_list = (struct temp_fifo *)NULL; |
| static int nfifo; |
| static int fifo_list_size; |
| |
| void |
| clear_fifo_list () |
| { |
| int i; |
| |
| for (i = 0; i < fifo_list_size; i++) |
| { |
| if (fifo_list[i].file) |
| free (fifo_list[i].file); |
| fifo_list[i].file = NULL; |
| fifo_list[i].proc = 0; |
| } |
| nfifo = 0; |
| } |
| |
| void * |
| copy_fifo_list (sizep) |
| int *sizep; |
| { |
| if (sizep) |
| *sizep = 0; |
| return (void *)NULL; |
| } |
| |
| static void |
| add_fifo_list (pathname) |
| char *pathname; |
| { |
| int osize, i; |
| |
| if (nfifo >= fifo_list_size - 1) |
| { |
| osize = fifo_list_size; |
| fifo_list_size += FIFO_INCR; |
| fifo_list = (struct temp_fifo *)xrealloc (fifo_list, |
| fifo_list_size * sizeof (struct temp_fifo)); |
| for (i = osize; i < fifo_list_size; i++) |
| { |
| fifo_list[i].file = (char *)NULL; |
| fifo_list[i].proc = 0; /* unused */ |
| } |
| } |
| |
| fifo_list[nfifo].file = savestring (pathname); |
| nfifo++; |
| } |
| |
| void |
| unlink_fifo (i) |
| int i; |
| { |
| if ((fifo_list[i].proc == (pid_t)-1) || (fifo_list[i].proc > 0 && (kill(fifo_list[i].proc, 0) == -1))) |
| { |
| unlink (fifo_list[i].file); |
| free (fifo_list[i].file); |
| fifo_list[i].file = (char *)NULL; |
| fifo_list[i].proc = 0; |
| } |
| } |
| |
| void |
| unlink_fifo_list () |
| { |
| int saved, i, j; |
| |
| if (nfifo == 0) |
| return; |
| |
| for (i = saved = 0; i < nfifo; i++) |
| { |
| if ((fifo_list[i].proc == (pid_t)-1) || (fifo_list[i].proc > 0 && (kill(fifo_list[i].proc, 0) == -1))) |
| { |
| unlink (fifo_list[i].file); |
| free (fifo_list[i].file); |
| fifo_list[i].file = (char *)NULL; |
| fifo_list[i].proc = 0; |
| } |
| else |
| saved++; |
| } |
| |
| /* If we didn't remove some of the FIFOs, compact the list. */ |
| if (saved) |
| { |
| for (i = j = 0; i < nfifo; i++) |
| if (fifo_list[i].file) |
| { |
| if (i != j) |
| { |
| fifo_list[j].file = fifo_list[i].file; |
| fifo_list[j].proc = fifo_list[i].proc; |
| fifo_list[i].file = (char *)NULL; |
| fifo_list[i].proc = 0; |
| } |
| j++; |
| } |
| nfifo = j; |
| } |
| else |
| nfifo = 0; |
| } |
| |
| void |
| unlink_all_fifos () |
| { |
| int i, fd; |
| |
| if (nfifo == 0) |
| return; |
| |
| for (i = 0; i < nfifo; i++) |
| { |
| fifo_list[i].proc = (pid_t)-1; |
| fd = open (fifo_list[i].file, O_RDWR|O_NONBLOCK); |
| unlink_fifo (i); |
| if (fd >= 0) |
| close (fd); |
| } |
| |
| nfifo = 0; |
| } |
| |
| /* Take LIST, which is a bitmap denoting active FIFOs in fifo_list |
| from some point in the past, and close all open FIFOs in fifo_list |
| that are not marked as active in LIST. If LIST is NULL, close |
| everything in fifo_list. LSIZE is the number of elements in LIST, in |
| case it's larger than fifo_list_size (size of fifo_list). */ |
| void |
| close_new_fifos (list, lsize) |
| void *list; |
| int lsize; |
| { |
| int i; |
| char *plist; |
| |
| if (list == 0) |
| { |
| unlink_fifo_list (); |
| return; |
| } |
| |
| for (plist = (char *)list, i = 0; i < lsize; i++) |
| if (plist[i] == 0 && i < fifo_list_size && fifo_list[i].proc != -1) |
| unlink_fifo (i); |
| |
| for (i = lsize; i < fifo_list_size; i++) |
| unlink_fifo (i); |
| } |
| |
| int |
| find_procsub_child (pid) |
| pid_t pid; |
| { |
| int i; |
| |
| for (i = 0; i < nfifo; i++) |
| if (fifo_list[i].proc == pid) |
| return i; |
| return -1; |
| } |
| |
| void |
| set_procsub_status (ind, pid, status) |
| int ind; |
| pid_t pid; |
| int status; |
| { |
| if (ind >= 0 && ind < nfifo) |
| fifo_list[ind].proc = (pid_t)-1; /* sentinel */ |
| } |
| |
| /* If we've marked the process for this procsub as dead, close the |
| associated file descriptor and delete the FIFO. */ |
| static void |
| reap_some_procsubs (max) |
| int max; |
| { |
| int i; |
| |
| for (i = 0; i < max; i++) |
| if (fifo_list[i].proc == (pid_t)-1) /* reaped */ |
| unlink_fifo (i); |
| } |
| |
| void |
| reap_procsubs () |
| { |
| reap_some_procsubs (nfifo); |
| } |
| |
| #if 0 |
| /* UNUSED */ |
| void |
| wait_procsubs () |
| { |
| int i, r; |
| |
| for (i = 0; i < nfifo; i++) |
| { |
| if (fifo_list[i].proc != (pid_t)-1 && fifo_list[i].proc > 0) |
| { |
| r = wait_for (fifo_list[i].proc, 0); |
| save_proc_status (fifo_list[i].proc, r); |
| fifo_list[i].proc = (pid_t)-1; |
| } |
| } |
| } |
| #endif |
| |
| int |
| fifos_pending () |
| { |
| return nfifo; |
| } |
| |
| int |
| num_fifos () |
| { |
| return nfifo; |
| } |
| |
| static char * |
| make_named_pipe () |
| { |
| char *tname; |
| |
| tname = sh_mktmpname ("sh-np", MT_USERANDOM|MT_USETMPDIR); |
| if (mkfifo (tname, 0600) < 0) |
| { |
| free (tname); |
| return ((char *)NULL); |
| } |
| |
| add_fifo_list (tname); |
| return (tname); |
| } |
| |
| #else /* HAVE_DEV_FD */ |
| |
| /* DEV_FD_LIST is a bitmap of file descriptors attached to pipes the shell |
| has open to children. NFDS is a count of the number of bits currently |
| set in DEV_FD_LIST. TOTFDS is a count of the highest possible number |
| of open files. */ |
| /* dev_fd_list[I] value of -1 means the process has been reaped and file |
| descriptor I needs to be closed. Value of 0 means the slot is unused. */ |
| |
| static pid_t *dev_fd_list = (pid_t *)NULL; |
| static int nfds; |
| static int totfds; /* The highest possible number of open files. */ |
| |
| void |
| clear_fifo (i) |
| int i; |
| { |
| if (dev_fd_list[i]) |
| { |
| dev_fd_list[i] = 0; |
| nfds--; |
| } |
| } |
| |
| void |
| clear_fifo_list () |
| { |
| register int i; |
| |
| if (nfds == 0) |
| return; |
| |
| for (i = 0; nfds && i < totfds; i++) |
| clear_fifo (i); |
| |
| nfds = 0; |
| } |
| |
| void * |
| copy_fifo_list (sizep) |
| int *sizep; |
| { |
| void *ret; |
| |
| if (nfds == 0 || totfds == 0) |
| { |
| if (sizep) |
| *sizep = 0; |
| return (void *)NULL; |
| } |
| |
| if (sizep) |
| *sizep = totfds; |
| ret = xmalloc (totfds * sizeof (pid_t)); |
| return (memcpy (ret, dev_fd_list, totfds * sizeof (pid_t))); |
| } |
| |
| static void |
| add_fifo_list (fd) |
| int fd; |
| { |
| if (dev_fd_list == 0 || fd >= totfds) |
| { |
| int ofds; |
| |
| ofds = totfds; |
| totfds = getdtablesize (); |
| if (totfds < 0 || totfds > 256) |
| totfds = 256; |
| if (fd >= totfds) |
| totfds = fd + 2; |
| |
| dev_fd_list = (pid_t *)xrealloc (dev_fd_list, totfds * sizeof (dev_fd_list[0])); |
| /* XXX - might need a loop for this */ |
| memset (dev_fd_list + ofds, '\0', (totfds - ofds) * sizeof (pid_t)); |
| } |
| |
| dev_fd_list[fd] = 1; /* marker; updated later */ |
| nfds++; |
| } |
| |
| int |
| fifos_pending () |
| { |
| return 0; /* used for cleanup; not needed with /dev/fd */ |
| } |
| |
| int |
| num_fifos () |
| { |
| return nfds; |
| } |
| |
| void |
| unlink_fifo (fd) |
| int fd; |
| { |
| if (dev_fd_list[fd]) |
| { |
| close (fd); |
| dev_fd_list[fd] = 0; |
| nfds--; |
| } |
| } |
| |
| void |
| unlink_fifo_list () |
| { |
| register int i; |
| |
| if (nfds == 0) |
| return; |
| |
| for (i = totfds-1; nfds && i >= 0; i--) |
| unlink_fifo (i); |
| |
| nfds = 0; |
| } |
| |
| void |
| unlink_all_fifos () |
| { |
| unlink_fifo_list (); |
| } |
| |
| /* Take LIST, which is a snapshot copy of dev_fd_list from some point in |
| the past, and close all open fds in dev_fd_list that are not marked |
| as open in LIST. If LIST is NULL, close everything in dev_fd_list. |
| LSIZE is the number of elements in LIST, in case it's larger than |
| totfds (size of dev_fd_list). */ |
| void |
| close_new_fifos (list, lsize) |
| void *list; |
| int lsize; |
| { |
| int i; |
| pid_t *plist; |
| |
| if (list == 0) |
| { |
| unlink_fifo_list (); |
| return; |
| } |
| |
| for (plist = (pid_t *)list, i = 0; i < lsize; i++) |
| if (plist[i] == 0 && i < totfds && dev_fd_list[i]) |
| unlink_fifo (i); |
| |
| for (i = lsize; i < totfds; i++) |
| unlink_fifo (i); |
| } |
| |
| int |
| find_procsub_child (pid) |
| pid_t pid; |
| { |
| int i; |
| |
| if (nfds == 0) |
| return -1; |
| |
| for (i = 0; i < totfds; i++) |
| if (dev_fd_list[i] == pid) |
| return i; |
| |
| return -1; |
| } |
| |
| void |
| set_procsub_status (ind, pid, status) |
| int ind; |
| pid_t pid; |
| int status; |
| { |
| if (ind >= 0 && ind < totfds) |
| dev_fd_list[ind] = (pid_t)-1; /* sentinel */ |
| } |
| |
| /* If we've marked the process for this procsub as dead, close the |
| associated file descriptor. */ |
| static void |
| reap_some_procsubs (max) |
| int max; |
| { |
| int i; |
| |
| for (i = 0; nfds > 0 && i < max; i++) |
| if (dev_fd_list[i] == (pid_t)-1) |
| unlink_fifo (i); |
| } |
| |
| void |
| reap_procsubs () |
| { |
| reap_some_procsubs (totfds); |
| } |
| |
| #if 0 |
| /* UNUSED */ |
| void |
| wait_procsubs () |
| { |
| int i, r; |
| |
| for (i = 0; nfds > 0 && i < totfds; i++) |
| { |
| if (dev_fd_list[i] != (pid_t)-1 && dev_fd_list[i] > 0) |
| { |
| r = wait_for (dev_fd_list[i], 0); |
| save_proc_status (dev_fd_list[i], r); |
| dev_fd_list[i] = (pid_t)-1; |
| } |
| } |
| } |
| #endif |
| |
| #if defined (NOTDEF) |
| print_dev_fd_list () |
| { |
| register int i; |
| |
| fprintf (stderr, "pid %ld: dev_fd_list:", (long)getpid ()); |
| fflush (stderr); |
| |
| for (i = 0; i < totfds; i++) |
| { |
| if (dev_fd_list[i]) |
| fprintf (stderr, " %d", i); |
| } |
| fprintf (stderr, "\n"); |
| } |
| #endif /* NOTDEF */ |
| |
| static char * |
| make_dev_fd_filename (fd) |
| int fd; |
| { |
| char *ret, intbuf[INT_STRLEN_BOUND (int) + 1], *p; |
| |
| ret = (char *)xmalloc (sizeof (DEV_FD_PREFIX) + 8); |
| |
| strcpy (ret, DEV_FD_PREFIX); |
| p = inttostr (fd, intbuf, sizeof (intbuf)); |
| strcpy (ret + sizeof (DEV_FD_PREFIX) - 1, p); |
| |
| add_fifo_list (fd); |
| return (ret); |
| } |
| |
| #endif /* HAVE_DEV_FD */ |
| |
| /* Return a filename that will open a connection to the process defined by |
| executing STRING. HAVE_DEV_FD, if defined, means open a pipe and return |
| a filename in /dev/fd corresponding to a descriptor that is one of the |
| ends of the pipe. If not defined, we use named pipes on systems that have |
| them. Systems without /dev/fd and named pipes are out of luck. |
| |
| OPEN_FOR_READ_IN_CHILD, if 1, means open the named pipe for reading or |
| use the read end of the pipe and dup that file descriptor to fd 0 in |
| the child. If OPEN_FOR_READ_IN_CHILD is 0, we open the named pipe for |
| writing or use the write end of the pipe in the child, and dup that |
| file descriptor to fd 1 in the child. The parent does the opposite. */ |
| |
| static char * |
| process_substitute (string, open_for_read_in_child) |
| char *string; |
| int open_for_read_in_child; |
| { |
| char *pathname; |
| int fd, result, rc, function_value; |
| pid_t old_pid, pid; |
| #if defined (HAVE_DEV_FD) |
| int parent_pipe_fd, child_pipe_fd; |
| int fildes[2]; |
| #endif /* HAVE_DEV_FD */ |
| #if defined (JOB_CONTROL) |
| pid_t old_pipeline_pgrp; |
| #endif |
| |
| if (!string || !*string || wordexp_only) |
| return ((char *)NULL); |
| |
| #if !defined (HAVE_DEV_FD) |
| pathname = make_named_pipe (); |
| #else /* HAVE_DEV_FD */ |
| if (pipe (fildes) < 0) |
| { |
| sys_error ("%s", _("cannot make pipe for process substitution")); |
| return ((char *)NULL); |
| } |
| /* If OPEN_FOR_READ_IN_CHILD == 1, we want to use the write end of |
| the pipe in the parent, otherwise the read end. */ |
| parent_pipe_fd = fildes[open_for_read_in_child]; |
| child_pipe_fd = fildes[1 - open_for_read_in_child]; |
| /* Move the parent end of the pipe to some high file descriptor, to |
| avoid clashes with FDs used by the script. */ |
| parent_pipe_fd = move_to_high_fd (parent_pipe_fd, 1, 64); |
| |
| pathname = make_dev_fd_filename (parent_pipe_fd); |
| #endif /* HAVE_DEV_FD */ |
| |
| if (pathname == 0) |
| { |
| sys_error ("%s", _("cannot make pipe for process substitution")); |
| return ((char *)NULL); |
| } |
| |
| old_pid = last_made_pid; |
| |
| #if defined (JOB_CONTROL) |
| old_pipeline_pgrp = pipeline_pgrp; |
| if (pipeline_pgrp == 0 || (subshell_environment & (SUBSHELL_PIPE|SUBSHELL_FORK|SUBSHELL_ASYNC)) == 0) |
| pipeline_pgrp = shell_pgrp; |
| save_pipeline (1); |
| #endif /* JOB_CONTROL */ |
| |
| pid = make_child ((char *)NULL, FORK_ASYNC); |
| if (pid == 0) |
| { |
| #if 0 |
| int old_interactive; |
| |
| old_interactive = interactive; |
| #endif |
| /* The currently-executing shell is not interactive */ |
| interactive = 0; |
| |
| reset_terminating_signals (); /* XXX */ |
| free_pushed_string_input (); |
| /* Cancel traps, in trap.c. */ |
| restore_original_signals (); /* XXX - what about special builtins? bash-4.2 */ |
| QUIT; /* catch any interrupts we got post-fork */ |
| setup_async_signals (); |
| #if 0 |
| if (open_for_read_in_child == 0 && old_interactive && (bash_input.type == st_stdin || bash_input.type == st_stream)) |
| async_redirect_stdin (); |
| #endif |
| |
| subshell_environment |= SUBSHELL_COMSUB|SUBSHELL_PROCSUB|SUBSHELL_ASYNC; |
| |
| /* We don't inherit the verbose option for command substitutions now, so |
| let's try it for process substitutions. */ |
| change_flag ('v', FLAG_OFF); |
| |
| /* if we're expanding a redirection, we shouldn't have access to the |
| temporary environment, but commands in the subshell should have |
| access to their own temporary environment. */ |
| if (expanding_redir) |
| flush_temporary_env (); |
| } |
| |
| #if defined (JOB_CONTROL) |
| set_sigchld_handler (); |
| stop_making_children (); |
| /* XXX - should we only do this in the parent? (as in command subst) */ |
| pipeline_pgrp = old_pipeline_pgrp; |
| #else |
| stop_making_children (); |
| #endif /* JOB_CONTROL */ |
| |
| if (pid < 0) |
| { |
| sys_error ("%s", _("cannot make child for process substitution")); |
| free (pathname); |
| #if defined (HAVE_DEV_FD) |
| close (parent_pipe_fd); |
| close (child_pipe_fd); |
| #endif /* HAVE_DEV_FD */ |
| #if defined (JOB_CONTROL) |
| restore_pipeline (1); |
| #endif |
| return ((char *)NULL); |
| } |
| |
| if (pid > 0) |
| { |
| #if defined (JOB_CONTROL) |
| last_procsub_child = restore_pipeline (0); |
| /* We assume that last_procsub_child->next == last_procsub_child because |
| of how jobs.c:add_process() works. */ |
| last_procsub_child->next = 0; |
| procsub_add (last_procsub_child); |
| #endif |
| |
| #if defined (HAVE_DEV_FD) |
| dev_fd_list[parent_pipe_fd] = pid; |
| #else |
| fifo_list[nfifo-1].proc = pid; |
| #endif |
| |
| last_made_pid = old_pid; |
| |
| #if defined (JOB_CONTROL) && defined (PGRP_PIPE) |
| close_pgrp_pipe (); |
| #endif /* JOB_CONTROL && PGRP_PIPE */ |
| |
| #if defined (HAVE_DEV_FD) |
| close (child_pipe_fd); |
| #endif /* HAVE_DEV_FD */ |
| |
| return (pathname); |
| } |
| |
| set_sigint_handler (); |
| |
| #if defined (JOB_CONTROL) |
| /* make sure we don't have any job control */ |
| set_job_control (0); |
| |
| /* Clear out any existing list of process substitutions */ |
| procsub_clear (); |
| |
| /* The idea is that we want all the jobs we start from an async process |
| substitution to be in the same process group, but not the same pgrp |
| as our parent shell, since we don't want to affect our parent shell's |
| jobs if we get a SIGHUP and end up calling hangup_all_jobs, for example. |
| If pipeline_pgrp != shell_pgrp, we assume that there is a job control |
| shell somewhere in our parent process chain (since make_child initializes |
| pipeline_pgrp to shell_pgrp if job_control == 0). What we do in this |
| case is to set pipeline_pgrp to our PID, so all jobs started by this |
| process have that same pgrp and we are basically the process group leader. |
| This should not have negative effects on child processes surviving |
| after we exit, since we wait for the children we create, but that is |
| something to watch for. */ |
| |
| if (pipeline_pgrp != shell_pgrp) |
| pipeline_pgrp = getpid (); |
| #endif /* JOB_CONTROL */ |
| |
| #if !defined (HAVE_DEV_FD) |
| /* Open the named pipe in the child. */ |
| fd = open (pathname, open_for_read_in_child ? O_RDONLY : O_WRONLY); |
| if (fd < 0) |
| { |
| /* Two separate strings for ease of translation. */ |
| if (open_for_read_in_child) |
| sys_error (_("cannot open named pipe %s for reading"), pathname); |
| else |
| sys_error (_("cannot open named pipe %s for writing"), pathname); |
| |
| exit (127); |
| } |
| if (open_for_read_in_child) |
| { |
| if (sh_unset_nodelay_mode (fd) < 0) |
| { |
| sys_error (_("cannot reset nodelay mode for fd %d"), fd); |
| exit (127); |
| } |
| } |
| #else /* HAVE_DEV_FD */ |
| fd = child_pipe_fd; |
| #endif /* HAVE_DEV_FD */ |
| |
| /* Discard buffered stdio output before replacing the underlying file |
| descriptor. */ |
| if (open_for_read_in_child == 0) |
| fpurge (stdout); |
| |
| if (dup2 (fd, open_for_read_in_child ? 0 : 1) < 0) |
| { |
| sys_error (_("cannot duplicate named pipe %s as fd %d"), pathname, |
| open_for_read_in_child ? 0 : 1); |
| exit (127); |
| } |
| |
| if (fd != (open_for_read_in_child ? 0 : 1)) |
| close (fd); |
| |
| /* Need to close any files that this process has open to pipes inherited |
| from its parent. */ |
| if (current_fds_to_close) |
| { |
| close_fd_bitmap (current_fds_to_close); |
| current_fds_to_close = (struct fd_bitmap *)NULL; |
| } |
| |
| #if defined (HAVE_DEV_FD) |
| /* Make sure we close the parent's end of the pipe and clear the slot |
| in the fd list so it is not closed later, if reallocated by, for |
| instance, pipe(2). */ |
| close (parent_pipe_fd); |
| dev_fd_list[parent_pipe_fd] = 0; |
| #endif /* HAVE_DEV_FD */ |
| |
| /* subshells shouldn't have this flag, which controls using the temporary |
| environment for variable lookups. We have already flushed the temporary |
| environment above in the case we're expanding a redirection, so processes |
| executed by this command need to be able to set it independently of their |
| parent. */ |
| expanding_redir = 0; |
| |
| remove_quoted_escapes (string); |
| |
| #if 0 /* TAG: bash-5.2 */ |
| startup_state = 2; /* see if we can avoid a fork */ |
| parse_and_execute_level = 0; |
| #endif |
| |
| /* Give process substitution a place to jump back to on failure, |
| so we don't go back up to main (). */ |
| result = setjmp_nosigs (top_level); |
| |
| /* If we're running a process substitution inside a shell function, |
| trap `return' so we don't return from the function in the subshell |
| and go off to never-never land. */ |
| if (result == 0 && return_catch_flag) |
| function_value = setjmp_nosigs (return_catch); |
| else |
| function_value = 0; |
| |
| if (result == ERREXIT) |
| rc = last_command_exit_value; |
| else if (result == EXITPROG) |
| rc = last_command_exit_value; |
| else if (result) |
| rc = EXECUTION_FAILURE; |
| else if (function_value) |
| rc = return_catch_value; |
| else |
| { |
| subshell_level++; |
| rc = parse_and_execute (string, "process substitution", (SEVAL_NONINT|SEVAL_NOHIST)); |
| /* leave subshell level intact for any exit trap */ |
| } |
| |
| #if !defined (HAVE_DEV_FD) |
| /* Make sure we close the named pipe in the child before we exit. */ |
| close (open_for_read_in_child ? 0 : 1); |
| #endif /* !HAVE_DEV_FD */ |
| |
| last_command_exit_value = rc; |
| rc = run_exit_trap (); |
| exit (rc); |
| /*NOTREACHED*/ |
| } |
| #endif /* PROCESS_SUBSTITUTION */ |
| |
| /***********************************/ |
| /* */ |
| /* Command Substitution */ |
| /* */ |
| /***********************************/ |
| |
| static char * |
| read_comsub (fd, quoted, flags, rflag) |
| int fd, quoted, flags; |
| int *rflag; |
| { |
| char *istring, buf[512], *bufp; |
| int istring_index, c, tflag, skip_ctlesc, skip_ctlnul; |
| int mb_cur_max; |
| size_t istring_size; |
| ssize_t bufn; |
| int nullbyte; |
| #if defined (HANDLE_MULTIBYTE) |
| mbstate_t ps; |
| wchar_t wc; |
| size_t mblen; |
| int i; |
| #endif |
| |
| istring = (char *)NULL; |
| istring_index = istring_size = bufn = tflag = 0; |
| |
| skip_ctlesc = ifs_cmap[CTLESC]; |
| skip_ctlnul = ifs_cmap[CTLNUL]; |
| |
| mb_cur_max = MB_CUR_MAX; |
| nullbyte = 0; |
| |
| /* Read the output of the command through the pipe. */ |
| while (1) |
| { |
| if (fd < 0) |
| break; |
| if (--bufn <= 0) |
| { |
| bufn = zread (fd, buf, sizeof (buf)); |
| if (bufn <= 0) |
| break; |
| bufp = buf; |
| } |
| c = *bufp++; |
| |
| if (c == 0) |
| { |
| #if 1 |
| if (nullbyte == 0) |
| { |
| internal_warning ("%s", _("command substitution: ignored null byte in input")); |
| nullbyte = 1; |
| } |
| #endif |
| continue; |
| } |
| |
| /* Add the character to ISTRING, possibly after resizing it. */ |
| RESIZE_MALLOCED_BUFFER (istring, istring_index, mb_cur_max+1, istring_size, 512); |
| |
| /* This is essentially quote_string inline */ |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) /* || c == CTLESC || c == CTLNUL */) |
| istring[istring_index++] = CTLESC; |
| else if ((flags & PF_ASSIGNRHS) && skip_ctlesc && c == CTLESC) |
| istring[istring_index++] = CTLESC; |
| /* Escape CTLESC and CTLNUL in the output to protect those characters |
| from the rest of the word expansions (word splitting and globbing.) |
| This is essentially quote_escapes inline. */ |
| else if (skip_ctlesc == 0 && c == CTLESC) |
| istring[istring_index++] = CTLESC; |
| else if ((skip_ctlnul == 0 && c == CTLNUL) || (c == ' ' && (ifs_value && *ifs_value == 0))) |
| istring[istring_index++] = CTLESC; |
| |
| #if defined (HANDLE_MULTIBYTE) |
| if ((locale_utf8locale && (c & 0x80)) || |
| (locale_utf8locale == 0 && mb_cur_max > 1 && (unsigned char)c > 127)) |
| { |
| /* read a multibyte character from buf */ |
| /* punt on the hard case for now */ |
| memset (&ps, '\0', sizeof (mbstate_t)); |
| mblen = mbrtowc (&wc, bufp-1, bufn+1, &ps); |
| if (MB_INVALIDCH (mblen) || mblen == 0 || mblen == 1) |
| istring[istring_index++] = c; |
| else |
| { |
| istring[istring_index++] = c; |
| for (i = 0; i < mblen-1; i++) |
| istring[istring_index++] = *bufp++; |
| bufn -= mblen - 1; |
| } |
| continue; |
| } |
| #endif |
| |
| istring[istring_index++] = c; |
| } |
| |
| if (istring) |
| istring[istring_index] = '\0'; |
| |
| /* If we read no output, just return now and save ourselves some |
| trouble. */ |
| if (istring_index == 0) |
| { |
| FREE (istring); |
| if (rflag) |
| *rflag = tflag; |
| return (char *)NULL; |
| } |
| |
| /* Strip trailing newlines from the output of the command. */ |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| { |
| while (istring_index > 0) |
| { |
| if (istring[istring_index - 1] == '\n') |
| { |
| --istring_index; |
| |
| /* If the newline was quoted, remove the quoting char. */ |
| if (istring[istring_index - 1] == CTLESC) |
| --istring_index; |
| } |
| else |
| break; |
| } |
| istring[istring_index] = '\0'; |
| } |
| else |
| strip_trailing (istring, istring_index - 1, 1); |
| |
| if (rflag) |
| *rflag = tflag; |
| return istring; |
| } |
| |
| /* Perform command substitution on STRING. This returns a WORD_DESC * with the |
| contained string possibly quoted. */ |
| WORD_DESC * |
| command_substitute (string, quoted, flags) |
| char *string; |
| int quoted; |
| int flags; |
| { |
| pid_t pid, old_pid, old_pipeline_pgrp, old_async_pid; |
| char *istring, *s; |
| int result, fildes[2], function_value, pflags, rc, tflag, fork_flags; |
| WORD_DESC *ret; |
| sigset_t set, oset; |
| |
| istring = (char *)NULL; |
| |
| /* Don't fork () if there is no need to. In the case of no command to |
| run, just return NULL. */ |
| #if 1 |
| for (s = string; s && *s && (shellblank (*s) || *s == '\n'); s++) |
| ; |
| if (s == 0 || *s == 0) |
| return ((WORD_DESC *)NULL); |
| #else |
| if (!string || !*string || (string[0] == '\n' && !string[1])) |
| return ((WORD_DESC *)NULL); |
| #endif |
| |
| if (wordexp_only && read_but_dont_execute) |
| { |
| last_command_exit_value = EX_WEXPCOMSUB; |
| jump_to_top_level (EXITPROG); |
| } |
| |
| /* We're making the assumption here that the command substitution will |
| eventually run a command from the file system. Since we'll run |
| maybe_make_export_env in this subshell before executing that command, |
| the parent shell and any other shells it starts will have to remake |
| the environment. If we make it before we fork, other shells won't |
| have to. Don't bother if we have any temporary variable assignments, |
| though, because the export environment will be remade after this |
| command completes anyway, but do it if all the words to be expanded |
| are variable assignments. */ |
| if (subst_assign_varlist == 0 || garglist == 0) |
| maybe_make_export_env (); /* XXX */ |
| |
| /* Flags to pass to parse_and_execute() */ |
| pflags = (interactive && sourcelevel == 0) ? SEVAL_RESETLINE : 0; |
| |
| old_pid = last_made_pid; |
| |
| /* Pipe the output of executing STRING into the current shell. */ |
| if (pipe (fildes) < 0) |
| { |
| sys_error ("%s", _("cannot make pipe for command substitution")); |
| goto error_exit; |
| } |
| |
| #if defined (JOB_CONTROL) |
| old_pipeline_pgrp = pipeline_pgrp; |
| /* Don't reset the pipeline pgrp if we're already a subshell in a pipeline. */ |
| if ((subshell_environment & SUBSHELL_PIPE) == 0) |
| pipeline_pgrp = shell_pgrp; |
| cleanup_the_pipeline (); |
| #endif /* JOB_CONTROL */ |
| |
| old_async_pid = last_asynchronous_pid; |
| fork_flags = (subshell_environment&SUBSHELL_ASYNC) ? FORK_ASYNC : 0; |
| pid = make_child ((char *)NULL, fork_flags|FORK_NOTERM); |
| last_asynchronous_pid = old_async_pid; |
| |
| if (pid == 0) |
| { |
| /* Reset the signal handlers in the child, but don't free the |
| trap strings. Set a flag noting that we have to free the |
| trap strings if we run trap to change a signal disposition. */ |
| reset_signal_handlers (); |
| if (ISINTERRUPT) |
| { |
| kill (getpid (), SIGINT); |
| CLRINTERRUPT; /* if we're ignoring SIGINT somehow */ |
| } |
| QUIT; /* catch any interrupts we got post-fork */ |
| subshell_environment |= SUBSHELL_RESETTRAP; |
| } |
| |
| #if defined (JOB_CONTROL) |
| /* XXX DO THIS ONLY IN PARENT ? XXX */ |
| set_sigchld_handler (); |
| stop_making_children (); |
| if (pid != 0) |
| pipeline_pgrp = old_pipeline_pgrp; |
| #else |
| stop_making_children (); |
| #endif /* JOB_CONTROL */ |
| |
| if (pid < 0) |
| { |
| sys_error (_("cannot make child for command substitution")); |
| error_exit: |
| |
| last_made_pid = old_pid; |
| |
| FREE (istring); |
| close (fildes[0]); |
| close (fildes[1]); |
| return ((WORD_DESC *)NULL); |
| } |
| |
| if (pid == 0) |
| { |
| /* The currently executing shell is not interactive. */ |
| interactive = 0; |
| |
| set_sigint_handler (); /* XXX */ |
| |
| free_pushed_string_input (); |
| |
| /* Discard buffered stdio output before replacing the underlying file |
| descriptor. */ |
| fpurge (stdout); |
| |
| if (dup2 (fildes[1], 1) < 0) |
| { |
| sys_error ("%s", _("command_substitute: cannot duplicate pipe as fd 1")); |
| exit (EXECUTION_FAILURE); |
| } |
| |
| /* If standard output is closed in the parent shell |
| (such as after `exec >&-'), file descriptor 1 will be |
| the lowest available file descriptor, and end up in |
| fildes[0]. This can happen for stdin and stderr as well, |
| but stdout is more important -- it will cause no output |
| to be generated from this command. */ |
| if ((fildes[1] != fileno (stdin)) && |
| (fildes[1] != fileno (stdout)) && |
| (fildes[1] != fileno (stderr))) |
| close (fildes[1]); |
| |
| if ((fildes[0] != fileno (stdin)) && |
| (fildes[0] != fileno (stdout)) && |
| (fildes[0] != fileno (stderr))) |
| close (fildes[0]); |
| |
| #ifdef __CYGWIN__ |
| /* Let stdio know the fd may have changed from text to binary mode, and |
| make sure to preserve stdout line buffering. */ |
| freopen (NULL, "w", stdout); |
| sh_setlinebuf (stdout); |
| #endif /* __CYGWIN__ */ |
| |
| /* This is a subshell environment. */ |
| subshell_environment |= SUBSHELL_COMSUB; |
| |
| /* Many shells do not appear to inherit the -v option for command |
| substitutions. */ |
| change_flag ('v', FLAG_OFF); |
| |
| /* When inherit_errexit option is not enabled, command substitution does |
| not inherit the -e flag. It is enabled when Posix mode is enabled */ |
| if (inherit_errexit == 0) |
| { |
| builtin_ignoring_errexit = 0; |
| change_flag ('e', FLAG_OFF); |
| } |
| set_shellopts (); |
| |
| /* If we are expanding a redirection, we can dispose of any temporary |
| environment we received, since redirections are not supposed to have |
| access to the temporary environment. We will have to see whether this |
| affects temporary environments supplied to `eval', but the temporary |
| environment gets copied to builtin_env at some point. */ |
| if (expanding_redir) |
| { |
| flush_temporary_env (); |
| expanding_redir = 0; |
| } |
| |
| remove_quoted_escapes (string); |
| |
| startup_state = 2; /* see if we can avoid a fork */ |
| parse_and_execute_level = 0; |
| |
| /* Give command substitution a place to jump back to on failure, |
| so we don't go back up to main (). */ |
| result = setjmp_nosigs (top_level); |
| |
| /* If we're running a command substitution inside a shell function, |
| trap `return' so we don't return from the function in the subshell |
| and go off to never-never land. */ |
| if (result == 0 && return_catch_flag) |
| function_value = setjmp_nosigs (return_catch); |
| else |
| function_value = 0; |
| |
| if (result == ERREXIT) |
| rc = last_command_exit_value; |
| else if (result == EXITPROG) |
| rc = last_command_exit_value; |
| else if (result) |
| rc = EXECUTION_FAILURE; |
| else if (function_value) |
| rc = return_catch_value; |
| else |
| { |
| subshell_level++; |
| rc = parse_and_execute (string, "command substitution", pflags|SEVAL_NOHIST); |
| /* leave subshell level intact for any exit trap */ |
| } |
| |
| last_command_exit_value = rc; |
| rc = run_exit_trap (); |
| #if defined (PROCESS_SUBSTITUTION) |
| unlink_fifo_list (); |
| #endif |
| exit (rc); |
| } |
| else |
| { |
| int dummyfd; |
| |
| #if defined (JOB_CONTROL) && defined (PGRP_PIPE) |
| close_pgrp_pipe (); |
| #endif /* JOB_CONTROL && PGRP_PIPE */ |
| |
| close (fildes[1]); |
| |
| begin_unwind_frame ("read-comsub"); |
| dummyfd = fildes[0]; |
| add_unwind_protect (close, dummyfd); |
| |
| /* Block SIGINT while we're reading from the pipe. If the child |
| process gets a SIGINT, it will either handle it or die, and the |
| read will return. */ |
| BLOCK_SIGNAL (SIGINT, set, oset); |
| tflag = 0; |
| istring = read_comsub (fildes[0], quoted, flags, &tflag); |
| |
| close (fildes[0]); |
| discard_unwind_frame ("read-comsub"); |
| UNBLOCK_SIGNAL (oset); |
| |
| current_command_subst_pid = pid; |
| last_command_exit_value = wait_for (pid, JWAIT_NOTERM); |
| last_command_subst_pid = pid; |
| last_made_pid = old_pid; |
| |
| #if defined (JOB_CONTROL) |
| /* If last_command_exit_value > 128, then the substituted command |
| was terminated by a signal. If that signal was SIGINT, then send |
| SIGINT to ourselves. This will break out of loops, for instance. */ |
| if (last_command_exit_value == (128 + SIGINT) && last_command_exit_signal == SIGINT) |
| kill (getpid (), SIGINT); |
| #endif /* JOB_CONTROL */ |
| |
| ret = alloc_word_desc (); |
| ret->word = istring; |
| ret->flags = tflag; |
| |
| return ret; |
| } |
| } |
| |
| /******************************************************** |
| * * |
| * Utility functions for parameter expansion * |
| * * |
| ********************************************************/ |
| |
| #if defined (ARRAY_VARS) |
| |
| static arrayind_t |
| array_length_reference (s) |
| char *s; |
| { |
| int len; |
| arrayind_t ind; |
| char *akey; |
| char *t, c; |
| ARRAY *array; |
| HASH_TABLE *h; |
| SHELL_VAR *var; |
| |
| var = array_variable_part (s, 0, &t, &len); |
| |
| /* If unbound variables should generate an error, report one and return |
| failure. */ |
| if ((var == 0 || invisible_p (var) || (assoc_p (var) == 0 && array_p (var) == 0)) && unbound_vars_is_error) |
| { |
| c = *--t; |
| *t = '\0'; |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (s); |
| *t = c; |
| return (-1); |
| } |
| else if (var == 0 || invisible_p (var)) |
| return 0; |
| |
| /* We support a couple of expansions for variables that are not arrays. |
| We'll return the length of the value for v[0], and 1 for v[@] or |
| v[*]. Return 0 for everything else. */ |
| |
| array = array_p (var) ? array_cell (var) : (ARRAY *)NULL; |
| h = assoc_p (var) ? assoc_cell (var) : (HASH_TABLE *)NULL; |
| |
| if (ALL_ELEMENT_SUB (t[0]) && t[1] == RBRACK) |
| { |
| if (assoc_p (var)) |
| return (h ? assoc_num_elements (h) : 0); |
| else if (array_p (var)) |
| return (array ? array_num_elements (array) : 0); |
| else |
| return (var_isset (var) ? 1 : 0); |
| } |
| |
| if (assoc_p (var)) |
| { |
| t[len - 1] = '\0'; |
| akey = expand_assignment_string_to_string (t, 0); /* [ */ |
| t[len - 1] = RBRACK; |
| if (akey == 0 || *akey == 0) |
| { |
| err_badarraysub (t); |
| FREE (akey); |
| return (-1); |
| } |
| t = assoc_reference (assoc_cell (var), akey); |
| free (akey); |
| } |
| else |
| { |
| ind = array_expand_index (var, t, len, 0); |
| /* negative subscripts to indexed arrays count back from end */ |
| if (var && array_p (var) && ind < 0) |
| ind = array_max_index (array_cell (var)) + 1 + ind; |
| if (ind < 0) |
| { |
| err_badarraysub (t); |
| return (-1); |
| } |
| if (array_p (var)) |
| t = array_reference (array, ind); |
| else |
| t = (ind == 0) ? value_cell (var) : (char *)NULL; |
| } |
| |
| len = MB_STRLEN (t); |
| return (len); |
| } |
| #endif /* ARRAY_VARS */ |
| |
| static int |
| valid_brace_expansion_word (name, var_is_special) |
| char *name; |
| int var_is_special; |
| { |
| if (DIGIT (*name) && all_digits (name)) |
| return 1; |
| else if (var_is_special) |
| return 1; |
| #if defined (ARRAY_VARS) |
| else if (valid_array_reference (name, 0)) |
| return 1; |
| #endif /* ARRAY_VARS */ |
| else if (legal_identifier (name)) |
| return 1; |
| else |
| return 0; |
| } |
| |
| static int |
| chk_atstar (name, quoted, pflags, quoted_dollar_atp, contains_dollar_at) |
| char *name; |
| int quoted, pflags; |
| int *quoted_dollar_atp, *contains_dollar_at; |
| { |
| char *temp1; |
| |
| if (name == 0) |
| { |
| if (quoted_dollar_atp) |
| *quoted_dollar_atp = 0; |
| if (contains_dollar_at) |
| *contains_dollar_at = 0; |
| return 0; |
| } |
| |
| /* check for $@ and $* */ |
| if (name[0] == '@' && name[1] == 0) |
| { |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 1; |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| return 1; |
| } |
| else if (name[0] == '*' && name[1] == '\0' && quoted == 0) |
| { |
| /* Need more checks here that parallel what string_list_pos_params and |
| param_expand do. Check expand_no_split_dollar_star and ??? */ |
| if (contains_dollar_at && expand_no_split_dollar_star == 0) |
| *contains_dollar_at = 1; |
| return 1; |
| } |
| |
| /* Now check for ${array[@]} and ${array[*]} */ |
| #if defined (ARRAY_VARS) |
| else if (valid_array_reference (name, 0)) |
| { |
| temp1 = mbschr (name, LBRACK); |
| if (temp1 && temp1[1] == '@' && temp1[2] == RBRACK) |
| { |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 1; |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| return 1; |
| } |
| /* ${array[*]}, when unquoted, should be treated like ${array[@]}, |
| which should result in separate words even when IFS is unset. */ |
| if (temp1 && temp1[1] == '*' && temp1[2] == RBRACK && quoted == 0) |
| { |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| return 1; |
| } |
| } |
| #endif |
| return 0; |
| } |
| |
| /* Parameter expand NAME, and return a new string which is the expansion, |
| or NULL if there was no expansion. NAME is as given in ${NAMEcWORD}. |
| VAR_IS_SPECIAL is non-zero if NAME is one of the special variables in |
| the shell, e.g., "@", "$", "*", etc. QUOTED, if non-zero, means that |
| NAME was found inside of a double-quoted expression. */ |
| static WORD_DESC * |
| parameter_brace_expand_word (name, var_is_special, quoted, pflags, indp) |
| char *name; |
| int var_is_special, quoted, pflags; |
| arrayind_t *indp; |
| { |
| WORD_DESC *ret; |
| char *temp, *tt; |
| intmax_t arg_index; |
| SHELL_VAR *var; |
| int atype, rflags; |
| arrayind_t ind; |
| |
| ret = 0; |
| temp = 0; |
| rflags = 0; |
| |
| if (indp) |
| *indp = INTMAX_MIN; |
| |
| /* Handle multiple digit arguments, as in ${11}. */ |
| if (legal_number (name, &arg_index)) |
| { |
| tt = get_dollar_var_value (arg_index); |
| if (tt) |
| temp = (*tt && (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT))) |
| ? quote_string (tt) |
| : quote_escapes (tt); |
| else |
| temp = (char *)NULL; |
| FREE (tt); |
| } |
| else if (var_is_special) /* ${@} */ |
| { |
| int sindex; |
| tt = (char *)xmalloc (2 + strlen (name)); |
| tt[sindex = 0] = '$'; |
| strcpy (tt + 1, name); |
| |
| ret = param_expand (tt, &sindex, quoted, (int *)NULL, (int *)NULL, |
| (int *)NULL, (int *)NULL, pflags); |
| free (tt); |
| } |
| #if defined (ARRAY_VARS) |
| else if (valid_array_reference (name, 0)) |
| { |
| expand_arrayref: |
| var = array_variable_part (name, 0, &tt, (int *)0); |
| /* These are the cases where word splitting will not be performed */ |
| if (pflags & PF_ASSIGNRHS) |
| { |
| if (ALL_ELEMENT_SUB (tt[0]) && tt[1] == RBRACK) |
| { |
| /* Only treat as double quoted if array variable */ |
| if (var && (array_p (var) || assoc_p (var))) |
| temp = array_value (name, quoted|Q_DOUBLE_QUOTES, AV_ASSIGNRHS, &atype, &ind); |
| else |
| temp = array_value (name, quoted, 0, &atype, &ind); |
| } |
| else |
| temp = array_value (name, quoted, 0, &atype, &ind); |
| } |
| /* Posix interp 888 */ |
| else if (pflags & PF_NOSPLIT2) |
| { |
| /* Special cases, then general case, for each of A[@], A[*], A[n] */ |
| #if defined (HANDLE_MULTIBYTE) |
| if (tt[0] == '@' && tt[1] == RBRACK && var && quoted == 0 && ifs_is_set && ifs_is_null == 0 && ifs_firstc[0] != ' ') |
| #else |
| if (tt[0] == '@' && tt[1] == RBRACK && var && quoted == 0 && ifs_is_set && ifs_is_null == 0 && ifs_firstc != ' ') |
| #endif |
| temp = array_value (name, Q_DOUBLE_QUOTES, AV_ASSIGNRHS, &atype, &ind); |
| else if (tt[0] == '@' && tt[1] == RBRACK) |
| temp = array_value (name, quoted, 0, &atype, &ind); |
| else if (tt[0] == '*' && tt[1] == RBRACK && expand_no_split_dollar_star && ifs_is_null) |
| temp = array_value (name, Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT, 0, &atype, &ind); |
| else if (tt[0] == '*' && tt[1] == RBRACK) |
| temp = array_value (name, quoted, 0, &atype, &ind); |
| else |
| temp = array_value (name, quoted, 0, &atype, &ind); |
| } |
| else if (tt[0] == '*' && tt[1] == RBRACK && expand_no_split_dollar_star && ifs_is_null) |
| temp = array_value (name, Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT, 0, &atype, &ind); |
| else |
| temp = array_value (name, quoted, 0, &atype, &ind); |
| if (atype == 0 && temp) |
| { |
| temp = (*temp && (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT))) |
| ? quote_string (temp) |
| : quote_escapes (temp); |
| rflags |= W_ARRAYIND; |
| if (indp) |
| *indp = ind; |
| } |
| else if (atype == 1 && temp && QUOTED_NULL (temp) && (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT))) |
| rflags |= W_HASQUOTEDNULL; |
| } |
| #endif |
| else if (var = find_variable (name)) |
| { |
| if (var_isset (var) && invisible_p (var) == 0) |
| { |
| #if defined (ARRAY_VARS) |
| /* We avoid a memory leak by saving TT as the memory allocated by |
| assoc_to_string or array_to_string and leaving it 0 otherwise, |
| then freeing TT after quoting temp. */ |
| tt = (char *)NULL; |
| if ((pflags & PF_ALLINDS) && assoc_p (var)) |
| tt = temp = assoc_empty (assoc_cell (var)) ? (char *)NULL : assoc_to_string (assoc_cell (var), " ", quoted); |
| else if ((pflags & PF_ALLINDS) && array_p (var)) |
| tt = temp = array_empty (array_cell (var)) ? (char *)NULL : array_to_string (array_cell (var), " ", quoted); |
| else if (assoc_p (var)) |
| temp = assoc_reference (assoc_cell (var), "0"); |
| else if (array_p (var)) |
| temp = array_reference (array_cell (var), 0); |
| else |
| temp = value_cell (var); |
| #else |
| temp = value_cell (var); |
| #endif |
| |
| if (temp) |
| temp = (*temp && (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT))) |
| ? quote_string (temp) |
| : ((pflags & PF_ASSIGNRHS) ? quote_rhs (temp) |
| : quote_escapes (temp)); |
| FREE (tt); |
| } |
| else |
| temp = (char *)NULL; |
| } |
| else if (var = find_variable_last_nameref (name, 0)) |
| { |
| temp = nameref_cell (var); |
| #if defined (ARRAY_VARS) |
| /* Handle expanding nameref whose value is x[n] */ |
| if (temp && *temp && valid_array_reference (temp, 0)) |
| { |
| name = temp; |
| goto expand_arrayref; |
| } |
| else |
| #endif |
| /* y=2 ; typeset -n x=y; echo ${x} is not the same as echo ${2} in ksh */ |
| if (temp && *temp && legal_identifier (temp) == 0) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| report_error (_("%s: invalid variable name for name reference"), temp); |
| temp = &expand_param_error; |
| } |
| else |
| temp = (char *)NULL; |
| } |
| else |
| temp = (char *)NULL; |
| |
| if (ret == 0) |
| { |
| ret = alloc_word_desc (); |
| ret->word = temp; |
| ret->flags |= rflags; |
| } |
| return ret; |
| } |
| |
| static char * |
| parameter_brace_find_indir (name, var_is_special, quoted, find_nameref) |
| char *name; |
| int var_is_special, quoted, find_nameref; |
| { |
| char *temp, *t; |
| WORD_DESC *w; |
| SHELL_VAR *v; |
| int pflags, oldex; |
| |
| if (find_nameref && var_is_special == 0 && (v = find_variable_last_nameref (name, 0)) && |
| nameref_p (v) && (t = nameref_cell (v)) && *t) |
| return (savestring (t)); |
| |
| /* If var_is_special == 0, and name is not an array reference, this does |
| more expansion than necessary. It should really look up the variable's |
| value and not try to expand it. */ |
| pflags = PF_IGNUNBOUND; |
| /* Note that we're not going to be doing word splitting here */ |
| if (var_is_special) |
| { |
| pflags |= PF_ASSIGNRHS; /* suppresses word splitting */ |
| oldex = expand_no_split_dollar_star; |
| expand_no_split_dollar_star = 1; |
| } |
| w = parameter_brace_expand_word (name, var_is_special, quoted, pflags, 0); |
| if (var_is_special) |
| expand_no_split_dollar_star = oldex; |
| |
| t = w->word; |
| /* Have to dequote here if necessary */ |
| if (t) |
| { |
| temp = ((quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) || var_is_special) |
| ? dequote_string (t) |
| : dequote_escapes (t); |
| free (t); |
| t = temp; |
| } |
| dispose_word_desc (w); |
| |
| return t; |
| } |
| |
| /* Expand an indirect reference to a variable: ${!NAME} expands to the |
| value of the variable whose name is the value of NAME. */ |
| static WORD_DESC * |
| parameter_brace_expand_indir (name, var_is_special, quoted, pflags, quoted_dollar_atp, contains_dollar_at) |
| char *name; |
| int var_is_special, quoted, pflags; |
| int *quoted_dollar_atp, *contains_dollar_at; |
| { |
| char *t; |
| WORD_DESC *w; |
| SHELL_VAR *v; |
| |
| /* See if it's a nameref first, behave in ksh93-compatible fashion. |
| There is at least one incompatibility: given ${!foo[0]} where foo=bar, |
| bash performs an indirect lookup on foo[0] and expands the result; |
| ksh93 expands bar[0]. We could do that here -- there are enough usable |
| primitives to do that -- but do not at this point. */ |
| if (var_is_special == 0 && (v = find_variable_last_nameref (name, 0))) |
| { |
| if (nameref_p (v) && (t = nameref_cell (v)) && *t) |
| { |
| w = alloc_word_desc (); |
| w->word = savestring (t); |
| w->flags = 0; |
| return w; |
| } |
| } |
| |
| /* An indirect reference to a positional parameter or a special parameter |
| is ok. Indirect references to array references, as explained above, are |
| ok (currently). Only references to unset variables are errors at this |
| point. */ |
| if (legal_identifier (name) && v == 0) |
| { |
| report_error (_("%s: invalid indirect expansion"), name); |
| w = alloc_word_desc (); |
| w->word = &expand_param_error; |
| w->flags = 0; |
| return (w); |
| } |
| |
| t = parameter_brace_find_indir (name, var_is_special, quoted, 0); |
| |
| chk_atstar (t, quoted, pflags, quoted_dollar_atp, contains_dollar_at); |
| |
| #if defined (ARRAY_VARS) |
| /* Array references to unset variables are also an error */ |
| if (t == 0 && valid_array_reference (name, 0)) |
| { |
| v = array_variable_part (name, 0, (char **)0, (int *)0); |
| if (v == 0) |
| { |
| report_error (_("%s: invalid indirect expansion"), name); |
| w = alloc_word_desc (); |
| w->word = &expand_param_error; |
| w->flags = 0; |
| return (w); |
| } |
| else |
| return (WORD_DESC *)NULL; |
| } |
| #endif |
| |
| if (t == 0) |
| return (WORD_DESC *)NULL; |
| |
| if (valid_brace_expansion_word (t, SPECIAL_VAR (t, 0)) == 0) |
| { |
| report_error (_("%s: invalid variable name"), t); |
| free (t); |
| w = alloc_word_desc (); |
| w->word = &expand_param_error; |
| w->flags = 0; |
| return (w); |
| } |
| |
| w = parameter_brace_expand_word (t, SPECIAL_VAR(t, 0), quoted, pflags, 0); |
| free (t); |
| |
| return w; |
| } |
| |
| /* Expand the right side of a parameter expansion of the form ${NAMEcVALUE}, |
| depending on the value of C, the separating character. C can be one of |
| "-", "+", or "=". QUOTED is true if the entire brace expression occurs |
| between double quotes. */ |
| static WORD_DESC * |
| parameter_brace_expand_rhs (name, value, op, quoted, pflags, qdollaratp, hasdollarat) |
| char *name, *value; |
| int op, quoted, pflags, *qdollaratp, *hasdollarat; |
| { |
| WORD_DESC *w; |
| WORD_LIST *l, *tl; |
| char *t, *t1, *temp, *vname; |
| int l_hasdollat, sindex; |
| SHELL_VAR *v; |
| |
| /*itrace("parameter_brace_expand_rhs: %s:%s pflags = %d", name, value, pflags);*/ |
| /* If the entire expression is between double quotes, we want to treat |
| the value as a double-quoted string, with the exception that we strip |
| embedded unescaped double quotes (for sh backwards compatibility). */ |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && *value) |
| { |
| sindex = 0; |
| temp = string_extract_double_quoted (value, &sindex, SX_STRIPDQ); |
| } |
| else |
| temp = value; |
| |
| w = alloc_word_desc (); |
| l_hasdollat = 0; |
| l = *temp ? expand_string_for_rhs (temp, quoted, op, pflags, &l_hasdollat, (int *)NULL) |
| : (WORD_LIST *)0; |
| if (hasdollarat) |
| *hasdollarat = l_hasdollat || (l && l->next); |
| if (temp != value) |
| free (temp); |
| |
| /* list_string takes multiple CTLNULs and turns them into an empty word |
| with W_SAWQUOTEDNULL set. Turn it back into a single CTLNUL for the |
| rest of this function and the caller. */ |
| for (tl = l; tl; tl = tl->next) |
| { |
| if (tl->word && (tl->word->word == 0 || tl->word->word[0] == 0) && |
| (tl->word->flags | W_SAWQUOTEDNULL)) |
| { |
| t = make_quoted_char ('\0'); |
| FREE (tl->word->word); |
| tl->word->word = t; |
| tl->word->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| tl->word->flags &= ~W_SAWQUOTEDNULL; |
| } |
| } |
| |
| if (l) |
| { |
| /* If l->next is not null, we know that TEMP contained "$@", since that |
| is the only expansion that creates more than one word. */ |
| if (qdollaratp && ((l_hasdollat && quoted) || l->next)) |
| { |
| /*itrace("parameter_brace_expand_rhs: %s:%s: l != NULL, set *qdollaratp", name, value);*/ |
| *qdollaratp = 1; |
| } |
| |
| /* The expansion of TEMP returned something. We need to treat things |
| slightly differently if L_HASDOLLAT is non-zero. If we have "$@", |
| the individual words have already been quoted. We need to turn them |
| into a string with the words separated by the first character of |
| $IFS without any additional quoting, so string_list_dollar_at won't |
| do the right thing. If IFS is null, we want "$@" to split into |
| separate arguments, not be concatenated, so we use string_list_internal |
| and mark the word to be split on spaces later. We use |
| string_list_dollar_star for "$@" otherwise. */ |
| if (l->next && ifs_is_null) |
| { |
| temp = string_list_internal (l, " "); |
| w->flags |= W_SPLITSPACE; |
| } |
| else if (l_hasdollat || l->next) |
| temp = string_list_dollar_star (l, quoted, 0); |
| else |
| { |
| temp = string_list (l); |
| if (temp && (QUOTED_NULL (temp) == 0) && (l->word->flags & W_SAWQUOTEDNULL)) |
| w->flags |= W_SAWQUOTEDNULL; /* XXX */ |
| } |
| |
| /* If we have a quoted null result (QUOTED_NULL(temp)) and the word is |
| a quoted null (l->next == 0 && QUOTED_NULL(l->word->word)), the |
| flags indicate it (l->word->flags & W_HASQUOTEDNULL), and the |
| expansion is quoted (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| (which is more paranoia than anything else), we need to return the |
| quoted null string and set the flags to indicate it. */ |
| if (l->next == 0 && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && QUOTED_NULL (temp) && QUOTED_NULL (l->word->word) && (l->word->flags & W_HASQUOTEDNULL)) |
| { |
| w->flags |= W_HASQUOTEDNULL; |
| /*itrace("parameter_brace_expand_rhs (%s:%s): returning quoted null, turning off qdollaratp", name, value);*/ |
| /* If we return a quoted null with L_HASDOLLARAT, we either have a |
| construct like "${@-$@}" or "${@-${@-$@}}" with no positional |
| parameters or a quoted expansion of "$@" with $1 == ''. In either |
| case, we don't want to enable special handling of $@. */ |
| if (qdollaratp && l_hasdollat) |
| *qdollaratp = 0; |
| } |
| dispose_words (l); |
| } |
| else if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && l_hasdollat) |
| { |
| /* Posix interp 221 changed the rules on this. The idea is that |
| something like "$xxx$@" should expand the same as "${foo-$xxx$@}" |
| when foo and xxx are unset. The problem is that it's not in any |
| way backwards compatible and few other shells do it. We're eventually |
| going to try and split the difference (heh) a little bit here. */ |
| /* l_hasdollat == 1 means we saw a quoted dollar at. */ |
| |
| /* The brace expansion occurred between double quotes and there was |
| a $@ in TEMP. It does not matter if the $@ is quoted, as long as |
| it does not expand to anything. In this case, we want to return |
| a quoted empty string. Posix interp 888 */ |
| temp = make_quoted_char ('\0'); |
| w->flags |= W_HASQUOTEDNULL; |
| /*itrace("parameter_brace_expand_rhs (%s:%s): returning quoted null", name, value);*/ |
| } |
| else |
| temp = (char *)NULL; |
| |
| if (op == '-' || op == '+') |
| { |
| w->word = temp; |
| return w; |
| } |
| |
| /* op == '=' */ |
| t1 = temp ? dequote_string (temp) : savestring (""); |
| free (temp); |
| |
| /* bash-4.4/5.0 */ |
| vname = name; |
| if (*name == '!' && |
| (legal_variable_starter ((unsigned char)name[1]) || DIGIT (name[1]) || VALID_INDIR_PARAM (name[1]))) |
| { |
| vname = parameter_brace_find_indir (name + 1, SPECIAL_VAR (name, 1), quoted, 1); |
| if (vname == 0 || *vname == 0) |
| { |
| report_error (_("%s: invalid indirect expansion"), name); |
| free (vname); |
| free (t1); |
| dispose_word (w); |
| return &expand_wdesc_error; |
| } |
| if (legal_identifier (vname) == 0) |
| { |
| report_error (_("%s: invalid variable name"), vname); |
| free (vname); |
| free (t1); |
| dispose_word (w); |
| return &expand_wdesc_error; |
| } |
| } |
| |
| #if defined (ARRAY_VARS) |
| if (valid_array_reference (vname, 0)) |
| v = assign_array_element (vname, t1, 0); |
| else |
| #endif /* ARRAY_VARS */ |
| v = bind_variable (vname, t1, 0); |
| |
| if (v == 0 || readonly_p (v) || noassign_p (v)) /* expansion error */ |
| { |
| if ((v == 0 || readonly_p (v)) && interactive_shell == 0 && posixly_correct) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| exp_jump_to_top_level (FORCE_EOF); |
| } |
| else |
| { |
| if (vname != name) |
| free (vname); |
| last_command_exit_value = EX_BADUSAGE; |
| exp_jump_to_top_level (DISCARD); |
| } |
| } |
| |
| stupidly_hack_special_variables (vname); |
| |
| if (vname != name) |
| free (vname); |
| |
| /* From Posix group discussion Feb-March 2010. Issue 7 0000221 */ |
| |
| /* If we are double-quoted or if we are not going to be performing word |
| splitting, we want to quote the value we return appropriately, like |
| the other expansions this function handles. */ |
| w->word = (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) ? quote_string (t1) : quote_escapes (t1); |
| /* If we have something that's non-null, that's not a quoted null string, |
| and we're not going to be performing word splitting (we know we're not |
| because the operator is `='), we can forget we saw a quoted null. */ |
| if (w->word && w->word[0] && QUOTED_NULL (w->word) == 0) |
| w->flags &= ~W_SAWQUOTEDNULL; |
| free (t1); |
| |
| /* If we convert a null string into a quoted null, make sure the caller |
| knows it. */ |
| if ((quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) && QUOTED_NULL (w->word)) |
| w->flags |= W_HASQUOTEDNULL; |
| |
| return w; |
| } |
| |
| /* Deal with the right hand side of a ${name:?value} expansion in the case |
| that NAME is null or not set. If VALUE is non-null it is expanded and |
| used as the error message to print, otherwise a standard message is |
| printed. */ |
| static void |
| parameter_brace_expand_error (name, value, check_null) |
| char *name, *value; |
| int check_null; |
| { |
| WORD_LIST *l; |
| char *temp; |
| |
| set_exit_status (EXECUTION_FAILURE); /* ensure it's non-zero */ |
| if (value && *value) |
| { |
| l = expand_string (value, 0); |
| temp = string_list (l); |
| report_error ("%s: %s", name, temp ? temp : ""); /* XXX was value not "" */ |
| FREE (temp); |
| dispose_words (l); |
| } |
| else if (check_null == 0) |
| report_error (_("%s: parameter not set"), name); |
| else |
| report_error (_("%s: parameter null or not set"), name); |
| |
| /* Free the data we have allocated during this expansion, since we |
| are about to longjmp out. */ |
| free (name); |
| FREE (value); |
| } |
| |
| /* Return 1 if NAME is something for which parameter_brace_expand_length is |
| OK to do. */ |
| static int |
| valid_length_expression (name) |
| char *name; |
| { |
| return (name[1] == '\0' || /* ${#} */ |
| ((sh_syntaxtab[(unsigned char) name[1]] & CSPECVAR) && name[2] == '\0') || /* special param */ |
| (DIGIT (name[1]) && all_digits (name + 1)) || /* ${#11} */ |
| #if defined (ARRAY_VARS) |
| valid_array_reference (name + 1, 0) || /* ${#a[7]} */ |
| #endif |
| legal_identifier (name + 1)); /* ${#PS1} */ |
| } |
| |
| /* Handle the parameter brace expansion that requires us to return the |
| length of a parameter. */ |
| static intmax_t |
| parameter_brace_expand_length (name) |
| char *name; |
| { |
| char *t, *newname; |
| intmax_t number, arg_index; |
| WORD_LIST *list; |
| SHELL_VAR *var; |
| |
| var = (SHELL_VAR *)NULL; |
| |
| if (name[1] == '\0') /* ${#} */ |
| number = number_of_args (); |
| else if (DOLLAR_AT_STAR (name[1]) && name[2] == '\0') /* ${#@}, ${#*} */ |
| number = number_of_args (); |
| else if ((sh_syntaxtab[(unsigned char) name[1]] & CSPECVAR) && name[2] == '\0') |
| { |
| /* Take the lengths of some of the shell's special parameters. */ |
| switch (name[1]) |
| { |
| case '-': |
| t = which_set_flags (); |
| break; |
| case '?': |
| t = itos (last_command_exit_value); |
| break; |
| case '$': |
| t = itos (dollar_dollar_pid); |
| break; |
| case '!': |
| if (last_asynchronous_pid == NO_PID) |
| t = (char *)NULL; /* XXX - error if set -u set? */ |
| else |
| t = itos (last_asynchronous_pid); |
| break; |
| case '#': |
| t = itos (number_of_args ()); |
| break; |
| } |
| number = STRLEN (t); |
| FREE (t); |
| } |
| #if defined (ARRAY_VARS) |
| else if (valid_array_reference (name + 1, 0)) |
| number = array_length_reference (name + 1); |
| #endif /* ARRAY_VARS */ |
| else |
| { |
| number = 0; |
| |
| if (legal_number (name + 1, &arg_index)) /* ${#1} */ |
| { |
| t = get_dollar_var_value (arg_index); |
| if (t == 0 && unbound_vars_is_error) |
| return INTMAX_MIN; |
| number = MB_STRLEN (t); |
| FREE (t); |
| } |
| #if defined (ARRAY_VARS) |
| else if ((var = find_variable (name + 1)) && (invisible_p (var) == 0) && (array_p (var) || assoc_p (var))) |
| { |
| if (assoc_p (var)) |
| t = assoc_reference (assoc_cell (var), "0"); |
| else |
| t = array_reference (array_cell (var), 0); |
| if (t == 0 && unbound_vars_is_error) |
| return INTMAX_MIN; |
| number = MB_STRLEN (t); |
| } |
| #endif |
| /* Fast path for the common case of taking the length of a non-dynamic |
| scalar variable value. */ |
| else if ((var || (var = find_variable (name + 1))) && |
| invisible_p (var) == 0 && |
| array_p (var) == 0 && assoc_p (var) == 0 && |
| var->dynamic_value == 0) |
| number = value_cell (var) ? MB_STRLEN (value_cell (var)) : 0; |
| else if (var == 0 && unbound_vars_is_error == 0) |
| number = 0; |
| else /* ${#PS1} */ |
| { |
| newname = savestring (name); |
| newname[0] = '$'; |
| list = expand_string (newname, Q_DOUBLE_QUOTES); |
| t = list ? string_list (list) : (char *)NULL; |
| free (newname); |
| if (list) |
| dispose_words (list); |
| |
| number = t ? MB_STRLEN (t) : 0; |
| FREE (t); |
| } |
| } |
| |
| return (number); |
| } |
| |
| /* Skip characters in SUBSTR until DELIM. SUBSTR is an arithmetic expression, |
| so we do some ad-hoc parsing of an arithmetic expression to find |
| the first DELIM, instead of using strchr(3). Two rules: |
| 1. If the substring contains a `(', read until closing `)'. |
| 2. If the substring contains a `?', read past one `:' for each `?'. |
| The SD_ARITHEXP flag to skip_to_delim takes care of doing this. |
| */ |
| |
| static char * |
| skiparith (substr, delim) |
| char *substr; |
| int delim; |
| { |
| int i; |
| char delims[2]; |
| |
| delims[0] = delim; |
| delims[1] = '\0'; |
| |
| i = skip_to_delim (substr, 0, delims, SD_ARITHEXP); |
| return (substr + i); |
| } |
| |
| /* Verify and limit the start and end of the desired substring. If |
| VTYPE == 0, a regular shell variable is being used; if it is 1, |
| then the positional parameters are being used; if it is 2, then |
| VALUE is really a pointer to an array variable that should be used. |
| Return value is 1 if both values were OK, 0 if there was a problem |
| with an invalid expression, or -1 if the values were out of range. */ |
| static int |
| verify_substring_values (v, value, substr, vtype, e1p, e2p) |
| SHELL_VAR *v; |
| char *value, *substr; |
| int vtype; |
| intmax_t *e1p, *e2p; |
| { |
| char *t, *temp1, *temp2; |
| arrayind_t len; |
| int expok; |
| #if defined (ARRAY_VARS) |
| ARRAY *a; |
| HASH_TABLE *h; |
| #endif |
| |
| /* duplicate behavior of strchr(3) */ |
| t = skiparith (substr, ':'); |
| if (*t && *t == ':') |
| *t = '\0'; |
| else |
| t = (char *)0; |
| |
| temp1 = expand_arith_string (substr, Q_DOUBLE_QUOTES); |
| *e1p = evalexp (temp1, 0, &expok); /* XXX - EXP_EXPANDED? */ |
| free (temp1); |
| if (expok == 0) |
| return (0); |
| |
| len = -1; /* paranoia */ |
| switch (vtype) |
| { |
| case VT_VARIABLE: |
| case VT_ARRAYMEMBER: |
| len = MB_STRLEN (value); |
| break; |
| case VT_POSPARMS: |
| len = number_of_args () + 1; |
| if (*e1p == 0) |
| len++; /* add one arg if counting from $0 */ |
| break; |
| #if defined (ARRAY_VARS) |
| case VT_ARRAYVAR: |
| /* For arrays, the first value deals with array indices. Negative |
| offsets count from one past the array's maximum index. Associative |
| arrays treat the number of elements as the maximum index. */ |
| if (assoc_p (v)) |
| { |
| h = assoc_cell (v); |
| len = assoc_num_elements (h) + (*e1p < 0); |
| } |
| else |
| { |
| a = (ARRAY *)value; |
| len = array_max_index (a) + (*e1p < 0); /* arrays index from 0 to n - 1 */ |
| } |
| break; |
| #endif |
| } |
| |
| if (len == -1) /* paranoia */ |
| return -1; |
| |
| if (*e1p < 0) /* negative offsets count from end */ |
| *e1p += len; |
| |
| if (*e1p > len || *e1p < 0) |
| return (-1); |
| |
| #if defined (ARRAY_VARS) |
| /* For arrays, the second offset deals with the number of elements. */ |
| if (vtype == VT_ARRAYVAR) |
| len = assoc_p (v) ? assoc_num_elements (h) : array_num_elements (a); |
| #endif |
| |
| if (t) |
| { |
| t++; |
| temp2 = savestring (t); |
| temp1 = expand_arith_string (temp2, Q_DOUBLE_QUOTES); |
| free (temp2); |
| t[-1] = ':'; |
| *e2p = evalexp (temp1, 0, &expok); /* XXX - EXP_EXPANDED? */ |
| free (temp1); |
| if (expok == 0) |
| return (0); |
| |
| /* Should we allow positional parameter length < 0 to count backwards |
| from end of positional parameters? */ |
| #if 1 |
| if ((vtype == VT_ARRAYVAR || vtype == VT_POSPARMS) && *e2p < 0) |
| #else /* TAG: bash-5.2 */ |
| if (vtype == VT_ARRAYVAR && *e2p < 0) |
| #endif |
| { |
| internal_error (_("%s: substring expression < 0"), t); |
| return (0); |
| } |
| #if defined (ARRAY_VARS) |
| /* In order to deal with sparse arrays, push the intelligence about how |
| to deal with the number of elements desired down to the array- |
| specific functions. */ |
| if (vtype != VT_ARRAYVAR) |
| #endif |
| { |
| if (*e2p < 0) |
| { |
| *e2p += len; |
| if (*e2p < 0 || *e2p < *e1p) |
| { |
| internal_error (_("%s: substring expression < 0"), t); |
| return (0); |
| } |
| } |
| else |
| *e2p += *e1p; /* want E2 chars starting at E1 */ |
| if (*e2p > len) |
| *e2p = len; |
| } |
| } |
| else |
| *e2p = len; |
| |
| return (1); |
| } |
| |
| /* Return the type of variable specified by VARNAME (simple variable, |
| positional param, or array variable). Also return the value specified |
| by VARNAME (value of a variable or a reference to an array element). |
| QUOTED is the standard description of quoting state, using Q_* defines. |
| FLAGS is currently a set of flags to pass to array_value. If IND is |
| non-null and not INTMAX_MIN, and FLAGS includes AV_USEIND, IND is |
| passed to array_value so the array index is not computed again. |
| If this returns VT_VARIABLE, the caller assumes that CTLESC and CTLNUL |
| characters in the value are quoted with CTLESC and takes appropriate |
| steps. For convenience, *VALP is set to the dequoted VALUE. */ |
| static int |
| get_var_and_type (varname, value, ind, quoted, flags, varp, valp) |
| char *varname, *value; |
| arrayind_t ind; |
| int quoted, flags; |
| SHELL_VAR **varp; |
| char **valp; |
| { |
| int vtype, want_indir; |
| char *temp, *vname; |
| SHELL_VAR *v; |
| arrayind_t lind; |
| |
| want_indir = *varname == '!' && |
| (legal_variable_starter ((unsigned char)varname[1]) || DIGIT (varname[1]) |
| || VALID_INDIR_PARAM (varname[1])); |
| if (want_indir) |
| vname = parameter_brace_find_indir (varname+1, SPECIAL_VAR (varname, 1), quoted, 1); |
| /* XXX - what if vname == 0 || *vname == 0 ? */ |
| else |
| vname = varname; |
| |
| if (vname == 0) |
| { |
| vtype = VT_VARIABLE; |
| *varp = (SHELL_VAR *)NULL; |
| *valp = (char *)NULL; |
| return (vtype); |
| } |
| |
| /* This sets vtype to VT_VARIABLE or VT_POSPARMS */ |
| vtype = STR_DOLLAR_AT_STAR (vname); |
| if (vtype == VT_POSPARMS && vname[0] == '*') |
| vtype |= VT_STARSUB; |
| *varp = (SHELL_VAR *)NULL; |
| |
| #if defined (ARRAY_VARS) |
| if (valid_array_reference (vname, 0)) |
| { |
| v = array_variable_part (vname, 0, &temp, (int *)0); |
| /* If we want to signal array_value to use an already-computed index, |
| set LIND to that index */ |
| lind = (ind != INTMAX_MIN && (flags & AV_USEIND)) ? ind : 0; |
| if (v && invisible_p (v)) |
| { |
| vtype = VT_ARRAYMEMBER; |
| *varp = (SHELL_VAR *)NULL; |
| *valp = (char *)NULL; |
| } |
| if (v && (array_p (v) || assoc_p (v))) |
| { |
| if (ALL_ELEMENT_SUB (temp[0]) && temp[1] == RBRACK) |
| { |
| /* Callers have to differentiate between indexed and associative */ |
| vtype = VT_ARRAYVAR; |
| if (temp[0] == '*') |
| vtype |= VT_STARSUB; |
| *valp = array_p (v) ? (char *)array_cell (v) : (char *)assoc_cell (v); |
| } |
| else |
| { |
| vtype = VT_ARRAYMEMBER; |
| *valp = array_value (vname, Q_DOUBLE_QUOTES, flags, (int *)NULL, &lind); |
| } |
| *varp = v; |
| } |
| else if (v && (ALL_ELEMENT_SUB (temp[0]) && temp[1] == RBRACK)) |
| { |
| vtype = VT_VARIABLE; |
| *varp = v; |
| if (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) |
| *valp = value ? dequote_string (value) : (char *)NULL; |
| else |
| *valp = value ? dequote_escapes (value) : (char *)NULL; |
| } |
| else |
| { |
| vtype = VT_ARRAYMEMBER; |
| *varp = v; |
| *valp = array_value (vname, Q_DOUBLE_QUOTES, flags, (int *)NULL, &lind); |
| } |
| } |
| else if ((v = find_variable (vname)) && (invisible_p (v) == 0) && (assoc_p (v) || array_p (v))) |
| { |
| vtype = VT_ARRAYMEMBER; |
| *varp = v; |
| *valp = assoc_p (v) ? assoc_reference (assoc_cell (v), "0") : array_reference (array_cell (v), 0); |
| } |
| else |
| #endif |
| { |
| if (value && vtype == VT_VARIABLE) |
| { |
| *varp = find_variable (vname); |
| if (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) |
| *valp = dequote_string (value); |
| else |
| *valp = dequote_escapes (value); |
| } |
| else |
| *valp = value; |
| } |
| |
| if (want_indir) |
| free (vname); |
| |
| return vtype; |
| } |
| |
| /***********************************************************/ |
| /* */ |
| /* Functions to perform transformations on variable values */ |
| /* */ |
| /***********************************************************/ |
| |
| static char * |
| string_var_assignment (v, s) |
| SHELL_VAR *v; |
| char *s; |
| { |
| char flags[MAX_ATTRIBUTES], *ret, *val; |
| int i; |
| |
| val = (v && (invisible_p (v) || var_isset (v) == 0)) ? (char *)NULL : sh_quote_reusable (s, 0); |
| i = var_attribute_string (v, 0, flags); |
| if (i == 0 && val == 0) |
| return (char *)NULL; |
| |
| ret = (char *)xmalloc (i + STRLEN (val) + strlen (v->name) + 16 + MAX_ATTRIBUTES); |
| if (i > 0 && val == 0) |
| sprintf (ret, "declare -%s %s", flags, v->name); |
| else if (i > 0) |
| sprintf (ret, "declare -%s %s=%s", flags, v->name, val); |
| else |
| sprintf (ret, "%s=%s", v->name, val); |
| free (val); |
| return ret; |
| } |
| |
| #if defined (ARRAY_VARS) |
| static char * |
| array_var_assignment (v, itype, quoted, atype) |
| SHELL_VAR *v; |
| int itype, quoted, atype; |
| { |
| char *ret, *val, flags[MAX_ATTRIBUTES]; |
| int i; |
| |
| if (v == 0) |
| return (char *)NULL; |
| if (atype == 2) |
| val = array_p (v) ? array_to_kvpair (array_cell (v), 0) |
| : assoc_to_kvpair (assoc_cell (v), 0); |
| else |
| val = array_p (v) ? array_to_assign (array_cell (v), 0) |
| : assoc_to_assign (assoc_cell (v), 0); |
| |
| if (val == 0 && (invisible_p (v) || var_isset (v) == 0)) |
| ; /* placeholder */ |
| else if (val == 0) |
| { |
| val = (char *)xmalloc (3); |
| val[0] = LPAREN; |
| val[1] = RPAREN; |
| val[2] = 0; |
| } |
| else |
| { |
| ret = (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) ? quote_string (val) : quote_escapes (val); |
| free (val); |
| val = ret; |
| } |
| |
| if (atype == 2) |
| return val; |
| |
| i = var_attribute_string (v, 0, flags); |
| ret = (char *)xmalloc (i + STRLEN (val) + strlen (v->name) + 16); |
| if (val) |
| sprintf (ret, "declare -%s %s=%s", flags, v->name, val); |
| else |
| sprintf (ret, "declare -%s %s", flags, v->name); |
| free (val); |
| return ret; |
| } |
| #endif |
| |
| static char * |
| pos_params_assignment (list, itype, quoted) |
| WORD_LIST *list; |
| int itype; |
| int quoted; |
| { |
| char *temp, *ret; |
| |
| /* first, we transform the list to quote each word. */ |
| temp = list_transform ('Q', (SHELL_VAR *)0, list, itype, quoted); |
| ret = (char *)xmalloc (strlen (temp) + 8); |
| strcpy (ret, "set -- "); |
| strcpy (ret + 7, temp); |
| free (temp); |
| return ret; |
| } |
| |
| static char * |
| string_transform (xc, v, s) |
| int xc; |
| SHELL_VAR *v; |
| char *s; |
| { |
| char *ret, flags[MAX_ATTRIBUTES], *t; |
| int i; |
| |
| if (((xc == 'A' || xc == 'a') && v == 0)) |
| return (char *)NULL; |
| else if (xc != 'a' && xc != 'A' && s == 0) |
| return (char *)NULL; |
| |
| switch (xc) |
| { |
| /* Transformations that interrogate the variable */ |
| case 'a': |
| i = var_attribute_string (v, 0, flags); |
| ret = (i > 0) ? savestring (flags) : (char *)NULL; |
| break; |
| case 'A': |
| ret = string_var_assignment (v, s); |
| break; |
| case 'K': |
| ret = sh_quote_reusable (s, 0); |
| break; |
| /* Transformations that modify the variable's value */ |
| case 'E': |
| t = ansiexpand (s, 0, strlen (s), (int *)0); |
| ret = dequote_escapes (t); |
| free (t); |
| break; |
| case 'P': |
| ret = decode_prompt_string (s); |
| break; |
| case 'Q': |
| ret = sh_quote_reusable (s, 0); |
| break; |
| case 'U': |
| ret = sh_modcase (s, 0, CASE_UPPER); |
| break; |
| case 'u': |
| ret = sh_modcase (s, 0, CASE_UPFIRST); /* capitalize */ |
| break; |
| case 'L': |
| ret = sh_modcase (s, 0, CASE_LOWER); |
| break; |
| default: |
| ret = (char *)NULL; |
| break; |
| } |
| return ret; |
| } |
| |
| static char * |
| list_transform (xc, v, list, itype, quoted) |
| int xc; |
| SHELL_VAR *v; |
| WORD_LIST *list; |
| int itype, quoted; |
| { |
| WORD_LIST *new, *l; |
| WORD_DESC *w; |
| char *tword; |
| int qflags; |
| |
| for (new = (WORD_LIST *)NULL, l = list; l; l = l->next) |
| { |
| tword = string_transform (xc, v, l->word->word); |
| w = alloc_word_desc (); |
| w->word = tword ? tword : savestring (""); /* XXX */ |
| new = make_word_list (w, new); |
| } |
| l = REVERSE_LIST (new, WORD_LIST *); |
| |
| qflags = quoted; |
| /* If we are expanding in a context where word splitting will not be |
| performed, treat as quoted. This changes how $* will be expanded. */ |
| if (itype == '*' && expand_no_split_dollar_star && ifs_is_null) |
| qflags |= Q_DOUBLE_QUOTES; /* Posix interp 888 */ |
| |
| tword = string_list_pos_params (itype, l, qflags, 0); |
| dispose_words (l); |
| |
| return (tword); |
| } |
| |
| static char * |
| parameter_list_transform (xc, itype, quoted) |
| int xc; |
| int itype; |
| int quoted; |
| { |
| char *ret; |
| WORD_LIST *list; |
| |
| list = list_rest_of_args (); |
| if (list == 0) |
| return ((char *)NULL); |
| if (xc == 'A') |
| ret = pos_params_assignment (list, itype, quoted); |
| else |
| ret = list_transform (xc, (SHELL_VAR *)0, list, itype, quoted); |
| dispose_words (list); |
| return (ret); |
| } |
| |
| #if defined (ARRAY_VARS) |
| static char * |
| array_transform (xc, var, starsub, quoted) |
| int xc; |
| SHELL_VAR *var; |
| int starsub; /* so we can figure out how it's indexed */ |
| int quoted; |
| { |
| ARRAY *a; |
| HASH_TABLE *h; |
| int itype; |
| char *ret; |
| WORD_LIST *list; |
| SHELL_VAR *v; |
| |
| v = var; /* XXX - for now */ |
| |
| itype = starsub ? '*' : '@'; |
| |
| if (xc == 'A') |
| return (array_var_assignment (v, itype, quoted, 1)); |
| else if (xc == 'K') |
| return (array_var_assignment (v, itype, quoted, 2)); |
| |
| /* special case for unset arrays and attributes */ |
| if (xc == 'a' && (invisible_p (v) || var_isset (v) == 0)) |
| { |
| char flags[MAX_ATTRIBUTES]; |
| int i; |
| |
| i = var_attribute_string (v, 0, flags); |
| return ((i > 0) ? savestring (flags) : (char *)NULL); |
| } |
| |
| a = (v && array_p (v)) ? array_cell (v) : 0; |
| h = (v && assoc_p (v)) ? assoc_cell (v) : 0; |
| |
| list = a ? array_to_word_list (a) : (h ? assoc_to_word_list (h) : 0); |
| if (list == 0) |
| return ((char *)NULL); |
| ret = list_transform (xc, v, list, itype, quoted); |
| dispose_words (list); |
| |
| return ret; |
| } |
| #endif /* ARRAY_VARS */ |
| |
| static int |
| valid_parameter_transform (xform) |
| char *xform; |
| { |
| if (xform[1]) |
| return 0; |
| |
| /* check for valid values of xform[0] */ |
| switch (xform[0]) |
| { |
| case 'a': /* expand to a string with just attributes */ |
| case 'A': /* expand as an assignment statement with attributes */ |
| case 'K': /* expand assoc array to list of key/value pairs */ |
| case 'E': /* expand like $'...' */ |
| case 'P': /* expand like prompt string */ |
| case 'Q': /* quote reusably */ |
| case 'U': /* transform to uppercase */ |
| case 'u': /* tranform by capitalizing */ |
| case 'L': /* transform to lowercase */ |
| return 1; |
| default: |
| return 0; |
| } |
| } |
| |
| static char * |
| parameter_brace_transform (varname, value, ind, xform, rtype, quoted, pflags, flags) |
| char *varname, *value; |
| int ind; |
| char *xform; |
| int rtype, quoted, pflags, flags; |
| { |
| int vtype, xc, starsub; |
| char *temp1, *val, *oname; |
| SHELL_VAR *v; |
| |
| xc = xform[0]; |
| if (value == 0 && xc != 'A' && xc != 'a') |
| return ((char *)NULL); |
| |
| oname = this_command_name; |
| this_command_name = varname; |
| |
| vtype = get_var_and_type (varname, value, ind, quoted, flags, &v, &val); |
| if (vtype == -1) |
| { |
| this_command_name = oname; |
| return ((char *)NULL); |
| } |
| |
| if (valid_parameter_transform (xform) == 0) |
| { |
| this_command_name = oname; |
| #if 0 /* TAG: bash-5.2 Martin Schulte <gnu@schrader-schulte.de> 10/2020 */ |
| return (interactive_shell ? &expand_param_error : &expand_param_fatal); |
| #else |
| return &expand_param_error; |
| #endif |
| } |
| |
| starsub = vtype & VT_STARSUB; |
| vtype &= ~VT_STARSUB; |
| |
| /* If we are asked to display the attributes of an unset variable, V will |
| be NULL after the call to get_var_and_type. Double-check here. */ |
| if ((xc == 'a' || xc == 'A') && vtype == VT_VARIABLE && varname && v == 0) |
| v = find_variable (varname); |
| |
| temp1 = (char *)NULL; /* shut up gcc */ |
| switch (vtype) |
| { |
| case VT_VARIABLE: |
| case VT_ARRAYMEMBER: |
| temp1 = string_transform (xc, v, val); |
| if (vtype == VT_VARIABLE) |
| FREE (val); |
| if (temp1) |
| { |
| val = (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| ? quote_string (temp1) |
| : quote_escapes (temp1); |
| free (temp1); |
| temp1 = val; |
| } |
| break; |
| #if defined (ARRAY_VARS) |
| case VT_ARRAYVAR: |
| temp1 = array_transform (xc, v, starsub, quoted); |
| if (temp1 && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp1 && ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0)) |
| { |
| val = quote_escapes (temp1); |
| free (temp1); |
| temp1 = val; |
| } |
| break; |
| #endif |
| case VT_POSPARMS: |
| temp1 = parameter_list_transform (xc, varname[0], quoted); |
| if (temp1 && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp1 && ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0)) |
| { |
| val = quote_escapes (temp1); |
| free (temp1); |
| temp1 = val; |
| } |
| break; |
| } |
| |
| this_command_name = oname; |
| return temp1; |
| } |
| |
| /******************************************************/ |
| /* */ |
| /* Functions to extract substrings of variable values */ |
| /* */ |
| /******************************************************/ |
| |
| #if defined (HANDLE_MULTIBYTE) |
| /* Character-oriented rather than strictly byte-oriented substrings. S and |
| E, rather being strict indices into STRING, indicate character (possibly |
| multibyte character) positions that require calculation. |
| Used by the ${param:offset[:length]} expansion. */ |
| static char * |
| mb_substring (string, s, e) |
| char *string; |
| int s, e; |
| { |
| char *tt; |
| int start, stop, i; |
| size_t slen; |
| DECLARE_MBSTATE; |
| |
| start = 0; |
| /* Don't need string length in ADVANCE_CHAR unless multibyte chars possible. */ |
| slen = (MB_CUR_MAX > 1) ? STRLEN (string) : 0; |
| |
| i = s; |
| while (string[start] && i--) |
| ADVANCE_CHAR (string, slen, start); |
| stop = start; |
| i = e - s; |
| while (string[stop] && i--) |
| ADVANCE_CHAR (string, slen, stop); |
| tt = substring (string, start, stop); |
| return tt; |
| } |
| #endif |
| |
| /* Process a variable substring expansion: ${name:e1[:e2]}. If VARNAME |
| is `@', use the positional parameters; otherwise, use the value of |
| VARNAME. If VARNAME is an array variable, use the array elements. */ |
| |
| static char * |
| parameter_brace_substring (varname, value, ind, substr, quoted, pflags, flags) |
| char *varname, *value; |
| int ind; |
| char *substr; |
| int quoted, pflags, flags; |
| { |
| intmax_t e1, e2; |
| int vtype, r, starsub; |
| char *temp, *val, *tt, *oname; |
| SHELL_VAR *v; |
| |
| if (value == 0 && ((varname[0] != '@' && varname[0] != '*') || varname[1])) |
| return ((char *)NULL); |
| |
| oname = this_command_name; |
| this_command_name = varname; |
| |
| vtype = get_var_and_type (varname, value, ind, quoted, flags, &v, &val); |
| if (vtype == -1) |
| { |
| this_command_name = oname; |
| return ((char *)NULL); |
| } |
| |
| starsub = vtype & VT_STARSUB; |
| vtype &= ~VT_STARSUB; |
| |
| r = verify_substring_values (v, val, substr, vtype, &e1, &e2); |
| this_command_name = oname; |
| if (r <= 0) |
| { |
| if (vtype == VT_VARIABLE) |
| FREE (val); |
| return ((r == 0) ? &expand_param_error : (char *)NULL); |
| } |
| |
| switch (vtype) |
| { |
| case VT_VARIABLE: |
| case VT_ARRAYMEMBER: |
| #if defined (HANDLE_MULTIBYTE) |
| if (MB_CUR_MAX > 1) |
| tt = mb_substring (val, e1, e2); |
| else |
| #endif |
| tt = substring (val, e1, e2); |
| |
| if (vtype == VT_VARIABLE) |
| FREE (val); |
| if (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) |
| temp = quote_string (tt); |
| else |
| temp = tt ? quote_escapes (tt) : (char *)NULL; |
| FREE (tt); |
| break; |
| case VT_POSPARMS: |
| case VT_ARRAYVAR: |
| if (vtype == VT_POSPARMS) |
| tt = pos_params (varname, e1, e2, quoted, pflags); |
| #if defined (ARRAY_VARS) |
| /* assoc_subrange and array_subrange both call string_list_pos_params, |
| so we can treat this case just like VT_POSPARAMS. */ |
| else if (assoc_p (v)) |
| /* we convert to list and take first e2 elements starting at e1th |
| element -- officially undefined for now */ |
| tt = assoc_subrange (assoc_cell (v), e1, e2, starsub, quoted, pflags); |
| else |
| /* We want E2 to be the number of elements desired (arrays can be |
| sparse, so verify_substring_values just returns the numbers |
| specified and we rely on array_subrange to understand how to |
| deal with them). */ |
| tt = array_subrange (array_cell (v), e1, e2, starsub, quoted, pflags); |
| #endif |
| /* We want to leave this alone in every case where pos_params/ |
| string_list_pos_params quotes the list members */ |
| if (tt && quoted == 0 && ifs_is_null) |
| { |
| temp = tt; /* Posix interp 888 */ |
| } |
| else if (tt && quoted == 0 && (pflags & PF_ASSIGNRHS)) |
| { |
| temp = tt; /* Posix interp 888 */ |
| } |
| else if ((quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) == 0) |
| { |
| temp = tt ? quote_escapes (tt) : (char *)NULL; |
| FREE (tt); |
| } |
| else |
| temp = tt; |
| break; |
| |
| default: |
| temp = (char *)NULL; |
| } |
| |
| return temp; |
| } |
| |
| /****************************************************************/ |
| /* */ |
| /* Functions to perform pattern substitution on variable values */ |
| /* */ |
| /****************************************************************/ |
| |
| #ifdef INCLUDE_UNUSED |
| static int |
| shouldexp_replacement (s) |
| char *s; |
| { |
| register char *p; |
| |
| for (p = s; p && *p; p++) |
| { |
| if (*p == '\\') |
| p++; |
| else if (*p == '&') |
| return 1; |
| } |
| return 0; |
| } |
| #endif |
| |
| char * |
| pat_subst (string, pat, rep, mflags) |
| char *string, *pat, *rep; |
| int mflags; |
| { |
| char *ret, *s, *e, *str, *rstr, *mstr, *send; |
| int rptr, mtype, rxpand, mlen; |
| size_t rsize, l, replen, rslen; |
| DECLARE_MBSTATE; |
| |
| if (string == 0) |
| return (savestring ("")); |
| |
| mtype = mflags & MATCH_TYPEMASK; |
| |
| #if 0 /* TAG: bash-5.2? */ |
| rxpand = (rep && *rep) ? shouldexp_replacement (rep) : 0; |
| #else |
| rxpand = 0; |
| #endif |
| |
| /* Special cases: |
| * 1. A null pattern with mtype == MATCH_BEG means to prefix STRING |
| * with REP and return the result. |
| * 2. A null pattern with mtype == MATCH_END means to append REP to |
| * STRING and return the result. |
| * 3. A null STRING with a matching pattern means to append REP to |
| * STRING and return the result. |
| * These don't understand or process `&' in the replacement string. |
| */ |
| if ((pat == 0 || *pat == 0) && (mtype == MATCH_BEG || mtype == MATCH_END)) |
| { |
| replen = STRLEN (rep); |
| l = STRLEN (string); |
| ret = (char *)xmalloc (replen + l + 2); |
| if (replen == 0) |
| strcpy (ret, string); |
| else if (mtype == MATCH_BEG) |
| { |
| strcpy (ret, rep); |
| strcpy (ret + replen, string); |
| } |
| else |
| { |
| strcpy (ret, string); |
| strcpy (ret + l, rep); |
| } |
| return (ret); |
| } |
| else if (*string == 0 && (match_pattern (string, pat, mtype, &s, &e) != 0)) |
| { |
| replen = STRLEN (rep); |
| ret = (char *)xmalloc (replen + 1); |
| if (replen == 0) |
| ret[0] = '\0'; |
| else |
| strcpy (ret, rep); |
| return (ret); |
| } |
| |
| ret = (char *)xmalloc (rsize = 64); |
| ret[0] = '\0'; |
| send = string + strlen (string); |
| |
| for (replen = STRLEN (rep), rptr = 0, str = string; *str;) |
| { |
| if (match_pattern (str, pat, mtype, &s, &e) == 0) |
| break; |
| l = s - str; |
| |
| if (rep && rxpand) |
| { |
| int x; |
| mlen = e - s; |
| mstr = xmalloc (mlen + 1); |
| for (x = 0; x < mlen; x++) |
| mstr[x] = s[x]; |
| mstr[mlen] = '\0'; |
| rstr = strcreplace (rep, '&', mstr, 0); |
| free (mstr); |
| rslen = strlen (rstr); |
| } |
| else |
| { |
| rstr = rep; |
| rslen = replen; |
| } |
| |
| RESIZE_MALLOCED_BUFFER (ret, rptr, (l + rslen), rsize, 64); |
| |
| /* OK, now copy the leading unmatched portion of the string (from |
| str to s) to ret starting at rptr (the current offset). Then copy |
| the replacement string at ret + rptr + (s - str). Increment |
| rptr (if necessary) and str and go on. */ |
| if (l) |
| { |
| strncpy (ret + rptr, str, l); |
| rptr += l; |
| } |
| if (replen) |
| { |
| strncpy (ret + rptr, rstr, rslen); |
| rptr += rslen; |
| } |
| str = e; /* e == end of match */ |
| |
| if (rstr != rep) |
| free (rstr); |
| |
| if (((mflags & MATCH_GLOBREP) == 0) || mtype != MATCH_ANY) |
| break; |
| |
| if (s == e) |
| { |
| /* On a zero-length match, make sure we copy one character, since |
| we increment one character to avoid infinite recursion. */ |
| char *p, *origp, *origs; |
| size_t clen; |
| |
| RESIZE_MALLOCED_BUFFER (ret, rptr, locale_mb_cur_max, rsize, 64); |
| #if defined (HANDLE_MULTIBYTE) |
| p = origp = ret + rptr; |
| origs = str; |
| COPY_CHAR_P (p, str, send); |
| rptr += p - origp; |
| e += str - origs; |
| #else |
| ret[rptr++] = *str++; |
| e++; /* avoid infinite recursion on zero-length match */ |
| #endif |
| } |
| } |
| |
| /* Now copy the unmatched portion of the input string */ |
| if (str && *str) |
| { |
| RESIZE_MALLOCED_BUFFER (ret, rptr, STRLEN(str) + 1, rsize, 64); |
| strcpy (ret + rptr, str); |
| } |
| else |
| ret[rptr] = '\0'; |
| |
| return ret; |
| } |
| |
| /* Do pattern match and replacement on the positional parameters. */ |
| static char * |
| pos_params_pat_subst (string, pat, rep, mflags) |
| char *string, *pat, *rep; |
| int mflags; |
| { |
| WORD_LIST *save, *params; |
| WORD_DESC *w; |
| char *ret; |
| int pchar, qflags, pflags; |
| |
| save = params = list_rest_of_args (); |
| if (save == 0) |
| return ((char *)NULL); |
| |
| for ( ; params; params = params->next) |
| { |
| ret = pat_subst (params->word->word, pat, rep, mflags); |
| w = alloc_word_desc (); |
| w->word = ret ? ret : savestring (""); |
| dispose_word (params->word); |
| params->word = w; |
| } |
| |
| pchar = (mflags & MATCH_STARSUB) == MATCH_STARSUB ? '*' : '@'; |
| qflags = (mflags & MATCH_QUOTED) == MATCH_QUOTED ? Q_DOUBLE_QUOTES : 0; |
| pflags = (mflags & MATCH_ASSIGNRHS) == MATCH_ASSIGNRHS ? PF_ASSIGNRHS : 0; |
| |
| /* If we are expanding in a context where word splitting will not be |
| performed, treat as quoted. This changes how $* will be expanded. */ |
| if (pchar == '*' && (mflags & MATCH_ASSIGNRHS) && expand_no_split_dollar_star && ifs_is_null) |
| qflags |= Q_DOUBLE_QUOTES; /* Posix interp 888 */ |
| |
| ret = string_list_pos_params (pchar, save, qflags, pflags); |
| dispose_words (save); |
| |
| return (ret); |
| } |
| |
| /* Perform pattern substitution on VALUE, which is the expansion of |
| VARNAME. PATSUB is an expression supplying the pattern to match |
| and the string to substitute. QUOTED is a flags word containing |
| the type of quoting currently in effect. */ |
| static char * |
| parameter_brace_patsub (varname, value, ind, patsub, quoted, pflags, flags) |
| char *varname, *value; |
| int ind; |
| char *patsub; |
| int quoted, pflags, flags; |
| { |
| int vtype, mflags, starsub, delim; |
| char *val, *temp, *pat, *rep, *p, *lpatsub, *tt, *oname; |
| SHELL_VAR *v; |
| |
| if (value == 0) |
| return ((char *)NULL); |
| |
| oname = this_command_name; |
| this_command_name = varname; /* error messages */ |
| |
| vtype = get_var_and_type (varname, value, ind, quoted, flags, &v, &val); |
| if (vtype == -1) |
| { |
| this_command_name = oname; |
| return ((char *)NULL); |
| } |
| |
| starsub = vtype & VT_STARSUB; |
| vtype &= ~VT_STARSUB; |
| |
| mflags = 0; |
| /* PATSUB is never NULL when this is called. */ |
| if (*patsub == '/') |
| { |
| mflags |= MATCH_GLOBREP; |
| patsub++; |
| } |
| |
| /* Malloc this because expand_string_if_necessary or one of the expansion |
| functions in its call chain may free it on a substitution error. */ |
| lpatsub = savestring (patsub); |
| |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| mflags |= MATCH_QUOTED; |
| |
| if (starsub) |
| mflags |= MATCH_STARSUB; |
| |
| if (pflags & PF_ASSIGNRHS) |
| mflags |= MATCH_ASSIGNRHS; |
| |
| /* If the pattern starts with a `/', make sure we skip over it when looking |
| for the replacement delimiter. */ |
| delim = skip_to_delim (lpatsub, ((*patsub == '/') ? 1 : 0), "/", 0); |
| if (lpatsub[delim] == '/') |
| { |
| lpatsub[delim] = 0; |
| rep = lpatsub + delim + 1; |
| } |
| else |
| rep = (char *)NULL; |
| |
| if (rep && *rep == '\0') |
| rep = (char *)NULL; |
| |
| /* Perform the same expansions on the pattern as performed by the |
| pattern removal expansions. */ |
| pat = getpattern (lpatsub, quoted, 1); |
| |
| if (rep) |
| { |
| /* We want to perform quote removal on the expanded replacement even if |
| the entire expansion is double-quoted because the parser and string |
| extraction functions treated quotes in the replacement string as |
| special. THIS IS NOT BACKWARDS COMPATIBLE WITH BASH-4.2. */ |
| if (shell_compatibility_level > 42) |
| rep = expand_string_if_necessary (rep, quoted & ~(Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT), expand_string_unsplit); |
| /* This is the bash-4.2 code. */ |
| else if ((mflags & MATCH_QUOTED) == 0) |
| rep = expand_string_if_necessary (rep, quoted, expand_string_unsplit); |
| else |
| rep = expand_string_to_string_internal (rep, quoted, expand_string_unsplit); |
| } |
| |
| /* ksh93 doesn't allow the match specifier to be a part of the expanded |
| pattern. This is an extension. Make sure we don't anchor the pattern |
| at the beginning or end of the string if we're doing global replacement, |
| though. */ |
| p = pat; |
| if (mflags & MATCH_GLOBREP) |
| mflags |= MATCH_ANY; |
| else if (pat && pat[0] == '#') |
| { |
| mflags |= MATCH_BEG; |
| p++; |
| } |
| else if (pat && pat[0] == '%') |
| { |
| mflags |= MATCH_END; |
| p++; |
| } |
| else |
| mflags |= MATCH_ANY; |
| |
| /* OK, we now want to substitute REP for PAT in VAL. If |
| flags & MATCH_GLOBREP is non-zero, the substitution is done |
| everywhere, otherwise only the first occurrence of PAT is |
| replaced. The pattern matching code doesn't understand |
| CTLESC quoting CTLESC and CTLNUL so we use the dequoted variable |
| values passed in (VT_VARIABLE) so the pattern substitution |
| code works right. We need to requote special chars after |
| we're done for VT_VARIABLE and VT_ARRAYMEMBER, and for the |
| other cases if QUOTED == 0, since the posparams and arrays |
| indexed by * or @ do special things when QUOTED != 0. */ |
| |
| switch (vtype) |
| { |
| case VT_VARIABLE: |
| case VT_ARRAYMEMBER: |
| temp = pat_subst (val, p, rep, mflags); |
| if (vtype == VT_VARIABLE) |
| FREE (val); |
| if (temp) |
| { |
| tt = (mflags & MATCH_QUOTED) ? quote_string (temp) : quote_escapes (temp); |
| free (temp); |
| temp = tt; |
| } |
| break; |
| case VT_POSPARMS: |
| /* This does the right thing for the case where we are not performing |
| word splitting. MATCH_STARSUB restricts it to ${* /foo/bar}, and |
| pos_params_pat_subst/string_list_pos_params will do the right thing |
| in turn for the case where ifs_is_null. Posix interp 888 */ |
| if ((pflags & PF_NOSPLIT2) && (mflags & MATCH_STARSUB)) |
| mflags |= MATCH_ASSIGNRHS; |
| temp = pos_params_pat_subst (val, p, rep, mflags); |
| if (temp && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp && quoted == 0 && (pflags & PF_ASSIGNRHS)) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp && (mflags & MATCH_QUOTED) == 0) |
| { |
| tt = quote_escapes (temp); |
| free (temp); |
| temp = tt; |
| } |
| break; |
| #if defined (ARRAY_VARS) |
| case VT_ARRAYVAR: |
| /* If we are expanding in a context where word splitting will not be |
| performed, treat as quoted. This changes how ${A[*]} will be |
| expanded to make it identical to $*. */ |
| if ((mflags & MATCH_STARSUB) && (mflags & MATCH_ASSIGNRHS) && ifs_is_null) |
| mflags |= MATCH_QUOTED; /* Posix interp 888 */ |
| |
| /* these eventually call string_list_pos_params */ |
| if (assoc_p (v)) |
| temp = assoc_patsub (assoc_cell (v), p, rep, mflags); |
| else |
| temp = array_patsub (array_cell (v), p, rep, mflags); |
| |
| if (temp && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp && (mflags & MATCH_QUOTED) == 0) |
| { |
| tt = quote_escapes (temp); |
| free (temp); |
| temp = tt; |
| } |
| break; |
| #endif |
| } |
| |
| FREE (pat); |
| FREE (rep); |
| free (lpatsub); |
| |
| this_command_name = oname; |
| |
| return temp; |
| } |
| |
| /****************************************************************/ |
| /* */ |
| /* Functions to perform case modification on variable values */ |
| /* */ |
| /****************************************************************/ |
| |
| /* Do case modification on the positional parameters. */ |
| |
| static char * |
| pos_params_modcase (string, pat, modop, mflags) |
| char *string, *pat; |
| int modop; |
| int mflags; |
| { |
| WORD_LIST *save, *params; |
| WORD_DESC *w; |
| char *ret; |
| int pchar, qflags, pflags; |
| |
| save = params = list_rest_of_args (); |
| if (save == 0) |
| return ((char *)NULL); |
| |
| for ( ; params; params = params->next) |
| { |
| ret = sh_modcase (params->word->word, pat, modop); |
| w = alloc_word_desc (); |
| w->word = ret ? ret : savestring (""); |
| dispose_word (params->word); |
| params->word = w; |
| } |
| |
| pchar = (mflags & MATCH_STARSUB) == MATCH_STARSUB ? '*' : '@'; |
| qflags = (mflags & MATCH_QUOTED) == MATCH_QUOTED ? Q_DOUBLE_QUOTES : 0; |
| pflags = (mflags & MATCH_ASSIGNRHS) == MATCH_ASSIGNRHS ? PF_ASSIGNRHS : 0; |
| |
| /* If we are expanding in a context where word splitting will not be |
| performed, treat as quoted. This changes how $* will be expanded. */ |
| if (pchar == '*' && (mflags & MATCH_ASSIGNRHS) && ifs_is_null) |
| qflags |= Q_DOUBLE_QUOTES; /* Posix interp 888 */ |
| |
| ret = string_list_pos_params (pchar, save, qflags, pflags); |
| dispose_words (save); |
| |
| return (ret); |
| } |
| |
| /* Perform case modification on VALUE, which is the expansion of |
| VARNAME. MODSPEC is an expression supplying the type of modification |
| to perform. QUOTED is a flags word containing the type of quoting |
| currently in effect. */ |
| static char * |
| parameter_brace_casemod (varname, value, ind, modspec, patspec, quoted, pflags, flags) |
| char *varname, *value; |
| int ind, modspec; |
| char *patspec; |
| int quoted, pflags, flags; |
| { |
| int vtype, starsub, modop, mflags, x; |
| char *val, *temp, *pat, *p, *lpat, *tt, *oname; |
| SHELL_VAR *v; |
| |
| if (value == 0) |
| return ((char *)NULL); |
| |
| oname = this_command_name; |
| this_command_name = varname; |
| |
| vtype = get_var_and_type (varname, value, ind, quoted, flags, &v, &val); |
| if (vtype == -1) |
| { |
| this_command_name = oname; |
| return ((char *)NULL); |
| } |
| |
| starsub = vtype & VT_STARSUB; |
| vtype &= ~VT_STARSUB; |
| |
| modop = 0; |
| mflags = 0; |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| mflags |= MATCH_QUOTED; |
| if (starsub) |
| mflags |= MATCH_STARSUB; |
| if (pflags & PF_ASSIGNRHS) |
| mflags |= MATCH_ASSIGNRHS; |
| |
| p = patspec; |
| if (modspec == '^') |
| { |
| x = p && p[0] == modspec; |
| modop = x ? CASE_UPPER : CASE_UPFIRST; |
| p += x; |
| } |
| else if (modspec == ',') |
| { |
| x = p && p[0] == modspec; |
| modop = x ? CASE_LOWER : CASE_LOWFIRST; |
| p += x; |
| } |
| else if (modspec == '~') |
| { |
| x = p && p[0] == modspec; |
| modop = x ? CASE_TOGGLEALL : CASE_TOGGLE; |
| p += x; |
| } |
| |
| lpat = p ? savestring (p) : 0; |
| /* Perform the same expansions on the pattern as performed by the |
| pattern removal expansions. */ |
| pat = lpat ? getpattern (lpat, quoted, 1) : 0; |
| |
| /* OK, now we do the case modification. */ |
| switch (vtype) |
| { |
| case VT_VARIABLE: |
| case VT_ARRAYMEMBER: |
| temp = sh_modcase (val, pat, modop); |
| if (vtype == VT_VARIABLE) |
| FREE (val); |
| if (temp) |
| { |
| tt = (mflags & MATCH_QUOTED) ? quote_string (temp) : quote_escapes (temp); |
| free (temp); |
| temp = tt; |
| } |
| break; |
| |
| case VT_POSPARMS: |
| temp = pos_params_modcase (val, pat, modop, mflags); |
| if (temp && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp && (mflags & MATCH_QUOTED) == 0) |
| { |
| tt = quote_escapes (temp); |
| free (temp); |
| temp = tt; |
| } |
| break; |
| |
| #if defined (ARRAY_VARS) |
| case VT_ARRAYVAR: |
| /* If we are expanding in a context where word splitting will not be |
| performed, treat as quoted. This changes how ${A[*]} will be |
| expanded to make it identical to $*. */ |
| if ((mflags & MATCH_STARSUB) && (mflags & MATCH_ASSIGNRHS) && ifs_is_null) |
| mflags |= MATCH_QUOTED; /* Posix interp 888 */ |
| |
| temp = assoc_p (v) ? assoc_modcase (assoc_cell (v), pat, modop, mflags) |
| : array_modcase (array_cell (v), pat, modop, mflags); |
| |
| if (temp && quoted == 0 && ifs_is_null) |
| { |
| /* Posix interp 888 */ |
| } |
| else if (temp && (mflags & MATCH_QUOTED) == 0) |
| { |
| tt = quote_escapes (temp); |
| free (temp); |
| temp = tt; |
| } |
| |
| break; |
| #endif |
| } |
| |
| FREE (pat); |
| free (lpat); |
| |
| this_command_name = oname; |
| |
| return temp; |
| } |
| |
| /* Check for unbalanced parens in S, which is the contents of $(( ... )). If |
| any occur, this must be a nested command substitution, so return 0. |
| Otherwise, return 1. A valid arithmetic expression must always have a |
| ( before a matching ), so any cases where there are more right parens |
| means that this must not be an arithmetic expression, though the parser |
| will not accept it without a balanced total number of parens. */ |
| static int |
| chk_arithsub (s, len) |
| const char *s; |
| int len; |
| { |
| int i, count; |
| DECLARE_MBSTATE; |
| |
| i = count = 0; |
| while (i < len) |
| { |
| if (s[i] == LPAREN) |
| count++; |
| else if (s[i] == RPAREN) |
| { |
| count--; |
| if (count < 0) |
| return 0; |
| } |
| |
| switch (s[i]) |
| { |
| default: |
| ADVANCE_CHAR (s, len, i); |
| break; |
| |
| case '\\': |
| i++; |
| if (s[i]) |
| ADVANCE_CHAR (s, len, i); |
| break; |
| |
| case '\'': |
| i = skip_single_quoted (s, len, ++i, 0); |
| break; |
| |
| case '"': |
| i = skip_double_quoted ((char *)s, len, ++i, 0); |
| break; |
| } |
| } |
| |
| return (count == 0); |
| } |
| |
| /****************************************************************/ |
| /* */ |
| /* Functions to perform parameter expansion on a string */ |
| /* */ |
| /****************************************************************/ |
| |
| /* ${[#][!]name[[:][^[^]][,[,]]#[#]%[%]-=?+[word][:e1[:e2]]]} */ |
| static WORD_DESC * |
| parameter_brace_expand (string, indexp, quoted, pflags, quoted_dollar_atp, contains_dollar_at) |
| char *string; |
| int *indexp, quoted, pflags, *quoted_dollar_atp, *contains_dollar_at; |
| { |
| int check_nullness, var_is_set, var_is_null, var_is_special; |
| int want_substring, want_indir, want_patsub, want_casemod, want_attributes; |
| char *name, *value, *temp, *temp1; |
| WORD_DESC *tdesc, *ret; |
| int t_index, sindex, c, tflag, modspec, local_pflags, all_element_arrayref; |
| intmax_t number; |
| arrayind_t ind; |
| |
| temp = temp1 = value = (char *)NULL; |
| var_is_set = var_is_null = var_is_special = check_nullness = 0; |
| want_substring = want_indir = want_patsub = want_casemod = want_attributes = 0; |
| |
| local_pflags = 0; |
| all_element_arrayref = 0; |
| |
| sindex = *indexp; |
| t_index = ++sindex; |
| /* ${#var} doesn't have any of the other parameter expansions on it. */ |
| if (string[t_index] == '#' && legal_variable_starter (string[t_index+1])) /* {{ */ |
| name = string_extract (string, &t_index, "}", SX_VARNAME); |
| else |
| #if defined (CASEMOD_EXPANSIONS) |
| /* To enable case-toggling expansions using the `~' operator character |
| define CASEMOD_TOGGLECASE in config-top.h */ |
| # if defined (CASEMOD_TOGGLECASE) |
| name = string_extract (string, &t_index, "#%^,~:-=?+/@}", SX_VARNAME); |
| # else |
| name = string_extract (string, &t_index, "#%^,:-=?+/@}", SX_VARNAME); |
| # endif /* CASEMOD_TOGGLECASE */ |
| #else |
| name = string_extract (string, &t_index, "#%:-=?+/@}", SX_VARNAME); |
| #endif /* CASEMOD_EXPANSIONS */ |
| |
| /* Handle ${@[stuff]} now that @ is a word expansion operator. Not exactly |
| the cleanest code ever. */ |
| if (*name == 0 && sindex == t_index && string[sindex] == '@') |
| { |
| name = (char *)xrealloc (name, 2); |
| name[0] = '@'; |
| name[1] = '\0'; |
| t_index++; |
| } |
| else if (*name == '!' && t_index > sindex && string[t_index] == '@' && string[t_index+1] == RBRACE) |
| { |
| name = (char *)xrealloc (name, t_index - sindex + 2); |
| name[t_index - sindex] = '@'; |
| name[t_index - sindex + 1] = '\0'; |
| t_index++; |
| } |
| |
| ret = 0; |
| tflag = 0; |
| |
| ind = INTMAX_MIN; |
| |
| /* If the name really consists of a special variable, then make sure |
| that we have the entire name. We don't allow indirect references |
| to special variables except `#', `?', `@' and `*'. This clause is |
| designed to handle ${#SPECIAL} and ${!SPECIAL}, not anything more |
| general. */ |
| if ((sindex == t_index && VALID_SPECIAL_LENGTH_PARAM (string[t_index])) || |
| (sindex == t_index && string[sindex] == '#' && VALID_SPECIAL_LENGTH_PARAM (string[sindex + 1])) || |
| (sindex == t_index - 1 && string[sindex] == '!' && VALID_INDIR_PARAM (string[t_index]))) |
| { |
| t_index++; |
| temp1 = string_extract (string, &t_index, "#%:-=?+/@}", 0); |
| name = (char *)xrealloc (name, 3 + (strlen (temp1))); |
| *name = string[sindex]; |
| if (string[sindex] == '!') |
| { |
| /* indirect reference of $#, $?, $@, or $* */ |
| name[1] = string[sindex + 1]; |
| strcpy (name + 2, temp1); |
| } |
| else |
| strcpy (name + 1, temp1); |
| free (temp1); |
| } |
| sindex = t_index; |
| |
| /* Find out what character ended the variable name. Then |
| do the appropriate thing. */ |
| if (c = string[sindex]) |
| sindex++; |
| |
| /* If c is followed by one of the valid parameter expansion |
| characters, move past it as normal. If not, assume that |
| a substring specification is being given, and do not move |
| past it. */ |
| if (c == ':' && VALID_PARAM_EXPAND_CHAR (string[sindex])) |
| { |
| check_nullness++; |
| if (c = string[sindex]) |
| sindex++; |
| } |
| else if (c == ':' && string[sindex] != RBRACE) |
| want_substring = 1; |
| else if (c == '/' /* && string[sindex] != RBRACE */) /* XXX */ |
| want_patsub = 1; |
| #if defined (CASEMOD_EXPANSIONS) |
| else if (c == '^' || c == ',' || c == '~') |
| { |
| modspec = c; |
| want_casemod = 1; |
| } |
| #endif |
| else if (c == '@' && (string[sindex] == 'a' || string[sindex] == 'A') && string[sindex+1] == RBRACE) |
| { |
| /* special case because we do not want to shortcut foo as foo[0] here */ |
| want_attributes = 1; |
| local_pflags |= PF_ALLINDS; |
| } |
| |
| /* Catch the valid and invalid brace expressions that made it through the |
| tests above. */ |
| /* ${#-} is a valid expansion and means to take the length of $-. |
| Similarly for ${#?} and ${##}... */ |
| if (name[0] == '#' && name[1] == '\0' && check_nullness == 0 && |
| VALID_SPECIAL_LENGTH_PARAM (c) && string[sindex] == RBRACE) |
| { |
| name = (char *)xrealloc (name, 3); |
| name[1] = c; |
| name[2] = '\0'; |
| c = string[sindex++]; |
| } |
| |
| /* ...but ${#%}, ${#:}, ${#=}, ${#+}, and ${#/} are errors. */ |
| if (name[0] == '#' && name[1] == '\0' && check_nullness == 0 && |
| member (c, "%:=+/") && string[sindex] == RBRACE) |
| { |
| temp = (char *)NULL; |
| goto bad_substitution; /* XXX - substitution error */ |
| } |
| |
| /* Indirect expansion begins with a `!'. A valid indirect expansion is |
| either a variable name, one of the positional parameters or a special |
| variable that expands to one of the positional parameters. */ |
| want_indir = *name == '!' && |
| (legal_variable_starter ((unsigned char)name[1]) || DIGIT (name[1]) |
| || VALID_INDIR_PARAM (name[1])); |
| |
| /* Determine the value of this variable whose name is NAME. */ |
| |
| /* Check for special variables, directly referenced. */ |
| if (SPECIAL_VAR (name, want_indir)) |
| var_is_special++; |
| |
| /* Check for special expansion things, like the length of a parameter */ |
| if (*name == '#' && name[1]) |
| { |
| /* If we are not pointing at the character just after the |
| closing brace, then we haven't gotten all of the name. |
| Since it begins with a special character, this is a bad |
| substitution. Also check NAME for validity before trying |
| to go on. */ |
| if (string[sindex - 1] != RBRACE || (valid_length_expression (name) == 0)) |
| { |
| temp = (char *)NULL; |
| goto bad_substitution; /* substitution error */ |
| } |
| |
| number = parameter_brace_expand_length (name); |
| if (number == INTMAX_MIN && unbound_vars_is_error) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (name+1); |
| free (name); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| free (name); |
| |
| *indexp = sindex; |
| if (number < 0) |
| return (&expand_wdesc_error); |
| else |
| { |
| ret = alloc_word_desc (); |
| ret->word = itos (number); |
| return ret; |
| } |
| } |
| |
| /* ${@} is identical to $@. */ |
| if (name[0] == '@' && name[1] == '\0') |
| { |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 1; |
| |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| |
| tflag |= W_DOLLARAT; |
| } |
| |
| /* Process ${!PREFIX*} expansion. */ |
| if (want_indir && string[sindex - 1] == RBRACE && |
| (string[sindex - 2] == '*' || string[sindex - 2] == '@') && |
| legal_variable_starter ((unsigned char) name[1])) |
| { |
| char **x; |
| WORD_LIST *xlist; |
| |
| temp1 = savestring (name + 1); |
| number = strlen (temp1); |
| temp1[number - 1] = '\0'; |
| x = all_variables_matching_prefix (temp1); |
| xlist = strvec_to_word_list (x, 0, 0); |
| if (string[sindex - 2] == '*') |
| temp = string_list_dollar_star (xlist, quoted, 0); |
| else |
| { |
| temp = string_list_dollar_at (xlist, quoted, 0); |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 1; |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| |
| tflag |= W_DOLLARAT; |
| } |
| free (x); |
| dispose_words (xlist); |
| free (temp1); |
| *indexp = sindex; |
| |
| free (name); |
| |
| ret = alloc_word_desc (); |
| ret->word = temp; |
| ret->flags = tflag; /* XXX */ |
| return ret; |
| } |
| |
| #if defined (ARRAY_VARS) |
| /* Process ${!ARRAY[@]} and ${!ARRAY[*]} expansion. */ |
| if (want_indir && string[sindex - 1] == RBRACE && |
| string[sindex - 2] == RBRACK && valid_array_reference (name+1, 0)) |
| { |
| char *x, *x1; |
| |
| temp1 = savestring (name + 1); |
| x = array_variable_name (temp1, 0, &x1, (int *)0); |
| FREE (x); |
| if (ALL_ELEMENT_SUB (x1[0]) && x1[1] == RBRACK) |
| { |
| temp = array_keys (temp1, quoted, pflags); /* handles assoc vars too */ |
| if (x1[0] == '@') |
| { |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 1; |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| |
| tflag |= W_DOLLARAT; |
| } |
| |
| free (name); |
| free (temp1); |
| *indexp = sindex; |
| |
| ret = alloc_word_desc (); |
| ret->word = temp; |
| ret->flags = tflag; /* XXX */ |
| return ret; |
| } |
| |
| free (temp1); |
| } |
| #endif /* ARRAY_VARS */ |
| |
| /* Make sure that NAME is valid before trying to go on. */ |
| if (valid_brace_expansion_word (want_indir ? name + 1 : name, |
| var_is_special) == 0) |
| { |
| temp = (char *)NULL; |
| goto bad_substitution; /* substitution error */ |
| } |
| |
| if (want_indir) |
| { |
| tdesc = parameter_brace_expand_indir (name + 1, var_is_special, quoted, pflags|local_pflags, quoted_dollar_atp, contains_dollar_at); |
| if (tdesc == &expand_wdesc_error || tdesc == &expand_wdesc_fatal) |
| { |
| temp = (char *)NULL; |
| goto bad_substitution; |
| } |
| |
| /* Turn off the W_ARRAYIND flag because there is no way for this function |
| to return the index we're supposed to be using. */ |
| if (tdesc && tdesc->flags) |
| tdesc->flags &= ~W_ARRAYIND; |
| } |
| else |
| { |
| local_pflags |= PF_IGNUNBOUND|(pflags&(PF_NOSPLIT2|PF_ASSIGNRHS)); |
| tdesc = parameter_brace_expand_word (name, var_is_special, quoted, local_pflags, &ind); |
| } |
| |
| if (tdesc == &expand_wdesc_error || tdesc == &expand_wdesc_fatal) |
| { |
| tflag = 0; |
| tdesc = 0; |
| } |
| |
| if (tdesc) |
| { |
| temp = tdesc->word; |
| tflag = tdesc->flags; |
| dispose_word_desc (tdesc); |
| } |
| else |
| temp = (char *)0; |
| |
| if (temp == &expand_param_error || temp == &expand_param_fatal) |
| { |
| FREE (name); |
| FREE (value); |
| return (temp == &expand_param_error ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| |
| #if defined (ARRAY_VARS) |
| if (valid_array_reference (name, 0)) |
| { |
| int qflags; |
| char *t; |
| |
| qflags = quoted; |
| /* If in a context where word splitting will not take place, treat as |
| if double-quoted. Has effects with $* and ${array[*]} */ |
| |
| if (pflags & PF_ASSIGNRHS) |
| qflags |= Q_DOUBLE_QUOTES; |
| /* We duplicate a little code here */ |
| t = mbschr (name, LBRACK); |
| if (t && ALL_ELEMENT_SUB (t[1]) && t[2] == RBRACK) |
| { |
| all_element_arrayref = 1; |
| if (expand_no_split_dollar_star && t[1] == '*') /* XXX */ |
| qflags |= Q_DOUBLE_QUOTES; |
| } |
| chk_atstar (name, qflags, pflags, quoted_dollar_atp, contains_dollar_at); |
| } |
| #endif |
| |
| var_is_set = temp != (char *)0; |
| var_is_null = check_nullness && (var_is_set == 0 || *temp == 0); |
| /* XXX - this may not need to be restricted to special variables */ |
| if (check_nullness) |
| var_is_null |= var_is_set && var_is_special && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && QUOTED_NULL (temp); |
| #if defined (ARRAY_VARS) |
| if (check_nullness) |
| var_is_null |= var_is_set && |
| (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && |
| QUOTED_NULL (temp) && |
| valid_array_reference (name, 0) && |
| chk_atstar (name, 0, 0, (int *)0, (int *)0); |
| #endif |
| |
| /* Get the rest of the stuff inside the braces. */ |
| if (c && c != RBRACE) |
| { |
| /* Extract the contents of the ${ ... } expansion |
| according to the Posix.2 rules. */ |
| value = extract_dollar_brace_string (string, &sindex, quoted, (c == '%' || c == '#' || c =='/' || c == '^' || c == ',' || c ==':') ? SX_POSIXEXP|SX_WORD : SX_WORD); |
| if (string[sindex] == RBRACE) |
| sindex++; |
| else |
| goto bad_substitution; /* substitution error */ |
| } |
| else |
| value = (char *)NULL; |
| |
| *indexp = sindex; |
| |
| /* All the cases where an expansion can possibly generate an unbound |
| variable error. */ |
| if (want_substring || want_patsub || want_casemod || c == '@' || c == '#' || c == '%' || c == RBRACE) |
| { |
| if (var_is_set == 0 && unbound_vars_is_error && ((name[0] != '@' && name[0] != '*') || name[1]) && all_element_arrayref == 0) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (name); |
| FREE (value); |
| FREE (temp); |
| free (name); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| } |
| |
| /* If this is a substring spec, process it and add the result. */ |
| if (want_substring) |
| { |
| temp1 = parameter_brace_substring (name, temp, ind, value, quoted, pflags, (tflag & W_ARRAYIND) ? AV_USEIND : 0); |
| FREE (value); |
| FREE (temp); |
| |
| if (temp1 == &expand_param_error || temp1 == &expand_param_fatal) |
| { |
| FREE (name); |
| return (temp1 == &expand_param_error ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| |
| ret = alloc_word_desc (); |
| ret->word = temp1; |
| /* We test quoted_dollar_atp because we want variants with double-quoted |
| "$@" to take a different code path. In fact, we make sure at the end |
| of expand_word_internal that we're only looking at these flags if |
| quoted_dollar_at == 0. */ |
| if (temp1 && |
| (quoted_dollar_atp == 0 || *quoted_dollar_atp == 0) && |
| QUOTED_NULL (temp1) && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ret->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| else if (temp1 && (name[0] == '*' && name[1] == 0) && quoted == 0 && |
| (pflags & PF_ASSIGNRHS)) |
| ret->flags |= W_SPLITSPACE; /* Posix interp 888 */ |
| /* Special handling for $* when unquoted and $IFS is null. Posix interp 888 */ |
| else if (temp1 && (name[0] == '*' && name[1] == 0) && quoted == 0 && ifs_is_null) |
| ret->flags |= W_SPLITSPACE; /* Posix interp 888 */ |
| |
| FREE (name); |
| return ret; |
| } |
| else if (want_patsub) |
| { |
| temp1 = parameter_brace_patsub (name, temp, ind, value, quoted, pflags, (tflag & W_ARRAYIND) ? AV_USEIND : 0); |
| FREE (value); |
| FREE (temp); |
| |
| if (temp1 == &expand_param_error || temp1 == &expand_param_fatal) |
| { |
| FREE (name); |
| return (temp1 == &expand_param_error ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| |
| ret = alloc_word_desc (); |
| ret->word = temp1; |
| if (temp1 && |
| (quoted_dollar_atp == 0 || *quoted_dollar_atp == 0) && |
| QUOTED_NULL (temp1) && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ret->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| /* Special handling for $* when unquoted and $IFS is null. Posix interp 888 */ |
| else if (temp1 && (name[0] == '*' && name[1] == 0) && quoted == 0 && ifs_is_null) |
| ret->flags |= W_SPLITSPACE; /* Posix interp 888 */ |
| |
| FREE (name); |
| return ret; |
| } |
| #if defined (CASEMOD_EXPANSIONS) |
| else if (want_casemod) |
| { |
| temp1 = parameter_brace_casemod (name, temp, ind, modspec, value, quoted, pflags, (tflag & W_ARRAYIND) ? AV_USEIND : 0); |
| FREE (value); |
| FREE (temp); |
| |
| if (temp1 == &expand_param_error || temp1 == &expand_param_fatal) |
| { |
| FREE (name); |
| return (temp1 == &expand_param_error ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| |
| ret = alloc_word_desc (); |
| ret->word = temp1; |
| if (temp1 && |
| (quoted_dollar_atp == 0 || *quoted_dollar_atp == 0) && |
| QUOTED_NULL (temp1) && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ret->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| /* Special handling for $* when unquoted and $IFS is null. Posix interp 888 */ |
| else if (temp1 && (name[0] == '*' && name[1] == 0) && quoted == 0 && ifs_is_null) |
| ret->flags |= W_SPLITSPACE; /* Posix interp 888 */ |
| |
| FREE (name); |
| return ret; |
| } |
| #endif |
| |
| /* Do the right thing based on which character ended the variable name. */ |
| switch (c) |
| { |
| default: |
| case '\0': |
| bad_substitution: |
| set_exit_status (EXECUTION_FAILURE); |
| report_error (_("%s: bad substitution"), string ? string : "??"); |
| FREE (value); |
| FREE (temp); |
| free (name); |
| if (shell_compatibility_level <= 43) |
| return &expand_wdesc_error; |
| else |
| return ((posixly_correct && interactive_shell == 0) ? &expand_wdesc_fatal : &expand_wdesc_error); |
| |
| case RBRACE: |
| break; |
| |
| case '@': |
| temp1 = parameter_brace_transform (name, temp, ind, value, c, quoted, pflags, (tflag & W_ARRAYIND) ? AV_USEIND : 0); |
| free (temp); |
| free (value); |
| |
| if (temp1 == &expand_param_error || temp1 == &expand_param_fatal) |
| { |
| free (name); |
| set_exit_status (EXECUTION_FAILURE); |
| report_error (_("%s: bad substitution"), string ? string : "??"); |
| return (temp1 == &expand_param_error ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| |
| ret = alloc_word_desc (); |
| ret->word = temp1; |
| if (temp1 && QUOTED_NULL (temp1) && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ret->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| /* Special handling for $* when unquoted and $IFS is null. Posix interp 888 */ |
| else if (temp1 && (name[0] == '*' && name[1] == 0) && quoted == 0 && ifs_is_null) |
| ret->flags |= W_SPLITSPACE; /* Posix interp 888 */ |
| |
| free (name); |
| return ret; |
| |
| case '#': /* ${param#[#]pattern} */ |
| case '%': /* ${param%[%]pattern} */ |
| if (value == 0 || *value == '\0' || temp == 0 || *temp == '\0') |
| { |
| FREE (value); |
| break; |
| } |
| temp1 = parameter_brace_remove_pattern (name, temp, ind, value, c, quoted, (tflag & W_ARRAYIND) ? AV_USEIND : 0); |
| free (temp); |
| free (value); |
| |
| ret = alloc_word_desc (); |
| ret->word = temp1; |
| if (temp1 && QUOTED_NULL (temp1) && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ret->flags |= W_QUOTED|W_HASQUOTEDNULL; |
| /* Special handling for $* when unquoted and $IFS is null. Posix interp 888 */ |
| else if (temp1 && (name[0] == '*' && name[1] == 0) && quoted == 0 && ifs_is_null) |
| ret->flags |= W_SPLITSPACE; /* Posix interp 888 */ |
| |
| free (name); |
| return ret; |
| |
| case '-': |
| case '=': |
| case '?': |
| case '+': |
| if (var_is_set && var_is_null == 0) |
| { |
| /* If the operator is `+', we don't want the value of the named |
| variable for anything, just the value of the right hand side. */ |
| if (c == '+') |
| { |
| /* XXX -- if we're double-quoted and the named variable is "$@", |
| we want to turn off any special handling of "$@" -- |
| we're not using it, so whatever is on the rhs applies. */ |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 0; |
| if (contains_dollar_at) |
| *contains_dollar_at = 0; |
| |
| FREE (temp); |
| if (value) |
| { |
| /* From Posix discussion on austin-group list. Issue 221 |
| requires that backslashes escaping `}' inside |
| double-quoted ${...} be removed. */ |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| quoted |= Q_DOLBRACE; |
| ret = parameter_brace_expand_rhs (name, value, c, |
| quoted, |
| pflags, |
| quoted_dollar_atp, |
| contains_dollar_at); |
| /* XXX - fix up later, esp. noting presence of |
| W_HASQUOTEDNULL in ret->flags */ |
| free (value); |
| } |
| else |
| temp = (char *)NULL; |
| } |
| else |
| { |
| FREE (value); |
| } |
| /* Otherwise do nothing; just use the value in TEMP. */ |
| } |
| else /* VAR not set or VAR is NULL. */ |
| { |
| FREE (temp); |
| temp = (char *)NULL; |
| if (c == '=' && var_is_special) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| report_error (_("$%s: cannot assign in this way"), name); |
| free (name); |
| free (value); |
| return &expand_wdesc_error; |
| } |
| else if (c == '?') |
| { |
| parameter_brace_expand_error (name, value, check_nullness); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| else if (c != '+') |
| { |
| /* XXX -- if we're double-quoted and the named variable is "$@", |
| we want to turn off any special handling of "$@" -- |
| we're not using it, so whatever is on the rhs applies. */ |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && quoted_dollar_atp) |
| *quoted_dollar_atp = 0; |
| if (contains_dollar_at) |
| *contains_dollar_at = 0; |
| |
| /* From Posix discussion on austin-group list. Issue 221 requires |
| that backslashes escaping `}' inside double-quoted ${...} be |
| removed. */ |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| quoted |= Q_DOLBRACE; |
| ret = parameter_brace_expand_rhs (name, value, c, quoted, pflags, |
| quoted_dollar_atp, |
| contains_dollar_at); |
| /* XXX - fix up later, esp. noting presence of |
| W_HASQUOTEDNULL in tdesc->flags */ |
| } |
| free (value); |
| } |
| |
| break; |
| } |
| free (name); |
| |
| if (ret == 0) |
| { |
| ret = alloc_word_desc (); |
| ret->flags = tflag; |
| ret->word = temp; |
| } |
| return (ret); |
| } |
| |
| /* Expand a single ${xxx} expansion. The braces are optional. When |
| the braces are used, parameter_brace_expand() does the work, |
| possibly calling param_expand recursively. */ |
| static WORD_DESC * |
| param_expand (string, sindex, quoted, expanded_something, |
| contains_dollar_at, quoted_dollar_at_p, had_quoted_null_p, |
| pflags) |
| char *string; |
| int *sindex, quoted, *expanded_something, *contains_dollar_at; |
| int *quoted_dollar_at_p, *had_quoted_null_p, pflags; |
| { |
| char *temp, *temp1, uerror[3], *savecmd; |
| int zindex, t_index, expok; |
| unsigned char c; |
| intmax_t number; |
| SHELL_VAR *var; |
| WORD_LIST *list, *l; |
| WORD_DESC *tdesc, *ret; |
| int tflag, nullarg; |
| |
| /*itrace("param_expand: `%s' pflags = %d", string+*sindex, pflags);*/ |
| zindex = *sindex; |
| c = string[++zindex]; |
| |
| temp = (char *)NULL; |
| ret = tdesc = (WORD_DESC *)NULL; |
| tflag = 0; |
| |
| /* Do simple cases first. Switch on what follows '$'. */ |
| switch (c) |
| { |
| /* $0 .. $9? */ |
| case '0': |
| case '1': |
| case '2': |
| case '3': |
| case '4': |
| case '5': |
| case '6': |
| case '7': |
| case '8': |
| case '9': |
| temp1 = dollar_vars[TODIGIT (c)]; |
| /* This doesn't get called when (pflags&PF_IGNUNBOUND) != 0 */ |
| if (unbound_vars_is_error && temp1 == (char *)NULL) |
| { |
| uerror[0] = '$'; |
| uerror[1] = c; |
| uerror[2] = '\0'; |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (uerror); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| if (temp1) |
| temp = (*temp1 && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ? quote_string (temp1) |
| : quote_escapes (temp1); |
| else |
| temp = (char *)NULL; |
| |
| break; |
| |
| /* $$ -- pid of the invoking shell. */ |
| case '$': |
| temp = itos (dollar_dollar_pid); |
| break; |
| |
| /* $# -- number of positional parameters. */ |
| case '#': |
| temp = itos (number_of_args ()); |
| break; |
| |
| /* $? -- return value of the last synchronous command. */ |
| case '?': |
| temp = itos (last_command_exit_value); |
| break; |
| |
| /* $- -- flags supplied to the shell on invocation or by `set'. */ |
| case '-': |
| temp = which_set_flags (); |
| break; |
| |
| /* $! -- Pid of the last asynchronous command. */ |
| case '!': |
| /* If no asynchronous pids have been created, expand to nothing. |
| If `set -u' has been executed, and no async processes have |
| been created, this is an expansion error. */ |
| if (last_asynchronous_pid == NO_PID) |
| { |
| if (expanded_something) |
| *expanded_something = 0; |
| temp = (char *)NULL; |
| if (unbound_vars_is_error && (pflags & PF_IGNUNBOUND) == 0) |
| { |
| uerror[0] = '$'; |
| uerror[1] = c; |
| uerror[2] = '\0'; |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (uerror); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| } |
| else |
| temp = itos (last_asynchronous_pid); |
| break; |
| |
| /* The only difference between this and $@ is when the arg is quoted. */ |
| case '*': /* `$*' */ |
| list = list_rest_of_args (); |
| |
| #if 0 |
| /* According to austin-group posix proposal by Geoff Clare in |
| <20090505091501.GA10097@squonk.masqnet> of 5 May 2009: |
| |
| "The shell shall write a message to standard error and |
| immediately exit when it tries to expand an unset parameter |
| other than the '@' and '*' special parameters." |
| */ |
| |
| if (list == 0 && unbound_vars_is_error && (pflags & PF_IGNUNBOUND) == 0) |
| { |
| uerror[0] = '$'; |
| uerror[1] = '*'; |
| uerror[2] = '\0'; |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (uerror); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| #endif |
| |
| /* If there are no command-line arguments, this should just |
| disappear if there are other characters in the expansion, |
| even if it's quoted. */ |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && list == 0) |
| temp = (char *)NULL; |
| else if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES|Q_PATQUOTE)) |
| { |
| /* If we have "$*" we want to make a string of the positional |
| parameters, separated by the first character of $IFS, and |
| quote the whole string, including the separators. If IFS |
| is unset, the parameters are separated by ' '; if $IFS is |
| null, the parameters are concatenated. */ |
| temp = (quoted & (Q_DOUBLE_QUOTES|Q_PATQUOTE)) ? string_list_dollar_star (list, quoted, 0) : string_list (list); |
| if (temp) |
| { |
| temp1 = (quoted & Q_DOUBLE_QUOTES) ? quote_string (temp) : temp; |
| if (*temp == 0) |
| tflag |= W_HASQUOTEDNULL; |
| if (temp != temp1) |
| free (temp); |
| temp = temp1; |
| } |
| } |
| else |
| { |
| /* We check whether or not we're eventually going to split $* here, |
| for example when IFS is empty and we are processing the rhs of |
| an assignment statement. In that case, we don't separate the |
| arguments at all. Otherwise, if the $* is not quoted it is |
| identical to $@ */ |
| if (expand_no_split_dollar_star && quoted == 0 && ifs_is_set == 0 && (pflags & PF_ASSIGNRHS)) |
| { |
| /* Posix interp 888: RHS of assignment, IFS unset: no splitting, |
| separate with space */ |
| temp1 = string_list_dollar_star (list, quoted, pflags); |
| temp = temp1 ? quote_string (temp1) : temp1; |
| /* XXX - tentative - note that we saw a quoted null here */ |
| if (temp1 && *temp1 == 0 && QUOTED_NULL (temp)) |
| tflag |= W_SAWQUOTEDNULL; |
| FREE (temp1); |
| } |
| else if (expand_no_split_dollar_star && quoted == 0 && ifs_is_null && (pflags & PF_ASSIGNRHS)) |
| { |
| /* Posix interp 888: RHS of assignment, IFS set to '' */ |
| temp1 = string_list_dollar_star (list, quoted, pflags); |
| temp = temp1 ? quote_escapes (temp1) : temp1; |
| FREE (temp1); |
| } |
| else if (expand_no_split_dollar_star && quoted == 0 && ifs_is_set && ifs_is_null == 0 && (pflags & PF_ASSIGNRHS)) |
| { |
| /* Posix interp 888: RHS of assignment, IFS set to non-null value */ |
| temp1 = string_list_dollar_star (list, quoted, pflags); |
| temp = temp1 ? quote_string (temp1) : temp1; |
| |
| /* XXX - tentative - note that we saw a quoted null here */ |
| if (temp1 && *temp1 == 0 && QUOTED_NULL (temp)) |
| tflag |= W_SAWQUOTEDNULL; |
| FREE (temp1); |
| } |
| /* XXX - should we check ifs_is_set here as well? */ |
| # if defined (HANDLE_MULTIBYTE) |
| else if (expand_no_split_dollar_star && ifs_firstc[0] == 0) |
| # else |
| else if (expand_no_split_dollar_star && ifs_firstc == 0) |
| # endif |
| /* Posix interp 888: not RHS, no splitting, IFS set to '' */ |
| temp = string_list_dollar_star (list, quoted, 0); |
| else |
| { |
| temp = string_list_dollar_at (list, quoted, 0); |
| /* Set W_SPLITSPACE to make sure the individual positional |
| parameters are split into separate arguments */ |
| #if 0 |
| if (quoted == 0 && (ifs_is_set == 0 || ifs_is_null)) |
| #else /* change with bash-5.0 */ |
| if (quoted == 0 && ifs_is_null) |
| #endif |
| tflag |= W_SPLITSPACE; |
| /* If we're not quoted but we still don't want word splitting, make |
| we quote the IFS characters to protect them from splitting (e.g., |
| when $@ is in the string as well). */ |
| else if (temp && quoted == 0 && ifs_is_set && (pflags & PF_ASSIGNRHS)) |
| { |
| temp1 = quote_string (temp); |
| free (temp); |
| temp = temp1; |
| } |
| } |
| |
| if (expand_no_split_dollar_star == 0 && contains_dollar_at) |
| *contains_dollar_at = 1; |
| } |
| |
| dispose_words (list); |
| break; |
| |
| /* When we have "$@" what we want is "$1" "$2" "$3" ... This |
| means that we have to turn quoting off after we split into |
| the individually quoted arguments so that the final split |
| on the first character of $IFS is still done. */ |
| case '@': /* `$@' */ |
| list = list_rest_of_args (); |
| |
| #if 0 |
| /* According to austin-group posix proposal by Geoff Clare in |
| <20090505091501.GA10097@squonk.masqnet> of 5 May 2009: |
| |
| "The shell shall write a message to standard error and |
| immediately exit when it tries to expand an unset parameter |
| other than the '@' and '*' special parameters." |
| */ |
| |
| if (list == 0 && unbound_vars_is_error && (pflags & PF_IGNUNBOUND) == 0) |
| { |
| uerror[0] = '$'; |
| uerror[1] = '@'; |
| uerror[2] = '\0'; |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (uerror); |
| return (interactive_shell ? &expand_wdesc_error : &expand_wdesc_fatal); |
| } |
| #endif |
| |
| for (nullarg = 0, l = list; l; l = l->next) |
| { |
| if (l->word && (l->word->word == 0 || l->word->word[0] == 0)) |
| nullarg = 1; |
| } |
| |
| /* We want to flag the fact that we saw this. We can't turn |
| off quoting entirely, because other characters in the |
| string might need it (consider "\"$@\""), but we need some |
| way to signal that the final split on the first character |
| of $IFS should be done, even though QUOTED is 1. */ |
| /* XXX - should this test include Q_PATQUOTE? */ |
| if (quoted_dollar_at_p && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| *quoted_dollar_at_p = 1; |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| |
| /* We want to separate the positional parameters with the first |
| character of $IFS in case $IFS is something other than a space. |
| We also want to make sure that splitting is done no matter what -- |
| according to POSIX.2, this expands to a list of the positional |
| parameters no matter what IFS is set to. */ |
| /* XXX - what to do when in a context where word splitting is not |
| performed? Even when IFS is not the default, posix seems to imply |
| that we have to expand $@ to all the positional parameters and |
| separate them with spaces, which are preserved because word splitting |
| doesn't take place. See below for how we use PF_NOSPLIT2 here. */ |
| |
| /* These are the cases where word splitting will not be performed. */ |
| if (pflags & PF_ASSIGNRHS) |
| { |
| temp = string_list_dollar_at (list, (quoted|Q_DOUBLE_QUOTES), pflags); |
| if (nullarg) |
| tflag |= W_HASQUOTEDNULL; /* we know quoting produces quoted nulls */ |
| } |
| |
| /* This needs to match what expand_word_internal does with non-quoted $@ |
| does with separating with spaces. Passing Q_DOUBLE_QUOTES means that |
| the characters in LIST will be quoted, and PF_ASSIGNRHS ensures that |
| they will separated by spaces. After doing this, we need the special |
| handling for PF_NOSPLIT2 in expand_word_internal to remove the CTLESC |
| quotes. */ |
| else if (pflags & PF_NOSPLIT2) |
| { |
| #if defined (HANDLE_MULTIBYTE) |
| if (quoted == 0 && ifs_is_set && ifs_is_null == 0 && ifs_firstc[0] != ' ') |
| #else |
| if (quoted == 0 && ifs_is_set && ifs_is_null == 0 && ifs_firstc != ' ') |
| #endif |
| /* Posix interp 888 */ |
| temp = string_list_dollar_at (list, Q_DOUBLE_QUOTES, pflags); |
| else |
| temp = string_list_dollar_at (list, quoted, pflags); |
| } |
| else |
| temp = string_list_dollar_at (list, quoted, pflags); |
| |
| tflag |= W_DOLLARAT; |
| dispose_words (list); |
| break; |
| |
| case LBRACE: |
| tdesc = parameter_brace_expand (string, &zindex, quoted, pflags, |
| quoted_dollar_at_p, |
| contains_dollar_at); |
| |
| if (tdesc == &expand_wdesc_error || tdesc == &expand_wdesc_fatal) |
| return (tdesc); |
| temp = tdesc ? tdesc->word : (char *)0; |
| |
| /* XXX */ |
| /* Quoted nulls should be removed if there is anything else |
| in the string. */ |
| /* Note that we saw the quoted null so we can add one back at |
| the end of this function if there are no other characters |
| in the string, discard TEMP, and go on. The exception to |
| this is when we have "${@}" and $1 is '', since $@ needs |
| special handling. */ |
| if (tdesc && tdesc->word && (tdesc->flags & W_HASQUOTEDNULL) && QUOTED_NULL (temp)) |
| { |
| if (had_quoted_null_p) |
| *had_quoted_null_p = 1; |
| if (*quoted_dollar_at_p == 0) |
| { |
| free (temp); |
| tdesc->word = temp = (char *)NULL; |
| } |
| |
| } |
| |
| ret = tdesc; |
| goto return0; |
| |
| /* Do command or arithmetic substitution. */ |
| case LPAREN: |
| /* We have to extract the contents of this paren substitution. */ |
| t_index = zindex + 1; |
| /* XXX - might want to check for string[t_index+2] == LPAREN and parse |
| as arithmetic substitution immediately. */ |
| temp = extract_command_subst (string, &t_index, (pflags&PF_COMPLETE) ? SX_COMPLETE : 0); |
| zindex = t_index; |
| |
| /* For Posix.2-style `$(( ))' arithmetic substitution, |
| extract the expression and pass it to the evaluator. */ |
| if (temp && *temp == LPAREN) |
| { |
| char *temp2; |
| temp1 = temp + 1; |
| temp2 = savestring (temp1); |
| t_index = strlen (temp2) - 1; |
| |
| if (temp2[t_index] != RPAREN) |
| { |
| free (temp2); |
| goto comsub; |
| } |
| |
| /* Cut off ending `)' */ |
| temp2[t_index] = '\0'; |
| |
| if (chk_arithsub (temp2, t_index) == 0) |
| { |
| free (temp2); |
| #if 0 |
| internal_warning (_("future versions of the shell will force evaluation as an arithmetic substitution")); |
| #endif |
| goto comsub; |
| } |
| |
| /* Expand variables found inside the expression. */ |
| temp1 = expand_arith_string (temp2, Q_DOUBLE_QUOTES|Q_ARITH); |
| free (temp2); |
| |
| arithsub: |
| /* No error messages. */ |
| savecmd = this_command_name; |
| this_command_name = (char *)NULL; |
| number = evalexp (temp1, EXP_EXPANDED, &expok); |
| this_command_name = savecmd; |
| free (temp); |
| free (temp1); |
| if (expok == 0) |
| { |
| if (interactive_shell == 0 && posixly_correct) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| return (&expand_wdesc_fatal); |
| } |
| else |
| return (&expand_wdesc_error); |
| } |
| temp = itos (number); |
| break; |
| } |
| |
| comsub: |
| if (pflags & PF_NOCOMSUB) |
| /* we need zindex+1 because string[zindex] == RPAREN */ |
| temp1 = substring (string, *sindex, zindex+1); |
| else |
| { |
| tdesc = command_substitute (temp, quoted, pflags&PF_ASSIGNRHS); |
| temp1 = tdesc ? tdesc->word : (char *)NULL; |
| if (tdesc) |
| dispose_word_desc (tdesc); |
| } |
| FREE (temp); |
| temp = temp1; |
| break; |
| |
| /* Do POSIX.2d9-style arithmetic substitution. This will probably go |
| away in a future bash release. */ |
| case '[': /*]*/ |
| /* Extract the contents of this arithmetic substitution. */ |
| t_index = zindex + 1; |
| temp = extract_arithmetic_subst (string, &t_index); |
| zindex = t_index; |
| if (temp == 0) |
| { |
| temp = savestring (string); |
| if (expanded_something) |
| *expanded_something = 0; |
| goto return0; |
| } |
| |
| /* Do initial variable expansion. */ |
| temp1 = expand_arith_string (temp, Q_DOUBLE_QUOTES|Q_ARITH); |
| |
| goto arithsub; |
| |
| default: |
| /* Find the variable in VARIABLE_LIST. */ |
| temp = (char *)NULL; |
| |
| for (t_index = zindex; (c = string[zindex]) && legal_variable_char (c); zindex++) |
| ; |
| temp1 = (zindex > t_index) ? substring (string, t_index, zindex) : (char *)NULL; |
| |
| /* If this isn't a variable name, then just output the `$'. */ |
| if (temp1 == 0 || *temp1 == '\0') |
| { |
| FREE (temp1); |
| temp = (char *)xmalloc (2); |
| temp[0] = '$'; |
| temp[1] = '\0'; |
| if (expanded_something) |
| *expanded_something = 0; |
| goto return0; |
| } |
| |
| /* If the variable exists, return its value cell. */ |
| var = find_variable (temp1); |
| |
| if (var && invisible_p (var) == 0 && var_isset (var)) |
| { |
| #if defined (ARRAY_VARS) |
| if (assoc_p (var) || array_p (var)) |
| { |
| temp = array_p (var) ? array_reference (array_cell (var), 0) |
| : assoc_reference (assoc_cell (var), "0"); |
| if (temp) |
| temp = (*temp && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ? quote_string (temp) |
| : quote_escapes (temp); |
| else if (unbound_vars_is_error) |
| goto unbound_variable; |
| } |
| else |
| #endif |
| { |
| temp = value_cell (var); |
| |
| temp = (*temp && (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES))) |
| ? quote_string (temp) |
| : ((pflags & PF_ASSIGNRHS) ? quote_rhs (temp) |
| : quote_escapes (temp)); |
| } |
| |
| free (temp1); |
| |
| goto return0; |
| } |
| else if (var && (invisible_p (var) || var_isset (var) == 0)) |
| temp = (char *)NULL; |
| else if ((var = find_variable_last_nameref (temp1, 0)) && var_isset (var) && invisible_p (var) == 0) |
| { |
| temp = nameref_cell (var); |
| #if defined (ARRAY_VARS) |
| if (temp && *temp && valid_array_reference (temp, 0)) |
| { |
| tdesc = parameter_brace_expand_word (temp, SPECIAL_VAR (temp, 0), quoted, pflags, (arrayind_t *)NULL); |
| if (tdesc == &expand_wdesc_error || tdesc == &expand_wdesc_fatal) |
| return (tdesc); |
| ret = tdesc; |
| goto return0; |
| } |
| else |
| #endif |
| /* y=2 ; typeset -n x=y; echo $x is not the same as echo $2 in ksh */ |
| if (temp && *temp && legal_identifier (temp) == 0) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| report_error (_("%s: invalid variable name for name reference"), temp); |
| return (&expand_wdesc_error); /* XXX */ |
| } |
| else |
| temp = (char *)NULL; |
| } |
| |
| temp = (char *)NULL; |
| |
| unbound_variable: |
| if (unbound_vars_is_error) |
| { |
| set_exit_status (EXECUTION_FAILURE); |
| err_unboundvar (temp1); |
| } |
| else |
| { |
| free (temp1); |
| goto return0; |
| } |
| |
| free (temp1); |
| set_exit_status (EXECUTION_FAILURE); |
| return ((unbound_vars_is_error && interactive_shell == 0) |
| ? &expand_wdesc_fatal |
| : &expand_wdesc_error); |
| } |
| |
| if (string[zindex]) |
| zindex++; |
| |
| return0: |
| *sindex = zindex; |
| |
| if (ret == 0) |
| { |
| ret = alloc_word_desc (); |
| ret->flags = tflag; /* XXX */ |
| ret->word = temp; |
| } |
| return ret; |
| } |
| |
| void |
| invalidate_cached_quoted_dollar_at () |
| { |
| dispose_words (cached_quoted_dollar_at); |
| cached_quoted_dollar_at = 0; |
| } |
| |
| /* Make a word list which is the result of parameter and variable |
| expansion, command substitution, arithmetic substitution, and |
| quote removal of WORD. Return a pointer to a WORD_LIST which is |
| the result of the expansion. If WORD contains a null word, the |
| word list returned is also null. |
| |
| QUOTED contains flag values defined in shell.h. |
| |
| ISEXP is used to tell expand_word_internal that the word should be |
| treated as the result of an expansion. This has implications for |
| how IFS characters in the word are treated. |
| |
| CONTAINS_DOLLAR_AT and EXPANDED_SOMETHING are return values; when non-null |
| they point to an integer value which receives information about expansion. |
| CONTAINS_DOLLAR_AT gets non-zero if WORD contained "$@", else zero. |
| EXPANDED_SOMETHING get non-zero if WORD contained any parameter expansions, |
| else zero. |
| |
| This only does word splitting in the case of $@ expansion. In that |
| case, we split on ' '. */ |
| |
| /* Values for the local variable quoted_state. */ |
| #define UNQUOTED 0 |
| #define PARTIALLY_QUOTED 1 |
| #define WHOLLY_QUOTED 2 |
| |
| static WORD_LIST * |
| expand_word_internal (word, quoted, isexp, contains_dollar_at, expanded_something) |
| WORD_DESC *word; |
| int quoted, isexp; |
| int *contains_dollar_at; |
| int *expanded_something; |
| { |
| WORD_LIST *list; |
| WORD_DESC *tword; |
| |
| /* The intermediate string that we build while expanding. */ |
| char *istring; |
| |
| /* The current size of the above object. */ |
| size_t istring_size; |
| |
| /* Index into ISTRING. */ |
| int istring_index; |
| |
| /* Temporary string storage. */ |
| char *temp, *temp1; |
| |
| /* The text of WORD. */ |
| register char *string; |
| |
| /* The size of STRING. */ |
| size_t string_size; |
| |
| /* The index into STRING. */ |
| int sindex; |
| |
| /* This gets 1 if we see a $@ while quoted. */ |
| int quoted_dollar_at; |
| |
| /* One of UNQUOTED, PARTIALLY_QUOTED, or WHOLLY_QUOTED, depending on |
| whether WORD contains no quoting characters, a partially quoted |
| string (e.g., "xx"ab), or is fully quoted (e.g., "xxab"). */ |
| int quoted_state; |
| |
| /* State flags */ |
| int had_quoted_null; |
| int has_quoted_ifs; /* did we add a quoted $IFS character here? */ |
| int has_dollar_at, temp_has_dollar_at; |
| int split_on_spaces; |
| int local_expanded; |
| int tflag; |
| int pflags; /* flags passed to param_expand */ |
| int mb_cur_max; |
| |
| int assignoff; /* If assignment, offset of `=' */ |
| |
| register unsigned char c; /* Current character. */ |
| int t_index; /* For calls to string_extract_xxx. */ |
| |
| char twochars[2]; |
| |
| DECLARE_MBSTATE; |
| |
| /* OK, let's see if we can optimize a common idiom: "$@" */ |
| if (STREQ (word->word, "\"$@\"") && |
| (word->flags == (W_HASDOLLAR|W_QUOTED)) && |
| dollar_vars[1]) /* XXX - check IFS here as well? */ |
| { |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| if (expanded_something) |
| *expanded_something = 1; |
| if (cached_quoted_dollar_at) |
| return (copy_word_list (cached_quoted_dollar_at)); |
| list = list_rest_of_args (); |
| list = quote_list (list); |
| cached_quoted_dollar_at = copy_word_list (list); |
| return (list); |
| } |
| |
| istring = (char *)xmalloc (istring_size = DEFAULT_INITIAL_ARRAY_SIZE); |
| istring[istring_index = 0] = '\0'; |
| quoted_dollar_at = had_quoted_null = has_dollar_at = 0; |
| has_quoted_ifs = 0; |
| split_on_spaces = 0; |
| quoted_state = UNQUOTED; |
| |
| string = word->word; |
| if (string == 0) |
| goto finished_with_string; |
| mb_cur_max = MB_CUR_MAX; |
| |
| /* Don't need the string length for the SADD... and COPY_ macros unless |
| multibyte characters are possible, but do need it for bounds checking. */ |
| string_size = (mb_cur_max > 1) ? strlen (string) : 1; |
| |
| if (contains_dollar_at) |
| *contains_dollar_at = 0; |
| |
| assignoff = -1; |
| |
| /* Begin the expansion. */ |
| |
| for (sindex = 0; ;) |
| { |
| c = string[sindex]; |
| |
| /* Case on top-level character. */ |
| switch (c) |
| { |
| case '\0': |
| goto finished_with_string; |
| |
| case CTLESC: |
| sindex++; |
| #if HANDLE_MULTIBYTE |
| if (mb_cur_max > 1 && string[sindex]) |
| { |
| SADD_MBQCHAR_BODY(temp, string, sindex, string_size); |
| } |
| else |
| #endif |
| { |
| temp = (char *)xmalloc (3); |
| temp[0] = CTLESC; |
| temp[1] = c = string[sindex]; |
| temp[2] = '\0'; |
| } |
| |
| dollar_add_string: |
| if (string[sindex]) |
| sindex++; |
| |
| add_string: |
| if (temp) |
| { |
| istring = sub_append_string (temp, istring, &istring_index, &istring_size); |
| temp = (char *)0; |
| } |
| |
| break; |
| |
| #if defined (PROCESS_SUBSTITUTION) |
| /* Process substitution. */ |
| case '<': |
| case '>': |
| { |
| /* XXX - technically this should only be expanded at the start |
| of a word */ |
| if (string[++sindex] != LPAREN || (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) || (word->flags & (W_DQUOTE|W_NOPROCSUB))) |
| { |
| sindex--; /* add_character: label increments sindex */ |
| goto add_character; |
| } |
| else |
| t_index = sindex + 1; /* skip past both '<' and LPAREN */ |
| |
| temp1 = extract_process_subst (string, (c == '<') ? "<(" : ">(", &t_index, 0); /*))*/ |
| sindex = t_index; |
| |
| /* If the process substitution specification is `<()', we want to |
| open the pipe for writing in the child and produce output; if |
| it is `>()', we want to open the pipe for reading in the child |
| and consume input. */ |
| temp = temp1 ? process_substitute (temp1, (c == '>')) : (char *)0; |
| |
| FREE (temp1); |
| |
| goto dollar_add_string; |
| } |
| #endif /* PROCESS_SUBSTITUTION */ |
| |
| case '=': |
| /* Posix.2 section 3.6.1 says that tildes following `=' in words |
| which are not assignment statements are not expanded. If the |
| shell isn't in posix mode, though, we perform tilde expansion |
| on `likely candidate' unquoted assignment statements (flags |
| include W_ASSIGNMENT but not W_QUOTED). A likely candidate |
| contains an unquoted :~ or =~. Something to think about: we |
| now have a flag that says to perform tilde expansion on arguments |
| to `assignment builtins' like declare and export that look like |
| assignment statements. We now do tilde expansion on such words |
| even in POSIX mode. */ |
| if (word->flags & (W_ASSIGNRHS|W_NOTILDE)) |
| { |
| if (isexp == 0 && (word->flags & (W_NOSPLIT|W_NOSPLIT2)) == 0 && isifs (c)) |
| goto add_ifs_character; |
| else |
| goto add_character; |
| } |
| /* If we're not in posix mode or forcing assignment-statement tilde |
| expansion, note where the first `=' appears in the word and prepare |
| to do tilde expansion following the first `='. We have to keep |
| track of the first `=' (using assignoff) to avoid being confused |
| by an `=' in the rhs of the assignment statement. */ |
| if ((word->flags & W_ASSIGNMENT) && |
| (posixly_correct == 0 || (word->flags & W_TILDEEXP)) && |
| assignoff == -1 && sindex > 0) |
| assignoff = sindex; |
| if (sindex == assignoff && string[sindex+1] == '~') /* XXX */ |
| word->flags |= W_ITILDE; |
| |
| if (word->flags & W_ASSIGNARG) |
| word->flags |= W_ASSIGNRHS; /* affects $@ */ |
| |
| if (isexp == 0 && (word->flags & (W_NOSPLIT|W_NOSPLIT2)) == 0 && isifs (c)) |
| { |
| has_quoted_ifs++; |
| goto add_ifs_character; |
| } |
| else |
| goto add_character; |
| |
| case ':': |
| if (word->flags & (W_NOTILDE|W_NOASSNTILDE)) |
| { |
| if (isexp == 0 && (word->flags & (W_NOSPLIT|W_NOSPLIT2)) == 0 && isifs (c)) |
| goto add_ifs_character; |
| else |
| goto add_character; |
| } |
| |
| if ((word->flags & (W_ASSIGNMENT|W_ASSIGNRHS)) && |
| (posixly_correct == 0 || (word->flags & W_TILDEEXP)) && |
| string[sindex+1] == '~') |
| word->flags |= W_ITILDE; |
| |
| if (isexp == 0 && (word->flags & (W_NOSPLIT|W_NOSPLIT2)) == 0 && isifs (c)) |
| goto add_ifs_character; |
| else |
| goto add_character; |
| |
| case '~': |
| /* If the word isn't supposed to be tilde expanded, or we're not |
| at the start of a word or after an unquoted : or = in an |
| assignment statement, we don't do tilde expansion. We don't |
| do tilde expansion if quoted or in an arithmetic context. */ |
| |
| if ((word->flags & (W_NOTILDE|W_DQUOTE)) || |
| (sindex > 0 && ((word->flags & W_ITILDE) == 0)) || |
| (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT))) |
| { |
| word->flags &= ~W_ITILDE; |
| if (isexp == 0 && (word->flags & (W_NOSPLIT|W_NOSPLIT2)) == 0 && isifs (c) && (quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) == 0) |
| goto add_ifs_character; |
| else |
| goto add_character; |
| } |
| |
| if (word->flags & W_ASSIGNRHS) |
| tflag = 2; |
| else if (word->flags & (W_ASSIGNMENT|W_TILDEEXP)) |
| tflag = 1; |
| else |
| tflag = 0; |
| |
| temp = bash_tilde_find_word (string + sindex, tflag, &t_index); |
| |
| word->flags &= ~W_ITILDE; |
| |
| if (temp && *temp && t_index > 0) |
| { |
| temp1 = bash_tilde_expand (temp, tflag); |
| if (temp1 && *temp1 == '~' && STREQ (temp, temp1)) |
| { |
| FREE (temp); |
| FREE (temp1); |
| goto add_character; /* tilde expansion failed */ |
| } |
| free (temp); |
| temp = temp1; |
| sindex += t_index; |
| goto add_quoted_string; /* XXX was add_string */ |
| } |
| else |
| { |
| FREE (temp); |
| goto add_character; |
| } |
| |
| case '$': |
| if (expanded_something) |
| *expanded_something = 1; |
| local_expanded = 1; |
| |
| temp_has_dollar_at = 0; |
| pflags = (word->flags & W_NOCOMSUB) ? PF_NOCOMSUB : 0; |
| if (word->flags & W_NOSPLIT2) |
| pflags |= PF_NOSPLIT2; |
| if (word->flags & W_ASSIGNRHS) |
| pflags |= PF_ASSIGNRHS; |
| if (word->flags & W_COMPLETE) |
| pflags |= PF_COMPLETE; |
| |
| tword = param_expand (string, &sindex, quoted, expanded_something, |
| &temp_has_dollar_at, "ed_dollar_at, |
| &had_quoted_null, pflags); |
| has_dollar_at += temp_has_dollar_at; |
| split_on_spaces += (tword->flags & W_SPLITSPACE); |
| |
| if (tword == &expand_wdesc_error || tword == &expand_wdesc_fatal) |
| { |
| free (string); |
| free (istring); |
| return ((tword == &expand_wdesc_error) ? &expand_word_error |
| : &expand_word_fatal); |
| } |
| if (contains_dollar_at && has_dollar_at) |
| *contains_dollar_at = 1; |
| |
| if (tword && (tword->flags & W_HASQUOTEDNULL)) |
| had_quoted_null = 1; /* note for later */ |
| if (tword && (tword->flags & W_SAWQUOTEDNULL)) |
| had_quoted_null = 1; /* XXX */ |
| |
| temp = tword ? tword->word : (char *)NULL; |
| dispose_word_desc (tword); |
| |
| /* Kill quoted nulls; we will add them back at the end of |
| expand_word_internal if nothing else in the string */ |
| if (had_quoted_null && temp && QUOTED_NULL (temp)) |
| { |
| FREE (temp); |
| temp = (char *)NULL; |
| } |
| |
| goto add_string; |
| break; |
| |
| case '`': /* Backquoted command substitution. */ |
| { |
| t_index = sindex++; |
| |
| temp = string_extract (string, &sindex, "`", SX_REQMATCH); |
| /* The test of sindex against t_index is to allow bare instances of |
| ` to pass through, for backwards compatibility. */ |
| if (temp == &extract_string_error || temp == &extract_string_fatal) |
| { |
| if (sindex - 1 == t_index) |
| { |
| sindex = t_index; |
| goto add_character; |
| } |
| set_exit_status (EXECUTION_FAILURE); |
| report_error (_("bad substitution: no closing \"`\" in %s") , string+t_index); |
| free (string); |
| free (istring); |
| return ((temp == &extract_string_error) ? &expand_word_error |
| : &expand_word_fatal); |
| } |
| |
| if (expanded_something) |
| *expanded_something = 1; |
| local_expanded = 1; |
| |
| if (word->flags & W_NOCOMSUB) |
| /* sindex + 1 because string[sindex] == '`' */ |
| temp1 = substring (string, t_index, sindex + 1); |
| else |
| { |
| de_backslash (temp); |
| tword = command_substitute (temp, quoted, 0); |
| temp1 = tword ? tword->word : (char *)NULL; |
| if (tword) |
| dispose_word_desc (tword); |
| } |
| FREE (temp); |
| temp = temp1; |
| goto dollar_add_string; |
| } |
| |
| case '\\': |
| if (string[sindex + 1] == '\n') |
| { |
| sindex += 2; |
| continue; |
| } |
| |
| c = string[++sindex]; |
| |
| /* "However, the double-quote character ( '"' ) shall not be treated |
| specially within a here-document, except when the double-quote |
| appears within "$()", "``", or "${}"." */ |
| if ((quoted & Q_HERE_DOCUMENT) && (quoted & Q_DOLBRACE) && c == '"') |
| tflag = CBSDQUOTE; /* special case */ |
| else if (quoted & Q_HERE_DOCUMENT) |
| tflag = CBSHDOC; |
| else if (quoted & Q_DOUBLE_QUOTES) |
| tflag = CBSDQUOTE; |
| else |
| tflag = 0; |
| |
| /* From Posix discussion on austin-group list: Backslash escaping |
| a } in ${...} is removed. Issue 0000221 */ |
| if ((quoted & Q_DOLBRACE) && c == RBRACE) |
| { |
| SCOPY_CHAR_I (twochars, CTLESC, c, string, sindex, string_size); |
| } |
| /* This is the fix for " $@\ " */ |
| else if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && ((sh_syntaxtab[c] & tflag) == 0) && isexp == 0 && isifs (c)) |
| { |
| RESIZE_MALLOCED_BUFFER (istring, istring_index, 2, istring_size, |
| DEFAULT_ARRAY_SIZE); |
| istring[istring_index++] = CTLESC; |
| istring[istring_index++] = '\\'; |
| istring[istring_index] = '\0'; |
| |
| SCOPY_CHAR_I (twochars, CTLESC, c, string, sindex, string_size); |
| } |
| else if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && c == 0) |
| { |
| RESIZE_MALLOCED_BUFFER (istring, istring_index, 2, istring_size, |
| DEFAULT_ARRAY_SIZE); |
| istring[istring_index++] = CTLESC; |
| istring[istring_index++] = '\\'; |
| istring[istring_index] = '\0'; |
| break; |
| } |
| else if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) && ((sh_syntaxtab[c] & tflag) == 0)) |
| { |
| SCOPY_CHAR_I (twochars, '\\', c, string, sindex, string_size); |
| } |
| else if (c == 0) |
| { |
| c = CTLNUL; |
| sindex--; /* add_character: label increments sindex */ |
| goto add_character; |
| } |
| else |
| { |
| SCOPY_CHAR_I (twochars, CTLESC, c, string, sindex, string_size); |
| } |
| |
| sindex++; |
| add_twochars: |
| /* BEFORE jumping here, we need to increment sindex if appropriate */ |
| RESIZE_MALLOCED_BUFFER (istring, istring_index, 2, istring_size, |
| DEFAULT_ARRAY_SIZE); |
| istring[istring_index++] = twochars[0]; |
| istring[istring_index++] = twochars[1]; |
| istring[istring_index] = '\0'; |
| |
| break; |
| |
| case '"': |
| if ((quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) && ((quoted & Q_ARITH) == 0)) |
| goto add_character; |
| |
| t_index = ++sindex; |
| temp = string_extract_double_quoted (string, &sindex, (word->flags & W_COMPLETE) ? SX_COMPLETE : 0); |
| |
| /* If the quotes surrounded the entire string, then the |
| whole word was quoted. */ |
| quoted_state = (t_index == 1 && string[sindex] == '\0') |
| ? WHOLLY_QUOTED |
| : PARTIALLY_QUOTED; |
| |
| if (temp && *temp) |
| { |
| tword = alloc_word_desc (); |
| tword->word = temp; |
| |
| if (word->flags & W_ASSIGNARG) |
| tword->flags |= word->flags & (W_ASSIGNARG|W_ASSIGNRHS); /* affects $@ */ |
| if (word->flags & W_COMPLETE) |
| tword->flags |= W_COMPLETE; /* for command substitutions */ |
| if (word->flags & W_NOCOMSUB) |
| tword->flags |= W_NOCOMSUB; |
| if (word->flags & W_NOPROCSUB) |
| tword->flags |= W_NOPROCSUB; |
| |
| if (word->flags & W_ASSIGNRHS) |
| tword->flags |= W_ASSIGNRHS; |
| |
| temp = (char *)NULL; |
| |
| temp_has_dollar_at = 0; /* does this quoted (sub)string include $@? */ |
| /* Need to get W_HASQUOTEDNULL flag through this function. */ |
| list = expand_word_internal (tword, Q_DOUBLE_QUOTES, 0, &temp_has_dollar_at, (int *)NULL); |
| has_dollar_at += temp_has_dollar_at; |
| |
| if (list == &expand_word_error || list == &expand_word_fatal) |
| { |
| free (istring); |
| free (string); |
| /* expand_word_internal has already freed temp_word->word |
| for us because of the way it prints error messages. */ |
| tword->word = (char *)NULL; |
| dispose_word (tword); |
| return list; |
| } |
| |
| dispose_word (tword); |
| |
| /* "$@" (a double-quoted dollar-at) expands into nothing, |
| not even a NULL word, when there are no positional |
| parameters. Posix interp 888 says that other parts of the |
| word that expand to quoted nulls result in quoted nulls, so |
| we can't just throw the entire word away if we have "$@" |
| anywhere in it. We use had_quoted_null to keep track */ |
| if (list == 0 && temp_has_dollar_at) /* XXX - was has_dollar_at */ |
| { |
| quoted_dollar_at++; |
| break; |
| } |
| |
| /* If this list comes back with a quoted null from expansion, |
| we have either "$x" or "$@" with $1 == ''. In either case, |
| we need to make sure we add a quoted null argument and |
| disable the special handling that "$@" gets. */ |
| if (list && list->word && list->next == 0 && (list->word->flags & W_HASQUOTEDNULL)) |
| { |
| if (had_quoted_null && temp_has_dollar_at) |
| quoted_dollar_at++; |
| had_quoted_null = 1; /* XXX */ |
| } |
| |
| /* If we get "$@", we know we have expanded something, so we |
| need to remember it for the final split on $IFS. This is |
| a special case; it's the only case where a quoted string |
| can expand into more than one word. It's going to come back |
| from the above call to expand_word_internal as a list with |
| multiple words. */ |
| if (list) |
| dequote_list (list); |
| |
| if (temp_has_dollar_at) /* XXX - was has_dollar_at */ |
| { |
| quoted_dollar_at++; |
| if (contains_dollar_at) |
| *contains_dollar_at = 1; |
| if (expanded_something) |
| *expanded_something = 1; |
| local_expanded = 1; |
| } |
| } |
| else |
| { |
| /* What we have is "". This is a minor optimization. */ |
| FREE (temp); |
| list = (WORD_LIST *)NULL; |
| had_quoted_null = 1; /* note for later */ |
| } |
| |
| /* The code above *might* return a list (consider the case of "$@", |
| where it returns "$1", "$2", etc.). We can't throw away the |
| rest of the list, and we have to make sure each word gets added |
| as quoted. We test on tresult->next: if it is non-NULL, we |
| quote the whole list, save it to a string with string_list, and |
| add that string. We don't need to quote the results of this |
| (and it would be wrong, since that would quote the separators |
| as well), so we go directly to add_string. */ |
| if (list) |
| { |
| if (list->next) |
| { |
| /* Testing quoted_dollar_at makes sure that "$@" is |
| split correctly when $IFS does not contain a space. */ |
| temp = quoted_dollar_at |
| ? string_list_dollar_at (list, Q_DOUBLE_QUOTES, 0) |
| : string_list (quote_list (list)); |
| dispose_words (list); |
| goto add_string; |
| } |
| else |
| { |
| temp = savestring (list->word->word); |
| tflag = list->word->flags; |
| dispose_words (list); |
| |
| /* If the string is not a quoted null string, we want |
| to remove any embedded unquoted CTLNUL characters. |
| We do not want to turn quoted null strings back into |
| the empty string, though. We do this because we |
| want to remove any quoted nulls from expansions that |
| contain other characters. For example, if we have |
| x"$*"y or "x$*y" and there are no positional parameters, |
| the $* should expand into nothing. */ |
| /* We use the W_HASQUOTEDNULL flag to differentiate the |
| cases: a quoted null character as above and when |
| CTLNUL is contained in the (non-null) expansion |
| of some variable. We use the had_quoted_null flag to |
| pass the value through this function to its caller. */ |
| if ((tflag & W_HASQUOTEDNULL) && QUOTED_NULL (temp) == 0) |
| remove_quoted_nulls (temp); /* XXX */ |
| } |
| } |
| else |
| temp = (char *)NULL; |
| |
| if (temp == 0 && quoted_state == PARTIALLY_QUOTED) |
| had_quoted_null = 1; /* note for later */ |
| |
| /* We do not want to add quoted nulls to strings that are only |
| partially quoted; we can throw them away. The exception to |
| this is when we are going to be performing word splitting, |
| since we have to preserve a null argument if the next character |
| will cause word splitting. */ |
| if (temp == 0 && quoted_state == PARTIALLY_QUOTED && quoted == 0 && (word->flags & (W_NOSPLIT|W_EXPANDRHS|W_ASSIGNRHS)) == W_EXPANDRHS) |
| { |
| c = CTLNUL; |
| sindex--; |
| had_quoted_null = 1; |
| goto add_character; |
| } |
| if (temp == 0 && quoted_state == PARTIALLY_QUOTED && (word->flags & (W_NOSPLIT|W_NOSPLIT2))) |
| continue; |
| |
| add_quoted_string: |
| |
| if (temp) |
| { |
| temp1 = temp; |
| temp = quote_string (temp); |
| free (temp1); |
| goto add_string; |
| } |
| else |
| { |
| /* Add NULL arg. */ |
| c = CTLNUL; |
| sindex--; /* add_character: label increments sindex */ |
| had_quoted_null = 1; /* note for later */ |
| goto add_character; |
| } |
| |
| /* break; */ |
| |
| case '\'': |
| if ((quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT))) |
| goto add_character; |
| |
| t_index = ++sindex; |
| temp = string_extract_single_quoted (string, &sindex); |
| |
| /* If the entire STRING was surrounded by single quotes, |
| then the string is wholly quoted. */ |
| quoted_state = (t_index == 1 && string[sindex] == '\0') |
| ? WHOLLY_QUOTED |
| : PARTIALLY_QUOTED; |
| |
| /* If all we had was '', it is a null expansion. */ |
| if (*temp == '\0') |
| { |
| free (temp); |
| temp = (char *)NULL; |
| } |
| else |
| remove_quoted_escapes (temp); /* ??? */ |
| |
| if (temp == 0 && quoted_state == PARTIALLY_QUOTED) |
| had_quoted_null = 1; /* note for later */ |
| |
| /* We do not want to add quoted nulls to strings that are only |
| partially quoted; such nulls are discarded. See above for the |
| exception, which is when the string is going to be split. |
| Posix interp 888/1129 */ |
| if (temp == 0 && quoted_state == PARTIALLY_QUOTED && quoted == 0 && (word->flags & (W_NOSPLIT|W_EXPANDRHS|W_ASSIGNRHS)) == W_EXPANDRHS) |
| { |
| c = CTLNUL; |
| sindex--; |
| goto add_character; |
| } |
| |
| if (temp == 0 && (quoted_state == PARTIALLY_QUOTED) && (word->flags & (W_NOSPLIT|W_NOSPLIT2))) |
| continue; |
| |
| /* If we have a quoted null expansion, add a quoted NULL to istring. */ |
| if (temp == 0) |
| { |
| c = CTLNUL; |
| sindex--; /* add_character: label increments sindex */ |
| goto add_character; |
| } |
| else |
| goto add_quoted_string; |
| |
| /* break; */ |
| |
| case ' ': |
| /* If we are in a context where the word is not going to be split, but |
| we need to account for $@ and $* producing one word for each |
| positional parameter, add quoted spaces so the spaces in the |
| expansion of "$@", if any, behave correctly. We still may need to |
| split if we are expanding the rhs of a word expansion. */ |
| if (ifs_is_null || split_on_spaces || ((word->flags & (W_NOSPLIT|W_NOSPLIT2|W_ASSIGNRHS)) && (word->flags & W_EXPANDRHS) == 0)) |
| { |
| if (string[sindex]) |
| sindex++; |
| twochars[0] = CTLESC; |
| twochars[1] = c; |
| goto add_twochars; |
| } |
| /* FALLTHROUGH */ |
| |
| default: |
| /* This is the fix for " $@ " */ |
| add_ifs_character: |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) || (isexp == 0 && isifs (c) && (word->flags & (W_NOSPLIT|W_NOSPLIT2)) == 0)) |
| { |
| if ((quoted&(Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) == 0) |
| has_quoted_ifs++; |
| add_quoted_character: |
| if (string[sindex]) /* from old goto dollar_add_string */ |
| sindex++; |
| if (c == 0) |
| { |
| c = CTLNUL; |
| goto add_character; |
| } |
| else |
| { |
| #if HANDLE_MULTIBYTE |
| /* XXX - should make sure that c is actually multibyte, |
| otherwise we can use the twochars branch */ |
| if (mb_cur_max > 1) |
| sindex--; |
| |
| if (mb_cur_max > 1) |
| { |
| SADD_MBQCHAR_BODY(temp, string, sindex, string_size); |
| } |
| else |
| #endif |
| { |
| twochars[0] = CTLESC; |
| twochars[1] = c; |
| goto add_twochars; |
| } |
| } |
| } |
| |
| SADD_MBCHAR (temp, string, sindex, string_size); |
| |
| add_character: |
| RESIZE_MALLOCED_BUFFER (istring, istring_index, 1, istring_size, |
| DEFAULT_ARRAY_SIZE); |
| istring[istring_index++] = c; |
| istring[istring_index] = '\0'; |
| |
| /* Next character. */ |
| sindex++; |
| } |
| } |
| |
| finished_with_string: |
| /* OK, we're ready to return. If we have a quoted string, and |
| quoted_dollar_at is not set, we do no splitting at all; otherwise |
| we split on ' '. The routines that call this will handle what to |
| do if nothing has been expanded. */ |
| |
| /* Partially and wholly quoted strings which expand to the empty |
| string are retained as an empty arguments. Unquoted strings |
| which expand to the empty string are discarded. The single |
| exception is the case of expanding "$@" when there are no |
| positional parameters. In that case, we discard the expansion. */ |
| |
| /* Because of how the code that handles "" and '' in partially |
| quoted strings works, we need to make ISTRING into a QUOTED_NULL |
| if we saw quoting characters, but the expansion was empty. |
| "" and '' are tossed away before we get to this point when |
| processing partially quoted strings. This makes "" and $xxx"" |
| equivalent when xxx is unset. We also look to see whether we |
| saw a quoted null from a ${} expansion and add one back if we |
| need to. */ |
| |
| /* If we expand to nothing and there were no single or double quotes |
| in the word, we throw it away. Otherwise, we return a NULL word. |
| The single exception is for $@ surrounded by double quotes when |
| there are no positional parameters. In that case, we also throw |
| the word away. */ |
| |
| if (*istring == '\0') |
| { |
| if (quoted_dollar_at == 0 && (had_quoted_null || quoted_state == PARTIALLY_QUOTED)) |
| { |
| istring[0] = CTLNUL; |
| istring[1] = '\0'; |
| tword = alloc_word_desc (); |
| tword->word = istring; |
| istring = 0; /* avoid later free() */ |
| tword->flags |= W_HASQUOTEDNULL; /* XXX */ |
| list = make_word_list (tword, (WORD_LIST *)NULL); |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| tword->flags |= W_QUOTED; |
| } |
| /* According to sh, ksh, and Posix.2, if a word expands into nothing |
| and a double-quoted "$@" appears anywhere in it, then the entire |
| word is removed. */ |
| /* XXX - exception appears to be that quoted null strings result in |
| null arguments */ |
| else if (quoted_state == UNQUOTED || quoted_dollar_at) |
| list = (WORD_LIST *)NULL; |
| else |
| list = (WORD_LIST *)NULL; |
| } |
| else if (word->flags & W_NOSPLIT) |
| { |
| tword = alloc_word_desc (); |
| tword->word = istring; |
| if (had_quoted_null && QUOTED_NULL (istring)) |
| tword->flags |= W_HASQUOTEDNULL; |
| istring = 0; /* avoid later free() */ |
| if (word->flags & W_ASSIGNMENT) |
| tword->flags |= W_ASSIGNMENT; /* XXX */ |
| if (word->flags & W_COMPASSIGN) |
| tword->flags |= W_COMPASSIGN; /* XXX */ |
| if (word->flags & W_NOGLOB) |
| tword->flags |= W_NOGLOB; /* XXX */ |
| if (word->flags & W_NOBRACE) |
| tword->flags |= W_NOBRACE; /* XXX */ |
| if (quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) |
| tword->flags |= W_QUOTED; |
| list = make_word_list (tword, (WORD_LIST *)NULL); |
| } |
| else if (word->flags & W_ASSIGNRHS) |
| { |
| list = list_string (istring, "", quoted); |
| tword = list->word; |
| if (had_quoted_null && QUOTED_NULL (istring)) |
| tword->flags |= W_HASQUOTEDNULL; |
| free (list); |
| free (istring); |
| istring = 0; /* avoid later free() */ |
| goto set_word_flags; |
| } |
| else |
| { |
| char *ifs_chars; |
| |
| ifs_chars = (quoted_dollar_at || has_dollar_at) ? ifs_value : (char *)NULL; |
| |
| /* If we have $@, we need to split the results no matter what. If |
| IFS is unset or NULL, string_list_dollar_at has separated the |
| positional parameters with a space, so we split on space (we have |
| set ifs_chars to " \t\n" above if ifs is unset). If IFS is set, |
| string_list_dollar_at has separated the positional parameters |
| with the first character of $IFS, so we split on $IFS. If |
| SPLIT_ON_SPACES is set, we expanded $* (unquoted) with IFS either |
| unset or null, and we want to make sure that we split on spaces |
| regardless of what else has happened to IFS since the expansion, |
| or we expanded "$@" with IFS null and we need to split the positional |
| parameters into separate words. */ |
| if (split_on_spaces) |
| { |
| /* If IFS is not set, and the word is not quoted, we want to split |
| the individual words on $' \t\n'. We rely on previous steps to |
| quote the portions of the word that should not be split */ |
| if (ifs_is_set == 0) |
| list = list_string (istring, " \t\n", 1); /* XXX quoted == 1? */ |
| else |
| list = list_string (istring, " ", 1); /* XXX quoted == 1? */ |
| } |
| |
| /* If we have $@ (has_dollar_at != 0) and we are in a context where we |
| don't want to split the result (W_NOSPLIT2), and we are not quoted, |
| we have already separated the arguments with the first character of |
| $IFS. In this case, we want to return a list with a single word |
| with the separator possibly replaced with a space (it's what other |
| shells seem to do). |
| quoted_dollar_at is internal to this function and is set if we are |
| passed an argument that is unquoted (quoted == 0) but we encounter a |
| double-quoted $@ while expanding it. */ |
| else if (has_dollar_at && quoted_dollar_at == 0 && ifs_chars && quoted == 0 && (word->flags & W_NOSPLIT2)) |
| { |
| tword = alloc_word_desc (); |
| /* Only split and rejoin if we have to */ |
| if (*ifs_chars && *ifs_chars != ' ') |
| { |
| /* list_string dequotes CTLESCs in the string it's passed, so we |
| need it to get the space separation right if space isn't the |
| first character in IFS (but is present) and to remove the |
| quoting we added back in param_expand(). */ |
| list = list_string (istring, *ifs_chars ? ifs_chars : " ", 1); |
| /* This isn't exactly right in the case where we're expanding |
| the RHS of an expansion like ${var-$@} where IFS=: (for |
| example). The W_NOSPLIT2 means we do the separation with :; |
| the list_string removes the quotes and breaks the string into |
| a list, and the string_list rejoins it on spaces. When we |
| return, we expect to be able to split the results, but the |
| space separation means the right split doesn't happen. */ |
| tword->word = string_list (list); |
| } |
| else |
| tword->word = istring; |
| if (had_quoted_null && QUOTED_NULL (istring)) |
| tword->flags |= W_HASQUOTEDNULL; /* XXX */ |
| if (tword->word != istring) |
| free (istring); |
| istring = 0; /* avoid later free() */ |
| goto set_word_flags; |
| } |
| else if (has_dollar_at && ifs_chars) |
| list = list_string (istring, *ifs_chars ? ifs_chars : " ", 1); |
| else |
| { |
| tword = alloc_word_desc (); |
| if (expanded_something && *expanded_something == 0 && has_quoted_ifs) |
| tword->word = remove_quoted_ifs (istring); |
| else |
| tword->word = istring; |
| if (had_quoted_null && QUOTED_NULL (istring)) /* should check for more than one */ |
| tword->flags |= W_HASQUOTEDNULL; /* XXX */ |
| else if (had_quoted_null) |
| tword->flags |= W_SAWQUOTEDNULL; /* XXX */ |
| if (tword->word != istring) |
| free (istring); |
| istring = 0; /* avoid later free() */ |
| set_word_flags: |
| if ((quoted & (Q_DOUBLE_QUOTES|Q_HERE_DOCUMENT)) || (quoted_state == WHOLLY_QUOTED)) |
| tword->flags |= W_QUOTED; |
| if (word->flags & W_ASSIGNMENT) |
| tword->flags |= W_ASSIGNMENT; |
| if (word->flags & W_COMPASSIGN) |
| tword->flags |= W_COMPASSIGN; |
| if (word->flags & W_NOGLOB) |
| tword->flags |= W_NOGLOB; |
| if (word->flags & W_NOBRACE) |
| tword->flags |= W_NOBRACE; |
| list = make_word_list (tword, (WORD_LIST *)NULL); |
| } |
| } |
| |
| free (istring); |
| return (list); |
| } |
| |
| /* **************************************************************** */ |
| /* */ |
| /* Functions for Quote Removal */ |
| /* */ |
| /* **************************************************************** */ |
| |
| /* Perform quote removal on STRING. If QUOTED > 0, assume we are obeying the |
| backslash quoting rules for within double quotes or a here document. */ |
| char * |
| string_quote_removal (string, quoted) |
| char *string; |
| int quoted; |
| { |
| size_t slen; |
| char *r, *result_string, *temp, *send; |
| int sindex, tindex, dquote; |
| unsigned char c; |
| DECLARE_MBSTATE; |
| |
| /* The result can be no longer than the original string. */ |
| slen = strlen (string); |
| send = string + slen; |
| |
| r = result_string = (char *)xmalloc (slen + 1); |
| |
| for (dquote = sindex = 0; c = string[sindex];) |
| { |
| switch (c) |
| { |
| case '\\': |
| c = string[++sindex]; |
| if (c == 0) |
| { |
| *r++ = '\\'; |
| break; |
| } |
| if (((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) || dquote) && (sh_syntaxtab[c] & CBSDQUOTE) == 0) |
| *r++ = '\\'; |
| /* FALLTHROUGH */ |
| |
| default: |
| SCOPY_CHAR_M (r, string, send, sindex); |
| break; |
| |
| case '\'': |
| if ((quoted & (Q_HERE_DOCUMENT|Q_DOUBLE_QUOTES)) || dquote) |
| { |
| *r++ = c; |
| sindex++; |
| break; |
| } |
| tindex = sindex + 1; |
| temp = string_extract_single_quoted (string, &tindex); |
| if (temp) |
| { |
| strcpy (r, temp); |
| r += strlen (r); |
| free (temp); |
| } |
| sindex = tindex; |
| break; |
| |
| case '"': |
| dquote = 1 - dquote; |
| sindex++; |
| break; |
| } |
| } |
| *r = '\0'; |
| return (result_string); |
| } |
| |
| #if 0 |
| /* UNUSED */ |
| /* Perform quote removal on word WORD. This allocates and returns a new |
| WORD_DESC *. */ |
| WORD_DESC * |
| word_quote_removal (word, quoted) |
| WORD_DESC *word; |
| int quoted; |
| { |
| WORD_DESC *w; |
| char *t; |
| |
| t = string_quote_removal (word->word, quoted); |
| w = alloc_word_desc (); |
| w->word = t ? t : savestring (""); |
| return (w); |
| } |
| |
| /* Perform quote removal on all words in LIST. If QUOTED is non-zero, |
| the members of the list are treated as if they are surrounded by |
| double quotes. Return a new list, or NULL if LIST is NULL. */ |
| WORD_LIST * |
| word_list_quote_removal (list, quoted) |
| WORD_LIST *list; |
| int quoted; |
| { |
| WORD_LIST *result, *t, *tresult, *e; |
| |
| for (t = list, result = (WORD_LIST *)NULL; t; t = t->next) |
| { |
| tresult = make_word_list (word_quote_removal (t->word, quoted), (WORD_LIST *)NULL); |
| #if 0 |
| result = (WORD_LIST *) list_append (result, tresult); |
| #else |
| if (result == 0) |
| result = e = tresult; |
| else |
| { |
| e->next = tresult; |
| while (e->next) |
| e = e->next; |
| } |
| #endif |
| } |
| return (result); |
| } |
| #endif |
| |
| /******************************************* |
| * * |
| * Functions to perform word splitting * |
| * * |
| *******************************************/ |
| |
| void |
| setifs (v) |
| SHELL_VAR *v; |
| { |
| char *t; |
| unsigned char uc; |
| |
| ifs_var = v; |
| ifs_value = (v && value_cell (v)) ? value_cell (v) : " \t\n"; |
| |
| ifs_is_set = ifs_var != 0; |
| ifs_is_null = ifs_is_set && (*ifs_value == 0); |
| |
| /* Should really merge ifs_cmap with sh_syntaxtab. XXX - doesn't yet |
| handle multibyte chars in IFS */ |
| memset (ifs_cmap, '\0', sizeof (ifs_cmap)); |
| for (t = ifs_value ; t && *t; t++) |
| { |
| uc = *t; |
| ifs_cmap[uc] = 1; |
| } |
| |
| #if defined (HANDLE_MULTIBYTE) |
| if (ifs_value == 0) |
| { |
| ifs_firstc[0] = '\0'; /* XXX - ? */ |
| ifs_firstc_len = 1; |
| } |
| else |
| { |
| if (locale_utf8locale && UTF8_SINGLEBYTE (*ifs_value)) |
| ifs_firstc_len = (*ifs_value != 0) ? 1 : 0; |
| else |
| { |
| size_t ifs_len; |
| ifs_len = strnlen (ifs_value, MB_CUR_MAX); |
| ifs_firstc_len = MBLEN (ifs_value, ifs_len); |
| } |
| if (ifs_firstc_len == 1 || ifs_firstc_len == 0 || MB_INVALIDCH (ifs_firstc_len)) |
| { |
| ifs_firstc[0] = ifs_value[0]; |
| ifs_firstc[1] = '\0'; |
| ifs_firstc_len = 1; |
| } |
| else |
| memcpy (ifs_firstc, ifs_value, ifs_firstc_len); |
| } |
| #else |
| ifs_firstc = ifs_value ? *ifs_value : 0; |
| #endif |
| } |
| |
| char * |
| getifs () |
| { |
| return ifs_value; |
| } |
| |
| /* This splits a single word into a WORD LIST on $IFS, but only if the word |
| is not quoted. list_string () performs quote removal for us, even if we |
| don't do any splitting. */ |
| WORD_LIST * |
| word_split (w, ifs_chars) |
| WORD_DESC *w; |
| char *ifs_chars; |
| { |
| WORD_LIST *result; |
| |
| if (w) |
| { |
| char *xifs; |
| |
| xifs = ((w->flags & W_QUOTED) || ifs_chars == 0) ? "" : ifs_chars; |
| result = list_string (w->word, xifs, w->flags & W_QUOTED); |
| } |
| else |
| result = (WORD_LIST *)NULL; |
| |
| return (result); |
| } |
| |
| /* Perform word splitting on LIST and return the RESULT. It is possible |
| to return (WORD_LIST *)NULL. */ |
| static WORD_LIST * |
| word_list_split (list) |
| WORD_LIST *list; |
| { |
| WORD_LIST *result, *t, *tresult, *e; |
| WORD_DESC *w; |
| |
| for (t = list, result = (WORD_LIST *)NULL; t; t = t->next) |
| { |
| tresult = word_split (t->word, ifs_value); |
| /* POSIX 2.6: "If the complete expansion appropriate for a word results |
| in an empty field, that empty field shall be deleted from the list |
| of fields that form the completely expanded command, unless the |
| original word contained single-quote or double-quote characters." |
| This is where we handle these words that contain quoted null strings |
| and other characters that expand to nothing after word splitting. */ |
| if (tresult == 0 && t->word && (t->word->flags & W_SAWQUOTEDNULL)) /* XXX */ |
| { |
| w = alloc_word_desc (); |
| w->word = (char *)xmalloc (1); |
| w->word[0] = '\0'; |
| tresult = make_word_list (w, (WORD_LIST *)NULL); |
| } |
| if (result == 0) |
| result = e = tresult; |
| else |
| { |
| e->next = tresult; |
| while (e->next) |
| e = e->next; |
| } |
| } |
| return (result); |
| } |
| |
| /************************************************** |
| * * |
| * Functions to expand an entire WORD_LIST * |
| * * |
| **************************************************/ |
| |
| /* Do any word-expansion-specific cleanup and jump to top_level */ |
| static void |
| exp_jump_to_top_level (v) |
| int v; |
| { |
| set_pipestatus_from_exit (last_command_exit_value); |
| |
| /* Cleanup code goes here. */ |
| expand_no_split_dollar_star = 0; /* XXX */ |
| if (expanding_redir) |
| undo_partial_redirects (); |
| expanding_redir = 0; |
| assigning_in_environment = 0; |
| |
| if (parse_and_execute_level == 0) |
| top_level_cleanup (); /* from sig.c */ |
| |
| jump_to_top_level (v); |
| } |
| |
| /* Put NLIST (which is a WORD_LIST * of only one element) at the front of |
| ELIST, and set ELIST to the new list. */ |
| #define PREPEND_LIST(nlist, elist) \ |
| do { nlist->next = elist; elist = nlist; } while (0) |
| |
| /* Separate out any initial variable assignments from TLIST. If set -k has |
| been executed, remove all assignment statements from TLIST. Initial |
| variable assignments and other environment assignments are placed |
| on SUBST_ASSIGN_VARLIST. */ |
| static WORD_LIST * |
| separate_out_assignments (tlist) |
| WORD_LIST *tlist; |
| { |
| register WORD_LIST *vp, *lp; |
| |
| if (tlist == 0) |
| return ((WORD_LIST *)NULL); |
| |
| if (subst_assign_varlist) |
| dispose_words (subst_assign_varlist); /* Clean up after previous error */ |
| |
| subst_assign_varlist = (WORD_LIST *)NULL; |
| vp = lp = tlist; |
| |
| /* Separate out variable assignments at the start of the command. |
| Loop invariant: vp->next == lp |
| Loop postcondition: |
| lp = list of words left after assignment statements skipped |
| tlist = original list of words |
| */ |
| while (lp && (lp->word->flags & W_ASSIGNMENT)) |
| { |
| vp = lp; |
| lp = lp->next; |
| } |
| |
| /* If lp != tlist, we have some initial assignment statements. |
| We make SUBST_ASSIGN_VARLIST point to the list of assignment |
| words and TLIST point to the remaining words. */ |
| if (lp != tlist) |
| { |
| subst_assign_varlist = tlist; |
| /* ASSERT(vp->next == lp); */ |
| vp->next = (WORD_LIST *)NULL; /* terminate variable list */ |
| tlist = lp; /* remainder of word list */ |
| } |
| |
| /* vp == end of variable list */ |
| /* tlist == remainder of original word list without variable assignments */ |
| if (!tlist) |
| /* All the words in tlist were assignment statements */ |
| return ((WORD_LIST *)NULL); |
| |
| /* ASSERT(tlist != NULL); */ |
| /* ASSERT((tlist->word->flags & W_ASSIGNMENT) == 0); */ |
| |
| /* If the -k option is in effect, we need to go through the remaining |
| words, separate out the assignment words, and place them on |
| SUBST_ASSIGN_VARLIST. */ |
| if (place_keywords_in_env) |
| { |
| WORD_LIST *tp; /* tp == running pointer into tlist */ |
| |
| tp = tlist; |
| lp = tlist->next; |
| |
| /* Loop Invariant: tp->next == lp */ |
| /* Loop postcondition: tlist == word list without assignment statements */ |
| while (lp) |
| { |
| if (lp->word->flags & W_ASSIGNMENT) |
| { |
| /* Found an assignment statement, add this word to end of |
| subst_assign_varlist (vp). */ |
| if (!subst_assign_varlist) |
| subst_assign_varlist = vp = lp; |
| else |
| { |
| vp->next = lp; |
| vp = lp; |
| } |
| |
| /* Remove the word pointed to by LP from TLIST. */ |
| tp->next = lp->next; |
| /* ASSERT(vp == lp); */ |
| lp->next = (WORD_LIST *)NULL; |
| lp = tp->next; |
| } |
| else |
| { |
| tp = lp; |
| lp = lp->next; |
| } |
| } |
| } |
| return (tlist); |
| } |
| |
| #define WEXP_VARASSIGN 0x001 |
| #define WEXP_BRACEEXP 0x002 |
| #define WEXP_TILDEEXP 0x004 |
| #define WEXP_PARAMEXP 0x008 |
| #define WEXP_PATHEXP 0x010 |
| |
| /* All of the expansions, including variable assignments at the start of |
| the list. */ |
| #define WEXP_ALL (WEXP_VARASSIGN|WEXP_BRACEEXP|WEXP_TILDEEXP|WEXP_PARAMEXP|WEXP_PATHEXP) |
| |
| /* All of the expansions except variable assignments at the start of |
| the list. */ |
| #define WEXP_NOVARS (WEXP_BRACEEXP|WEXP_TILDEEXP|WEXP_PARAMEXP|WEXP_PATHEXP) |
| |
| /* All of the `shell expansions': brace expansion, tilde expansion, parameter |
| expansion, command substitution, arithmetic expansion, word splitting, and |
| quote removal. */ |
| #define WEXP_SHELLEXP (WEXP_BRACEEXP|WEXP_TILDEEXP|WEXP_PARAMEXP) |
| |
| /* Take the list of words in LIST and do the various substitutions. Return |
| a new list of words which is the expanded list, and without things like |
| variable assignments. */ |
| |
| WORD_LIST * |
| expand_words (list) |
| WORD_LIST *list; |
| { |
| return (expand_word_list_internal (list, WEXP_ALL)); |
| } |
| |
| /* Same as expand_words (), but doesn't hack variable or environment |
| variables. */ |
| WORD_LIST * |
| expand_words_no_vars (list) |
| WORD_LIST *list; |
| { |
| return (expand_word_list_internal (list, WEXP_NOVARS)); |
| } |
| |
| WORD_LIST * |
| expand_words_shellexp (list) |
| WORD_LIST *list; |
| { |
| return (expand_word_list_internal (list, WEXP_SHELLEXP)); |
| } |
| |
| static WORD_LIST * |
| glob_expand_word_list (tlist, eflags) |
| WORD_LIST *tlist; |
| int eflags; |
| { |
| char **glob_array, *temp_string; |
| register int glob_index; |
| WORD_LIST *glob_list, *output_list, *disposables, *next; |
| WORD_DESC *tword; |
| int x; |
| |
| output_list = disposables = (WORD_LIST *)NULL; |
| glob_array = (char **)NULL; |
| while (tlist) |
| { |
| /* For each word, either globbing is attempted or the word is |
| added to orig_list. If globbing succeeds, the results are |
| added to orig_list and the word (tlist) is added to the list |
| of disposable words. If globbing fails and failed glob |
| expansions are left unchanged (the shell default), the |
| original word is added to orig_list. If globbing fails and |
| failed glob expansions are removed, the original word is |
| added to the list of disposable words. orig_list ends up |
| in reverse order and requires a call to REVERSE_LIST to |
| be set right. After all words are examined, the disposable |
| words are freed. */ |
| next = tlist->next; |
| |
| /* If the word isn't an assignment and contains an unquoted |
| pattern matching character, then glob it. */ |
| if ((tlist->word->flags & W_NOGLOB) == 0 && |
| unquoted_glob_pattern_p (tlist->word->word)) |
| { |
| glob_array = shell_glob_filename (tlist->word->word, QGLOB_CTLESC); /* XXX */ |
| |
| /* Handle error cases. |
| I don't think we should report errors like "No such file |
| or directory". However, I would like to report errors |
| like "Read failed". */ |
| |
| if (glob_array == 0 || GLOB_FAILED (glob_array)) |
| { |
| glob_array = (char **)xmalloc (sizeof (char *)); |
| glob_array[0] = (char *)NULL; |
| } |
| |
| /* Dequote the current word in case we have to use it. */ |
| if (glob_array[0] == NULL) |
| { |
| temp_string = dequote_string (tlist->word->word); |
| free (tlist->word->word); |
| tlist->word->word = temp_string; |
| } |
| |
| /* Make the array into a word list. */ |
| glob_list = (WORD_LIST *)NULL; |
| for (glob_index = 0; glob_array[glob_index]; glob_index++) |
| { |
| tword = make_bare_word (glob_array[glob_index]); |
| glob_list = make_word_list (tword, glob_list); |
| } |
| |
| if (glob_list) |
| { |
| output_list = (WORD_LIST *)list_append (glob_list, output_list); |
| PREPEND_LIST (tlist, disposables); |
| } |
| else if (fail_glob_expansion != 0) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| report_error (_("no match: %s"), tlist->word->word); |
| exp_jump_to_top_level (DISCARD); |
| } |
| else if (allow_null_glob_expansion == 0) |
| { |
| /* Failed glob expressions are left unchanged. */ |
| PREPEND_LIST (tlist, output_list); |
| } |
| else |
| { |
| /* Failed glob expressions are removed. */ |
| PREPEND_LIST (tlist, disposables); |
| } |
| } |
| else |
| { |
| /* Dequote the string. */ |
| temp_string = dequote_string (tlist->word->word); |
| free (tlist->word->word); |
| tlist->word->word = temp_string; |
| PREPEND_LIST (tlist, output_list); |
| } |
| |
| strvec_dispose (glob_array); |
| glob_array = (char **)NULL; |
| |
| tlist = next; |
| } |
| |
| if (disposables) |
| dispose_words (disposables); |
| |
| if (output_list) |
| output_list = REVERSE_LIST (output_list, WORD_LIST *); |
| |
| return (output_list); |
| } |
| |
| #if defined (BRACE_EXPANSION) |
| static WORD_LIST * |
| brace_expand_word_list (tlist, eflags) |
| WORD_LIST *tlist; |
| int eflags; |
| { |
| register char **expansions; |
| char *temp_string; |
| WORD_LIST *disposables, *output_list, *next; |
| WORD_DESC *w; |
| int eindex; |
| |
| for (disposables = output_list = (WORD_LIST *)NULL; tlist; tlist = next) |
| { |
| next = tlist->next; |
| |
| if (tlist->word->flags & W_NOBRACE) |
| { |
| /*itrace("brace_expand_word_list: %s: W_NOBRACE", tlist->word->word);*/ |
| PREPEND_LIST (tlist, output_list); |
| continue; |
| } |
| |
| if ((tlist->word->flags & (W_COMPASSIGN|W_ASSIGNARG)) == (W_COMPASSIGN|W_ASSIGNARG)) |
| { |
| /*itrace("brace_expand_word_list: %s: W_COMPASSIGN|W_ASSIGNARG", tlist->word->word);*/ |
| PREPEND_LIST (tlist, output_list); |
| continue; |
| } |
| |
| /* Only do brace expansion if the word has a brace character. If |
| not, just add the word list element to BRACES and continue. In |
| the common case, at least when running shell scripts, this will |
| degenerate to a bunch of calls to `mbschr', and then what is |
| basically a reversal of TLIST into BRACES, which is corrected |
| by a call to REVERSE_LIST () on BRACES when the end of TLIST |
| is reached. */ |
| if (mbschr (tlist->word->word, LBRACE)) |
| { |
| expansions = brace_expand (tlist->word->word); |
| |
| for (eindex = 0; temp_string = expansions[eindex]; eindex++) |
| { |
| w = alloc_word_desc (); |
| w->word = temp_string; |
| |
| /* If brace expansion didn't change the word, preserve |
| the flags. We may want to preserve the flags |
| unconditionally someday -- XXX */ |
| if (STREQ (temp_string, tlist->word->word)) |
| w->flags = tlist->word->flags; |
| else |
| w = make_word_flags (w, temp_string); |
| |
| output_list = make_word_list (w, output_list); |
| } |
| free (expansions); |
| |
| /* Add TLIST to the list of words to be freed after brace |
| expansion has been performed. */ |
| PREPEND_LIST (tlist, disposables); |
| } |
| else |
| PREPEND_LIST (tlist, output_list); |
| } |
| |
| if (disposables) |
| dispose_words (disposables); |
| |
| if (output_list) |
| output_list = REVERSE_LIST (output_list, WORD_LIST *); |
| |
| return (output_list); |
| } |
| #endif |
| |
| #if defined (ARRAY_VARS) |
| /* Take WORD, a compound array assignment, and internally run (for example), |
| 'declare -A w', where W is the variable name portion of WORD. OPTION is |
| the list of options to supply to `declare'. CMD is the declaration command |
| we are expanding right now; it's unused currently. */ |
| static int |
| make_internal_declare (word, option, cmd) |
| char *word; |
| char *option; |
| char *cmd; |
| { |
| int t, r; |
| WORD_LIST *wl; |
| WORD_DESC *w; |
| |
| w = make_word (word); |
| |
| t = assignment (w->word, 0); |
| if (w->word[t] == '=') |
| { |
| w->word[t] = '\0'; |
| if (w->word[t - 1] == '+') /* cut off any append op */ |
| w->word[t - 1] = '\0'; |
| } |
| |
| wl = make_word_list (w, (WORD_LIST *)NULL); |
| wl = make_word_list (make_word (option), wl); |
| |
| r = declare_builtin (wl); |
| |
| dispose_words (wl); |
| return r; |
| } |
| |
| /* Expand VALUE in NAME[+]=( VALUE ) to a list of words. FLAGS is 1 if NAME |
| is an associative array. |
| |
| If we are processing an indexed array, expand_compound_array_assignment |
| will expand all the individual words and quote_compound_array_list will |
| single-quote them. If we are processing an associative array, we use |
| parse_string_to_word_list to split VALUE into a list of words instead of |
| faking up a shell variable and calling expand_compound_array_assignment. |
| expand_and_quote_assoc_word expands and single-quotes each word in VALUE |
| together so we don't have problems finding the end of the subscript when |
| quoting it. |
| |
| Words in VALUE can be individual words, which are expanded and single-quoted, |
| or words of the form [IND]=VALUE, which end up as explained below, as |
| ['expanded-ind']='expanded-value'. */ |
| |
| static WORD_LIST * |
| expand_oneword (value, flags) |
| char *value; |
| int flags; |
| { |
| WORD_LIST *l, *nl; |
| char *t; |
| |
| if (flags == 0) |
| { |
| /* Indexed array */ |
| l = expand_compound_array_assignment ((SHELL_VAR *)NULL, value, flags); |
| /* Now we quote the results of the expansion above to prevent double |
| expansion. */ |
| quote_compound_array_list (l, flags); |
| return l; |
| } |
| else |
| { |
| /* Associative array */ |
| l = parse_string_to_word_list (value, 1, "array assign"); |
| /* For associative arrays, with their arbitrary subscripts, we have to |
| expand and quote in one step so we don't have to search for the |
| closing right bracket more than once. */ |
| for (nl = l; nl; nl = nl->next) |
| { |
| if ((nl->word->flags & W_ASSIGNMENT) == 0) |
| t = sh_single_quote (nl->word->word ? nl->word->word : ""); |
| else |
| t = expand_and_quote_assoc_word (nl->word->word, flags); |
| free (nl->word->word); |
| nl->word->word = t; |
| } |
| return l; |
| } |
| } |
| |
| /* Expand a single compound assignment argument to a declaration builtin. |
| This word takes the form NAME[+]=( VALUE ). The NAME[+]= is passed through |
| unchanged. The VALUE is expanded and each word in the result is single- |
| quoted. Words of the form [key]=value end up as |
| ['expanded-key']='expanded-value'. Associative arrays have special |
| handling, see expand_oneword() above. The return value is |
| NAME[+]=( expanded-and-quoted-VALUE ). */ |
| static void |
| expand_compound_assignment_word (tlist, flags) |
| WORD_LIST *tlist; |
| int flags; |
| { |
| WORD_LIST *l; |
| int wlen, oind, t; |
| char *value, *temp; |
| |
| /*itrace("expand_compound_assignment_word: original word = -%s-", tlist->word->word);*/ |
| t = assignment (tlist->word->word, 0); |
| |
| /* value doesn't have the open and close parens */ |
| oind = 1; |
| value = extract_array_assignment_list (tlist->word->word + t + 1, &oind); |
| /* This performs one round of expansion on the index/key and value and |
| single-quotes each word in the result. */ |
| l = expand_oneword (value, flags); |
| free (value); |
| |
| value = string_list (l); |
| wlen = STRLEN (value); |
| |
| /* Now, let's rebuild the string */ |
| temp = xmalloc (t + 3 + wlen + 1); /* name[+]=(value) */ |
| memcpy (temp, tlist->word->word, ++t); |
| temp[t++] = '('; |
| if (value) |
| memcpy (temp + t, value, wlen); |
| t += wlen; |
| temp[t++] = ')'; |
| temp[t] = '\0'; |
| /*itrace("expand_compound_assignment_word: reconstructed word = -%s-", temp);*/ |
| |
| free (tlist->word->word); |
| tlist->word->word = temp; |
| |
| free (value); |
| } |
| |
| /* Expand and process an argument to a declaration command. We have already |
| set flags in TLIST->word->flags depending on the declaration command |
| (declare, local, etc.) and the options supplied to it (-a, -A, etc.). |
| TLIST->word->word is of the form NAME[+]=( VALUE ). |
| |
| This does several things, all using pieces of other functions to get the |
| evaluation sequence right. It's called for compound array assignments with |
| the W_ASSIGNMENT flag set (basically, valid identifier names on the lhs). |
| It parses out which flags need to be set for declare to create the variable |
| correctly, then calls declare internally (make_internal_declare) to make |
| sure the variable exists with the correct attributes. Before the variable |
| is created, it calls expand_compound_assignment_word to expand VALUE to a |
| list of words, appropriately quoted for further evaluation. This preserves |
| the semantics of word-expansion-before-calling-builtins. Finally, it calls |
| do_word_assignment to perform the expansion and assignment with the same |
| expansion semantics as a standalone assignment statement (no word splitting, |
| etc.) even though the word is single-quoted so all that needs to happen is |
| quote removal. */ |
| static WORD_LIST * |
| expand_declaration_argument (tlist, wcmd) |
| WORD_LIST *tlist, *wcmd; |
| { |
| char opts[16], omap[128]; |
| int t, opti, oind, skip, inheriting; |
| WORD_LIST *l; |
| |
| inheriting = localvar_inherit; |
| opti = 0; |
| if (tlist->word->flags & (W_ASSIGNASSOC|W_ASSNGLOBAL|W_CHKLOCAL|W_ASSIGNARRAY)) |
| opts[opti++] = '-'; |
| |
| if ((tlist->word->flags & (W_ASSIGNASSOC|W_ASSNGLOBAL)) == (W_ASSIGNASSOC|W_ASSNGLOBAL)) |
| { |
| opts[opti++] = 'g'; |
| opts[opti++] = 'A'; |
| } |
| else if (tlist->word->flags & W_ASSIGNASSOC) |
| { |
| opts[opti++] = 'A'; |
| } |
| else if ((tlist->word->flags & (W_ASSIGNARRAY|W_ASSNGLOBAL)) == (W_ASSIGNARRAY|W_ASSNGLOBAL)) |
| { |
| opts[opti++] = 'g'; |
| opts[opti++] = 'a'; |
| } |
| else if (tlist->word->flags & W_ASSIGNARRAY) |
| { |
| opts[opti++] = 'a'; |
| } |
| else if (tlist->word->flags & W_ASSNGLOBAL) |
| opts[opti++] = 'g'; |
| |
| if (tlist->word->flags & W_CHKLOCAL) |
| opts[opti++] = 'G'; |
| |
| /* If we have special handling note the integer attribute and others |
| that transform the value upon assignment. What we do is take all |
| of the option arguments and scan through them looking for options |
| that cause such transformations, and add them to the `opts' array. */ |
| |
| memset (omap, '\0', sizeof (omap)); |
| for (l = wcmd->next; l != tlist; l = l->next) |
| { |
| if (l->word->word[0] != '-') |
| break; /* non-option argument */ |
| if (l->word->word[0] == '-' && l->word->word[1] == '-' && l->word->word[2] == 0) |
| break; /* -- signals end of options */ |
| for (oind = 1; l->word->word[oind]; oind++) |
| switch (l->word->word[oind]) |
| { |
| case 'I': |
| inheriting = 1; |
| case 'i': |
| case 'l': |
| case 'u': |
| case 'c': |
| omap[l->word->word[oind]] = 1; |
| if (opti == 0) |
| opts[opti++] = '-'; |
| break; |
| default: |
| break; |
| } |
| } |
| |
| for (oind = 0; oind < sizeof (omap); oind++) |
| if (omap[oind]) |
| opts[opti++] = oind; |
| |
| /* If there are no -a/-A options, but we have a compound assignment, |
| we have a choice: we can set opts[0]='-', opts[1]='a', since the |
| default is to create an indexed array, and call |
| make_internal_declare with that, or we can just skip the -a and let |
| declare_builtin deal with it. Once we're here, we're better set |
| up for the latter, since we don't want to deal with looking up |
| any existing variable here -- better to let declare_builtin do it. |
| We need the variable created, though, especially if it's local, so |
| we get the scoping right before we call do_word_assignment. |
| To ensure that make_local_declare gets called, we add `--' if there |
| aren't any options. */ |
| if ((tlist->word->flags & (W_ASSIGNASSOC|W_ASSIGNARRAY)) == 0) |
| { |
| if (opti == 0) |
| { |
| opts[opti++] = '-'; |
| opts[opti++] = '-'; |
| } |
| } |
| opts[opti] = '\0'; |
| |
| /* This isn't perfect, but it's a start. Improvements later. We expand |
| tlist->word->word and single-quote the results to avoid multiple |
| expansions by, say, do_assignment_internal(). We have to weigh the |
| cost of reconstructing the compound assignment string with its single |
| quoting and letting the declare builtin handle it. The single quotes |
| will prevent any unwanted additional expansion or word splitting. */ |
| expand_compound_assignment_word (tlist, (tlist->word->flags & W_ASSIGNASSOC) ? 1 : 0); |
| |
| skip = 0; |
| if (opti > 0) |
| { |
| t = make_internal_declare (tlist->word->word, opts, wcmd ? wcmd->word->word : (char *)0); |
| if (t != EXECUTION_SUCCESS) |
| { |
| last_command_exit_value = t; |
| if (tlist->word->flags & W_FORCELOCAL) /* non-fatal error */ |
| skip = 1; |
| else |
| exp_jump_to_top_level (DISCARD); |
| } |
| } |
| |
| if (skip == 0) |
| { |
| t = do_word_assignment (tlist->word, 0); |
| if (t == 0) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| exp_jump_to_top_level (DISCARD); |
| } |
| } |
| |
| /* Now transform the word as ksh93 appears to do and go on */ |
| t = assignment (tlist->word->word, 0); |
| tlist->word->word[t] = '\0'; |
| if (tlist->word->word[t - 1] == '+') |
| tlist->word->word[t - 1] = '\0'; /* cut off append op */ |
| tlist->word->flags &= ~(W_ASSIGNMENT|W_NOSPLIT|W_COMPASSIGN|W_ASSIGNARG|W_ASSIGNASSOC|W_ASSIGNARRAY); |
| |
| return (tlist); |
| } |
| #endif /* ARRAY_VARS */ |
| |
| static WORD_LIST * |
| shell_expand_word_list (tlist, eflags) |
| WORD_LIST *tlist; |
| int eflags; |
| { |
| WORD_LIST *expanded, *orig_list, *new_list, *next, *temp_list, *wcmd; |
| int expanded_something, has_dollar_at; |
| |
| /* We do tilde expansion all the time. This is what 1003.2 says. */ |
| wcmd = new_list = (WORD_LIST *)NULL; |
| |
| for (orig_list = tlist; tlist; tlist = next) |
| { |
| if (wcmd == 0 && (tlist->word->flags & W_ASSNBLTIN)) |
| wcmd = tlist; |
| |
| next = tlist->next; |
| |
| #if defined (ARRAY_VARS) |
| /* If this is a compound array assignment to a builtin that accepts |
| such assignments (e.g., `declare'), take the assignment and perform |
| it separately, handling the semantics of declarations inside shell |
| functions. This avoids the double-evaluation of such arguments, |
| because `declare' does some evaluation of compound assignments on |
| its own. */ |
| if ((tlist->word->flags & (W_COMPASSIGN|W_ASSIGNARG)) == (W_COMPASSIGN|W_ASSIGNARG)) |
| expand_declaration_argument (tlist, wcmd); |
| #endif |
| |
| expanded_something = 0; |
| expanded = expand_word_internal |
| (tlist->word, 0, 0, &has_dollar_at, &expanded_something); |
| |
| if (expanded == &expand_word_error || expanded == &expand_word_fatal) |
| { |
| /* By convention, each time this error is returned, |
| tlist->word->word has already been freed. */ |
| tlist->word->word = (char *)NULL; |
| |
| /* Dispose our copy of the original list. */ |
| dispose_words (orig_list); |
| /* Dispose the new list we're building. */ |
| dispose_words (new_list); |
| |
| last_command_exit_value = EXECUTION_FAILURE; |
| if (expanded == &expand_word_error) |
| exp_jump_to_top_level (DISCARD); |
| else |
| exp_jump_to_top_level (FORCE_EOF); |
| } |
| |
| /* Don't split words marked W_NOSPLIT. */ |
| if (expanded_something && (tlist->word->flags & W_NOSPLIT) == 0) |
| { |
| temp_list = word_list_split (expanded); |
| dispose_words (expanded); |
| } |
| else |
| { |
| /* If no parameter expansion, command substitution, process |
| substitution, or arithmetic substitution took place, then |
| do not do word splitting. We still have to remove quoted |
| null characters from the result. */ |
| word_list_remove_quoted_nulls (expanded); |
| temp_list = expanded; |
| } |
| |
| expanded = REVERSE_LIST (temp_list, WORD_LIST *); |
| new_list = (WORD_LIST *)list_append (expanded, new_list); |
| } |
| |
| if (orig_list) |
| dispose_words (orig_list); |
| |
| if (new_list) |
| new_list = REVERSE_LIST (new_list, WORD_LIST *); |
| |
| return (new_list); |
| } |
| |
| /* The workhorse for expand_words () and expand_words_no_vars (). |
| First arg is LIST, a WORD_LIST of words. |
| Second arg EFLAGS is a flags word controlling which expansions are |
| performed. |
| |
| This does all of the substitutions: brace expansion, tilde expansion, |
| parameter expansion, command substitution, arithmetic expansion, |
| process substitution, word splitting, and pathname expansion, according |
| to the bits set in EFLAGS. Words with the W_QUOTED or W_NOSPLIT bits |
| set, or for which no expansion is done, do not undergo word splitting. |
| Words with the W_NOGLOB bit set do not undergo pathname expansion; words |
| with W_NOBRACE set do not undergo brace expansion (see |
| brace_expand_word_list above). */ |
| static WORD_LIST * |
| expand_word_list_internal (list, eflags) |
| WORD_LIST *list; |
| int eflags; |
| { |
| WORD_LIST *new_list, *temp_list; |
| int tint; |
| char *savecmd; |
| |
| tempenv_assign_error = 0; |
| if (list == 0) |
| return ((WORD_LIST *)NULL); |
| |
| garglist = new_list = copy_word_list (list); |
| if (eflags & WEXP_VARASSIGN) |
| { |
| garglist = new_list = separate_out_assignments (new_list); |
| if (new_list == 0) |
| { |
| if (subst_assign_varlist) |
| { |
| /* All the words were variable assignments, so they are placed |
| into the shell's environment. */ |
| for (temp_list = subst_assign_varlist; temp_list; temp_list = temp_list->next) |
| { |
| savecmd = this_command_name; |
| this_command_name = (char *)NULL; /* no arithmetic errors */ |
| tint = do_word_assignment (temp_list->word, 0); |
| this_command_name = savecmd; |
| /* Variable assignment errors in non-interactive shells |
| running in Posix.2 mode cause the shell to exit, unless |
| they are being run by the `command' builtin. */ |
| if (tint == 0) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| if (interactive_shell == 0 && posixly_correct && executing_command_builtin == 0) |
| exp_jump_to_top_level (FORCE_EOF); |
| else |
| exp_jump_to_top_level (DISCARD); |
| } |
| } |
| dispose_words (subst_assign_varlist); |
| subst_assign_varlist = (WORD_LIST *)NULL; |
| } |
| return ((WORD_LIST *)NULL); |
| } |
| } |
| |
| /* Begin expanding the words that remain. The expansions take place on |
| things that aren't really variable assignments. */ |
| |
| #if defined (BRACE_EXPANSION) |
| /* Do brace expansion on this word if there are any brace characters |
| in the string. */ |
| if ((eflags & WEXP_BRACEEXP) && brace_expansion && new_list) |
| new_list = brace_expand_word_list (new_list, eflags); |
| #endif /* BRACE_EXPANSION */ |
| |
| /* Perform the `normal' shell expansions: tilde expansion, parameter and |
| variable substitution, command substitution, arithmetic expansion, |
| and word splitting. */ |
| new_list = shell_expand_word_list (new_list, eflags); |
| |
| /* Okay, we're almost done. Now let's just do some filename |
| globbing. */ |
| if (new_list) |
| { |
| if ((eflags & WEXP_PATHEXP) && disallow_filename_globbing == 0) |
| /* Glob expand the word list unless globbing has been disabled. */ |
| new_list = glob_expand_word_list (new_list, eflags); |
| else |
| /* Dequote the words, because we're not performing globbing. */ |
| new_list = dequote_list (new_list); |
| } |
| |
| if ((eflags & WEXP_VARASSIGN) && subst_assign_varlist) |
| { |
| sh_wassign_func_t *assign_func; |
| int is_special_builtin, is_builtin_or_func; |
| |
| /* If the remainder of the words expand to nothing, Posix.2 requires |
| that the variable and environment assignments affect the shell's |
| environment. */ |
| assign_func = new_list ? assign_in_env : do_word_assignment; |
| tempenv_assign_error = 0; |
| |
| is_builtin_or_func = (new_list && new_list->word && (find_shell_builtin (new_list->word->word) || find_function (new_list->word->word))); |
| /* Posix says that special builtins exit if a variable assignment error |
| occurs in an assignment preceding it. */ |
| is_special_builtin = (posixly_correct && new_list && new_list->word && find_special_builtin (new_list->word->word)); |
| |
| for (temp_list = subst_assign_varlist; temp_list; temp_list = temp_list->next) |
| { |
| savecmd = this_command_name; |
| this_command_name = (char *)NULL; |
| assigning_in_environment = (assign_func == assign_in_env); |
| tint = (*assign_func) (temp_list->word, is_builtin_or_func); |
| assigning_in_environment = 0; |
| this_command_name = savecmd; |
| /* Variable assignment errors in non-interactive shells running |
| in Posix.2 mode cause the shell to exit. */ |
| if (tint == 0) |
| { |
| if (assign_func == do_word_assignment) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| if (interactive_shell == 0 && posixly_correct) |
| exp_jump_to_top_level (FORCE_EOF); |
| else |
| exp_jump_to_top_level (DISCARD); |
| } |
| else if (interactive_shell == 0 && is_special_builtin) |
| { |
| last_command_exit_value = EXECUTION_FAILURE; |
| exp_jump_to_top_level (FORCE_EOF); |
| } |
| else |
| tempenv_assign_error++; |
| } |
| } |
| |
| dispose_words (subst_assign_varlist); |
| subst_assign_varlist = (WORD_LIST *)NULL; |
| } |
| |
| return (new_list); |
| } |