parser.c revision 253659
/*-
 * Copyright (c) 1991, 1993
 *	The Regents of the University of California. All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * Kenneth Almquist.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 4. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#ifndef lint
#if 0
static char sccsid[] = "@(#)parser.c 8.7 (Berkeley) 5/16/95";
#endif
#endif /* not lint */
#include <sys/cdefs.h>
__FBSDID("$FreeBSD: head/bin/sh/parser.c 253659 2013-07-25 20:50:35Z jilles $");

#include <stdlib.h>
#include <unistd.h>
#include <stdio.h>

#include "shell.h"
#include "parser.h"
#include "nodes.h"
#include "expand.h"	/* defines rmescapes() */
#include "syntax.h"
#include "options.h"
#include "input.h"
#include "output.h"
#include "var.h"
#include "error.h"
#include "memalloc.h"
#include "mystring.h"
#include "alias.h"
#include "show.h"
#include "eval.h"
#include "exec.h"	/* to check for special builtins */
#ifndef NO_HISTORY
#include "myhistedit.h"
#endif

/*
 * Shell command parser.
671556Srgrimes */ 681556Srgrimes 69142845Sobrien#define EOFMARKLEN 79 70142845Sobrien#define PROMPTLEN 128 711556Srgrimes 72214709Sjilles/* values of checkkwd variable */ 73214709Sjilles#define CHKALIAS 0x1 74214709Sjilles#define CHKKWD 0x2 75214709Sjilles#define CHKNL 0x4 76214709Sjilles 771556Srgrimes/* values returned by readtoken */ 7817987Speter#include "token.h" 791556Srgrimes 801556Srgrimes 811556Srgrimes 821556Srgrimesstruct heredoc { 831556Srgrimes struct heredoc *next; /* next here document in list */ 841556Srgrimes union node *here; /* redirection node */ 851556Srgrimes char *eofmark; /* string indicating end of input */ 861556Srgrimes int striptabs; /* if set, strip leading tabs */ 871556Srgrimes}; 881556Srgrimes 89206145Sjillesstruct parser_temp { 90206145Sjilles struct parser_temp *next; 91206145Sjilles void *data; 92206145Sjilles}; 931556Srgrimes 941556Srgrimes 95213760Sobrienstatic struct heredoc *heredoclist; /* list of here documents to read */ 96213760Sobrienstatic int doprompt; /* if set, prompt the user */ 97213760Sobrienstatic int needprompt; /* true if interactive and at start of line */ 98213760Sobrienstatic int lasttoken; /* last token read */ 99253658Sjillesint tokpushback; /* last token pushed back */ 100213760Sobrienstatic char *wordtext; /* text of last word returned by readtoken */ 101253659Sjillesstatic int checkkwd; 102213760Sobrienstatic struct nodelist *backquotelist; 103213760Sobrienstatic union node *redirnode; 104213760Sobrienstatic struct heredoc *heredoc; 105213760Sobrienstatic int quoteflag; /* set if (part of) last token was quoted */ 106213760Sobrienstatic int startlinno; /* line # where last token started */ 107213760Sobrienstatic int funclinno; /* line # where the current function started */ 108213760Sobrienstatic struct parser_temp *parser_temp; 1091556Srgrimes 1101556Srgrimes 111214525Sjillesstatic union node *list(int, int); 112213811Sobrienstatic union node *andor(void); 113213811Sobrienstatic union node 
*pipeline(void); 114213811Sobrienstatic union node *command(void); 115213811Sobrienstatic union node *simplecmd(union node **, union node *); 116213811Sobrienstatic union node *makename(void); 117213811Sobrienstatic void parsefname(void); 118213811Sobrienstatic void parseheredoc(void); 119213811Sobrienstatic int peektoken(void); 120213811Sobrienstatic int readtoken(void); 121213811Sobrienstatic int xxreadtoken(void); 122248980Sjillesstatic int readtoken1(int, const char *, const char *, int); 123213811Sobrienstatic int noexpand(char *); 124213811Sobrienstatic void synexpect(int) __dead2; 125213811Sobrienstatic void synerror(const char *) __dead2; 126213811Sobrienstatic void setprompt(int); 1271556Srgrimes 12817987Speter 129213811Sobrienstatic void * 130206145Sjillesparser_temp_alloc(size_t len) 131206145Sjilles{ 132206145Sjilles struct parser_temp *t; 133206145Sjilles 134206145Sjilles INTOFF; 135206145Sjilles t = ckmalloc(sizeof(*t)); 136206145Sjilles t->data = NULL; 137206145Sjilles t->next = parser_temp; 138206145Sjilles parser_temp = t; 139206145Sjilles t->data = ckmalloc(len); 140206145Sjilles INTON; 141206145Sjilles return t->data; 142206145Sjilles} 143206145Sjilles 144206145Sjilles 145213811Sobrienstatic void * 146206145Sjillesparser_temp_realloc(void *ptr, size_t len) 147206145Sjilles{ 148206145Sjilles struct parser_temp *t; 149206145Sjilles 150206145Sjilles INTOFF; 151206145Sjilles t = parser_temp; 152206145Sjilles if (ptr != t->data) 153206145Sjilles error("bug: parser_temp_realloc misused"); 154206145Sjilles t->data = ckrealloc(t->data, len); 155206145Sjilles INTON; 156206145Sjilles return t->data; 157206145Sjilles} 158206145Sjilles 159206145Sjilles 160213811Sobrienstatic void 161206145Sjillesparser_temp_free_upto(void *ptr) 162206145Sjilles{ 163206145Sjilles struct parser_temp *t; 164206145Sjilles int done = 0; 165206145Sjilles 166206145Sjilles INTOFF; 167206145Sjilles while (parser_temp != NULL && !done) { 168206145Sjilles t = parser_temp; 
169206145Sjilles parser_temp = t->next; 170206145Sjilles done = t->data == ptr; 171206145Sjilles ckfree(t->data); 172206145Sjilles ckfree(t); 173206145Sjilles } 174206145Sjilles INTON; 175206145Sjilles if (!done) 176206145Sjilles error("bug: parser_temp_free_upto misused"); 177206145Sjilles} 178206145Sjilles 179206145Sjilles 180213811Sobrienstatic void 181206145Sjillesparser_temp_free_all(void) 182206145Sjilles{ 183206145Sjilles struct parser_temp *t; 184206145Sjilles 185206145Sjilles INTOFF; 186206145Sjilles while (parser_temp != NULL) { 187206145Sjilles t = parser_temp; 188206145Sjilles parser_temp = t->next; 189206145Sjilles ckfree(t->data); 190206145Sjilles ckfree(t); 191206145Sjilles } 192206145Sjilles INTON; 193206145Sjilles} 194206145Sjilles 195206145Sjilles 1961556Srgrimes/* 1971556Srgrimes * Read and parse a command. Returns NEOF on end of file. (NULL is a 1981556Srgrimes * valid parse tree indicating a blank line.) 1991556Srgrimes */ 2001556Srgrimes 2011556Srgrimesunion node * 20290111Simpparsecmd(int interact) 20317987Speter{ 2041556Srgrimes int t; 2051556Srgrimes 206206145Sjilles /* This assumes the parser is not re-entered, 207206145Sjilles * which could happen if we add command substitution on PS1/PS2. 
208206145Sjilles */ 209206145Sjilles parser_temp_free_all(); 210208656Sjilles heredoclist = NULL; 211206145Sjilles 21260593Scracauer tokpushback = 0; 2131556Srgrimes doprompt = interact; 2141556Srgrimes if (doprompt) 2151556Srgrimes setprompt(1); 2161556Srgrimes else 2171556Srgrimes setprompt(0); 2181556Srgrimes needprompt = 0; 2191556Srgrimes t = readtoken(); 2201556Srgrimes if (t == TEOF) 2211556Srgrimes return NEOF; 2221556Srgrimes if (t == TNL) 2231556Srgrimes return NULL; 2241556Srgrimes tokpushback++; 225214531Sjilles return list(1, 1); 2261556Srgrimes} 2271556Srgrimes 2281556Srgrimes 229213811Sobrienstatic union node * 230214525Sjilleslist(int nlflag, int erflag) 23117987Speter{ 232214599Sjilles union node *ntop, *n1, *n2, *n3; 23317987Speter int tok; 2341556Srgrimes 235214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 236214531Sjilles if (!nlflag && !erflag && tokendlist[peektoken()]) 2371556Srgrimes return NULL; 238214599Sjilles ntop = n1 = NULL; 2391556Srgrimes for (;;) { 24017987Speter n2 = andor(); 24117987Speter tok = readtoken(); 24217987Speter if (tok == TBACKGND) { 243245382Sjilles if (n2 != NULL && n2->type == NPIPE) { 244223282Sjilles n2->npipe.backgnd = 1; 245245382Sjilles } else if (n2 != NULL && n2->type == NREDIR) { 24617987Speter n2->type = NBACKGND; 24717987Speter } else { 24817987Speter n3 = (union node *)stalloc(sizeof (struct nredir)); 24917987Speter n3->type = NBACKGND; 25017987Speter n3->nredir.n = n2; 25117987Speter n3->nredir.redirect = NULL; 25217987Speter n2 = n3; 25317987Speter } 25417987Speter } 255214599Sjilles if (ntop == NULL) 256214599Sjilles ntop = n2; 257214599Sjilles else if (n1 == NULL) { 258214599Sjilles n1 = (union node *)stalloc(sizeof (struct nbinary)); 259214599Sjilles n1->type = NSEMI; 260214599Sjilles n1->nbinary.ch1 = ntop; 261214599Sjilles n1->nbinary.ch2 = n2; 262214599Sjilles ntop = n1; 26317987Speter } 26417987Speter else { 26517987Speter n3 = (union node *)stalloc(sizeof (struct nbinary)); 26617987Speter 
n3->type = NSEMI; 267214599Sjilles n3->nbinary.ch1 = n1->nbinary.ch2; 26817987Speter n3->nbinary.ch2 = n2; 269214599Sjilles n1->nbinary.ch2 = n3; 27017987Speter n1 = n3; 27117987Speter } 27217987Speter switch (tok) { 27313882Sjoerg case TBACKGND: 27417987Speter case TSEMI: 27517987Speter tok = readtoken(); 276102410Scharnier /* FALLTHROUGH */ 2771556Srgrimes case TNL: 27817987Speter if (tok == TNL) { 27917987Speter parseheredoc(); 28017987Speter if (nlflag) 281214599Sjilles return ntop; 282210488Sjilles } else if (tok == TEOF && nlflag) { 283210488Sjilles parseheredoc(); 284214599Sjilles return ntop; 28517987Speter } else { 28617987Speter tokpushback++; 28717987Speter } 288214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 289245381Sjilles if (!nlflag && (erflag ? peektoken() == TEOF : 290245381Sjilles tokendlist[peektoken()])) 291214599Sjilles return ntop; 2921556Srgrimes break; 2931556Srgrimes case TEOF: 2941556Srgrimes if (heredoclist) 2951556Srgrimes parseheredoc(); 2961556Srgrimes else 2971556Srgrimes pungetc(); /* push back EOF on input */ 298214599Sjilles return ntop; 2991556Srgrimes default: 300214525Sjilles if (nlflag || erflag) 3011556Srgrimes synexpect(-1); 3021556Srgrimes tokpushback++; 303214599Sjilles return ntop; 3041556Srgrimes } 3051556Srgrimes } 3061556Srgrimes} 3071556Srgrimes 3081556Srgrimes 3091556Srgrimes 310213811Sobrienstatic union node * 31190111Simpandor(void) 31290111Simp{ 3131556Srgrimes union node *n1, *n2, *n3; 3141556Srgrimes int t; 3151556Srgrimes 3161556Srgrimes n1 = pipeline(); 3171556Srgrimes for (;;) { 3181556Srgrimes if ((t = readtoken()) == TAND) { 3191556Srgrimes t = NAND; 3201556Srgrimes } else if (t == TOR) { 3211556Srgrimes t = NOR; 3221556Srgrimes } else { 3231556Srgrimes tokpushback++; 3241556Srgrimes return n1; 3251556Srgrimes } 3261556Srgrimes n2 = pipeline(); 3271556Srgrimes n3 = (union node *)stalloc(sizeof (struct nbinary)); 3281556Srgrimes n3->type = t; 3291556Srgrimes n3->nbinary.ch1 = n1; 3301556Srgrimes 
n3->nbinary.ch2 = n2; 3311556Srgrimes n1 = n3; 3321556Srgrimes } 3331556Srgrimes} 3341556Srgrimes 3351556Srgrimes 3361556Srgrimes 337213811Sobrienstatic union node * 33890111Simppipeline(void) 33990111Simp{ 34075336Sbrian union node *n1, *n2, *pipenode; 3411556Srgrimes struct nodelist *lp, *prev; 342214281Sjilles int negate, t; 3431556Srgrimes 34475336Sbrian negate = 0; 345214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 3461556Srgrimes TRACE(("pipeline: entered\n")); 34775336Sbrian while (readtoken() == TNOT) 34875336Sbrian negate = !negate; 34975336Sbrian tokpushback++; 3501556Srgrimes n1 = command(); 3511556Srgrimes if (readtoken() == TPIPE) { 3521556Srgrimes pipenode = (union node *)stalloc(sizeof (struct npipe)); 3531556Srgrimes pipenode->type = NPIPE; 3541556Srgrimes pipenode->npipe.backgnd = 0; 3551556Srgrimes lp = (struct nodelist *)stalloc(sizeof (struct nodelist)); 3561556Srgrimes pipenode->npipe.cmdlist = lp; 3571556Srgrimes lp->n = n1; 3581556Srgrimes do { 3591556Srgrimes prev = lp; 3601556Srgrimes lp = (struct nodelist *)stalloc(sizeof (struct nodelist)); 361214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 362214281Sjilles t = readtoken(); 363214281Sjilles tokpushback++; 364214281Sjilles if (t == TNOT) 365214281Sjilles lp->n = pipeline(); 366214281Sjilles else 367214281Sjilles lp->n = command(); 3681556Srgrimes prev->next = lp; 3691556Srgrimes } while (readtoken() == TPIPE); 3701556Srgrimes lp->next = NULL; 3711556Srgrimes n1 = pipenode; 3721556Srgrimes } 3731556Srgrimes tokpushback++; 37475336Sbrian if (negate) { 37575336Sbrian n2 = (union node *)stalloc(sizeof (struct nnot)); 37675336Sbrian n2->type = NNOT; 37775336Sbrian n2->nnot.com = n1; 37875336Sbrian return n2; 37975336Sbrian } else 38075336Sbrian return n1; 3811556Srgrimes} 3821556Srgrimes 3831556Srgrimes 3841556Srgrimes 385213811Sobrienstatic union node * 38690111Simpcommand(void) 38790111Simp{ 3881556Srgrimes union node *n1, *n2; 3891556Srgrimes union node *ap, **app; 3901556Srgrimes 
union node *cp, **cpp; 3911556Srgrimes union node *redir, **rpp; 392214281Sjilles int t; 393218325Sjilles int is_subshell; 3941556Srgrimes 395214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 396218325Sjilles is_subshell = 0; 39717987Speter redir = NULL; 39817987Speter n1 = NULL; 3991556Srgrimes rpp = &redir; 40020425Ssteve 4011556Srgrimes /* Check for redirection which may precede command */ 4021556Srgrimes while (readtoken() == TREDIR) { 4031556Srgrimes *rpp = n2 = redirnode; 4041556Srgrimes rpp = &n2->nfile.next; 4051556Srgrimes parsefname(); 4061556Srgrimes } 4071556Srgrimes tokpushback++; 4081556Srgrimes 4091556Srgrimes switch (readtoken()) { 4101556Srgrimes case TIF: 4111556Srgrimes n1 = (union node *)stalloc(sizeof (struct nif)); 4121556Srgrimes n1->type = NIF; 413214525Sjilles if ((n1->nif.test = list(0, 0)) == NULL) 414104554Stjr synexpect(-1); 4151556Srgrimes if (readtoken() != TTHEN) 4161556Srgrimes synexpect(TTHEN); 417214525Sjilles n1->nif.ifpart = list(0, 0); 4181556Srgrimes n2 = n1; 4191556Srgrimes while (readtoken() == TELIF) { 4201556Srgrimes n2->nif.elsepart = (union node *)stalloc(sizeof (struct nif)); 4211556Srgrimes n2 = n2->nif.elsepart; 4221556Srgrimes n2->type = NIF; 423214525Sjilles if ((n2->nif.test = list(0, 0)) == NULL) 424104554Stjr synexpect(-1); 4251556Srgrimes if (readtoken() != TTHEN) 4261556Srgrimes synexpect(TTHEN); 427214525Sjilles n2->nif.ifpart = list(0, 0); 4281556Srgrimes } 4291556Srgrimes if (lasttoken == TELSE) 430214525Sjilles n2->nif.elsepart = list(0, 0); 4311556Srgrimes else { 4321556Srgrimes n2->nif.elsepart = NULL; 4331556Srgrimes tokpushback++; 4341556Srgrimes } 4351556Srgrimes if (readtoken() != TFI) 4361556Srgrimes synexpect(TFI); 437214709Sjilles checkkwd = CHKKWD | CHKALIAS; 4381556Srgrimes break; 4391556Srgrimes case TWHILE: 4401556Srgrimes case TUNTIL: { 4411556Srgrimes int got; 4421556Srgrimes n1 = (union node *)stalloc(sizeof (struct nbinary)); 4431556Srgrimes n1->type = (lasttoken == TWHILE)? 
NWHILE : NUNTIL; 444214525Sjilles if ((n1->nbinary.ch1 = list(0, 0)) == NULL) 445104554Stjr synexpect(-1); 4461556Srgrimes if ((got=readtoken()) != TDO) { 4471556SrgrimesTRACE(("expecting DO got %s %s\n", tokname[got], got == TWORD ? wordtext : "")); 4481556Srgrimes synexpect(TDO); 4491556Srgrimes } 450214525Sjilles n1->nbinary.ch2 = list(0, 0); 4511556Srgrimes if (readtoken() != TDONE) 4521556Srgrimes synexpect(TDONE); 453214709Sjilles checkkwd = CHKKWD | CHKALIAS; 4541556Srgrimes break; 4551556Srgrimes } 4561556Srgrimes case TFOR: 4571556Srgrimes if (readtoken() != TWORD || quoteflag || ! goodname(wordtext)) 4581556Srgrimes synerror("Bad for loop variable"); 4591556Srgrimes n1 = (union node *)stalloc(sizeof (struct nfor)); 4601556Srgrimes n1->type = NFOR; 4611556Srgrimes n1->nfor.var = wordtext; 462199282Sjilles while (readtoken() == TNL) 463199282Sjilles ; 464199282Sjilles if (lasttoken == TWORD && ! quoteflag && equal(wordtext, "in")) { 4651556Srgrimes app = ≈ 4661556Srgrimes while (readtoken() == TWORD) { 4671556Srgrimes n2 = (union node *)stalloc(sizeof (struct narg)); 4681556Srgrimes n2->type = NARG; 4691556Srgrimes n2->narg.text = wordtext; 4701556Srgrimes n2->narg.backquote = backquotelist; 4711556Srgrimes *app = n2; 4721556Srgrimes app = &n2->narg.next; 4731556Srgrimes } 4741556Srgrimes *app = NULL; 4751556Srgrimes n1->nfor.args = ap; 4761556Srgrimes if (lasttoken != TNL && lasttoken != TSEMI) 4771556Srgrimes synexpect(-1); 4781556Srgrimes } else { 479149096Sstefanf static char argvars[5] = { 480149096Sstefanf CTLVAR, VSNORMAL|VSQUOTE, '@', '=', '\0' 481149096Sstefanf }; 4821556Srgrimes n2 = (union node *)stalloc(sizeof (struct narg)); 4831556Srgrimes n2->type = NARG; 484149096Sstefanf n2->narg.text = argvars; 4851556Srgrimes n2->narg.backquote = NULL; 4861556Srgrimes n2->narg.next = NULL; 4871556Srgrimes n1->nfor.args = n2; 4881556Srgrimes /* 4891556Srgrimes * Newline or semicolon here is optional (but note 4901556Srgrimes * that the original Bourne 
shell only allowed NL). 4911556Srgrimes */ 4921556Srgrimes if (lasttoken != TNL && lasttoken != TSEMI) 4931556Srgrimes tokpushback++; 4941556Srgrimes } 495214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 4961556Srgrimes if ((t = readtoken()) == TDO) 4971556Srgrimes t = TDONE; 4981556Srgrimes else if (t == TBEGIN) 4991556Srgrimes t = TEND; 5001556Srgrimes else 5011556Srgrimes synexpect(-1); 502214525Sjilles n1->nfor.body = list(0, 0); 5031556Srgrimes if (readtoken() != t) 5041556Srgrimes synexpect(t); 505214709Sjilles checkkwd = CHKKWD | CHKALIAS; 5061556Srgrimes break; 5071556Srgrimes case TCASE: 5081556Srgrimes n1 = (union node *)stalloc(sizeof (struct ncase)); 5091556Srgrimes n1->type = NCASE; 5101556Srgrimes if (readtoken() != TWORD) 5111556Srgrimes synexpect(TWORD); 5121556Srgrimes n1->ncase.expr = n2 = (union node *)stalloc(sizeof (struct narg)); 5131556Srgrimes n2->type = NARG; 5141556Srgrimes n2->narg.text = wordtext; 5151556Srgrimes n2->narg.backquote = backquotelist; 5161556Srgrimes n2->narg.next = NULL; 5171556Srgrimes while (readtoken() == TNL); 5181556Srgrimes if (lasttoken != TWORD || ! 
equal(wordtext, "in")) 5191556Srgrimes synerror("expecting \"in\""); 5201556Srgrimes cpp = &n1->ncase.cases; 521214709Sjilles checkkwd = CHKNL | CHKKWD, readtoken(); 522104202Stjr while (lasttoken != TESAC) { 5231556Srgrimes *cpp = cp = (union node *)stalloc(sizeof (struct nclist)); 5241556Srgrimes cp->type = NCLIST; 5251556Srgrimes app = &cp->nclist.pattern; 526104207Stjr if (lasttoken == TLP) 527104207Stjr readtoken(); 5281556Srgrimes for (;;) { 5291556Srgrimes *app = ap = (union node *)stalloc(sizeof (struct narg)); 5301556Srgrimes ap->type = NARG; 5311556Srgrimes ap->narg.text = wordtext; 5321556Srgrimes ap->narg.backquote = backquotelist; 533214709Sjilles checkkwd = CHKNL | CHKKWD; 534214709Sjilles if (readtoken() != TPIPE) 5351556Srgrimes break; 5361556Srgrimes app = &ap->narg.next; 5372760Ssef readtoken(); 5381556Srgrimes } 5391556Srgrimes ap->narg.next = NULL; 5401556Srgrimes if (lasttoken != TRP) 541214709Sjilles synexpect(TRP); 542214525Sjilles cp->nclist.body = list(0, 0); 5432760Ssef 544214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 5452760Ssef if ((t = readtoken()) != TESAC) { 546223186Sjilles if (t == TENDCASE) 547223186Sjilles ; 548223186Sjilles else if (t == TFALLTHRU) 549223186Sjilles cp->type = NCLISTFALLTHRU; 550223186Sjilles else 551214709Sjilles synexpect(TENDCASE); 552223186Sjilles checkkwd = CHKNL | CHKKWD, readtoken(); 5532760Ssef } 5541556Srgrimes cpp = &cp->nclist.next; 555104202Stjr } 5561556Srgrimes *cpp = NULL; 557214709Sjilles checkkwd = CHKKWD | CHKALIAS; 5581556Srgrimes break; 5591556Srgrimes case TLP: 5601556Srgrimes n1 = (union node *)stalloc(sizeof (struct nredir)); 5611556Srgrimes n1->type = NSUBSHELL; 562214525Sjilles n1->nredir.n = list(0, 0); 5631556Srgrimes n1->nredir.redirect = NULL; 5641556Srgrimes if (readtoken() != TRP) 5651556Srgrimes synexpect(TRP); 566214709Sjilles checkkwd = CHKKWD | CHKALIAS; 567218325Sjilles is_subshell = 1; 5681556Srgrimes break; 5691556Srgrimes case TBEGIN: 570214525Sjilles n1 = list(0, 0); 
5711556Srgrimes if (readtoken() != TEND) 5721556Srgrimes synexpect(TEND); 573214709Sjilles checkkwd = CHKKWD | CHKALIAS; 5741556Srgrimes break; 5751556Srgrimes /* Handle an empty command like other simple commands. */ 576210221Sjilles case TBACKGND: 57717987Speter case TSEMI: 578101662Stjr case TAND: 579101662Stjr case TOR: 58017987Speter /* 58117987Speter * An empty command before a ; doesn't make much sense, and 58217987Speter * should certainly be disallowed in the case of `if ;'. 58317987Speter */ 58417987Speter if (!redir) 58517987Speter synexpect(-1); 5861556Srgrimes case TNL: 58710399Sjoerg case TEOF: 5881556Srgrimes case TWORD: 58917987Speter case TRP: 5901556Srgrimes tokpushback++; 59175160Sbrian n1 = simplecmd(rpp, redir); 592214281Sjilles return n1; 5931556Srgrimes default: 5941556Srgrimes synexpect(-1); 5951556Srgrimes } 5961556Srgrimes 5971556Srgrimes /* Now check for redirection which may follow command */ 5981556Srgrimes while (readtoken() == TREDIR) { 5991556Srgrimes *rpp = n2 = redirnode; 6001556Srgrimes rpp = &n2->nfile.next; 6011556Srgrimes parsefname(); 6021556Srgrimes } 6031556Srgrimes tokpushback++; 6041556Srgrimes *rpp = NULL; 6051556Srgrimes if (redir) { 606218325Sjilles if (!is_subshell) { 6071556Srgrimes n2 = (union node *)stalloc(sizeof (struct nredir)); 6081556Srgrimes n2->type = NREDIR; 6091556Srgrimes n2->nredir.n = n1; 6101556Srgrimes n1 = n2; 6111556Srgrimes } 6121556Srgrimes n1->nredir.redirect = redir; 6131556Srgrimes } 61475160Sbrian 615214281Sjilles return n1; 6161556Srgrimes} 6171556Srgrimes 6181556Srgrimes 619213811Sobrienstatic union node * 62090111Simpsimplecmd(union node **rpp, union node *redir) 62190111Simp{ 6221556Srgrimes union node *args, **app; 6231556Srgrimes union node **orig_rpp = rpp; 624210087Sjilles union node *n = NULL; 625214304Sjilles int special; 626222165Sjilles int savecheckkwd; 6271556Srgrimes 6281556Srgrimes /* If we don't have any redirections already, then we must reset */ 6291556Srgrimes /* rpp to be 
the address of the local redir variable. */ 6301556Srgrimes if (redir == 0) 6311556Srgrimes rpp = &redir; 6321556Srgrimes 6331556Srgrimes args = NULL; 6341556Srgrimes app = &args; 6358855Srgrimes /* 6361556Srgrimes * We save the incoming value, because we need this for shell 6371556Srgrimes * functions. There can not be a redirect or an argument between 6388855Srgrimes * the function name and the open parenthesis. 6391556Srgrimes */ 6401556Srgrimes orig_rpp = rpp; 6411556Srgrimes 642222165Sjilles savecheckkwd = CHKALIAS; 643222165Sjilles 6441556Srgrimes for (;;) { 645222165Sjilles checkkwd = savecheckkwd; 6461556Srgrimes if (readtoken() == TWORD) { 6471556Srgrimes n = (union node *)stalloc(sizeof (struct narg)); 6481556Srgrimes n->type = NARG; 6491556Srgrimes n->narg.text = wordtext; 6501556Srgrimes n->narg.backquote = backquotelist; 6511556Srgrimes *app = n; 6521556Srgrimes app = &n->narg.next; 653222165Sjilles if (savecheckkwd != 0 && !isassignment(wordtext)) 654222165Sjilles savecheckkwd = 0; 6551556Srgrimes } else if (lasttoken == TREDIR) { 6561556Srgrimes *rpp = n = redirnode; 6571556Srgrimes rpp = &n->nfile.next; 6581556Srgrimes parsefname(); /* read name of redirection file */ 6591556Srgrimes } else if (lasttoken == TLP && app == &args->narg.next 6601556Srgrimes && rpp == orig_rpp) { 6611556Srgrimes /* We have a function */ 6621556Srgrimes if (readtoken() != TRP) 6631556Srgrimes synexpect(TRP); 664179022Sstefanf funclinno = plinno; 665214291Sjilles /* 666214291Sjilles * - Require plain text. 667214291Sjilles * - Functions with '/' cannot be called. 668214534Sjilles * - Reject name=(). 669214534Sjilles * - Reject ksh extended glob patterns. 
670214291Sjilles */ 671214291Sjilles if (!noexpand(n->narg.text) || quoteflag || 672214534Sjilles strchr(n->narg.text, '/') || 673214534Sjilles strchr("!%*+-=?@}~", 674214534Sjilles n->narg.text[strlen(n->narg.text) - 1])) 6751556Srgrimes synerror("Bad function name"); 676214291Sjilles rmescapes(n->narg.text); 677214304Sjilles if (find_builtin(n->narg.text, &special) >= 0 && 678214304Sjilles special) 679214304Sjilles synerror("Cannot override a special builtin with a function"); 6801556Srgrimes n->type = NDEFUN; 6811556Srgrimes n->narg.next = command(); 682179022Sstefanf funclinno = 0; 683210087Sjilles return n; 6841556Srgrimes } else { 6851556Srgrimes tokpushback++; 6861556Srgrimes break; 6871556Srgrimes } 6881556Srgrimes } 6891556Srgrimes *app = NULL; 6901556Srgrimes *rpp = NULL; 6911556Srgrimes n = (union node *)stalloc(sizeof (struct ncmd)); 6921556Srgrimes n->type = NCMD; 6931556Srgrimes n->ncmd.args = args; 6941556Srgrimes n->ncmd.redirect = redir; 695210087Sjilles return n; 6961556Srgrimes} 6971556Srgrimes 698213811Sobrienstatic union node * 69990111Simpmakename(void) 70090111Simp{ 70117987Speter union node *n; 7021556Srgrimes 70317987Speter n = (union node *)stalloc(sizeof (struct narg)); 70417987Speter n->type = NARG; 70517987Speter n->narg.next = NULL; 70617987Speter n->narg.text = wordtext; 70717987Speter n->narg.backquote = backquotelist; 70817987Speter return n; 70917987Speter} 71017987Speter 711213760Sobrienvoid 712213760Sobrienfixredir(union node *n, const char *text, int err) 71390111Simp{ 71417987Speter TRACE(("Fix redir %s %d\n", text, err)); 71517987Speter if (!err) 71617987Speter n->ndup.vname = NULL; 71717987Speter 71817987Speter if (is_digit(text[0]) && text[1] == '\0') 71917987Speter n->ndup.dupfd = digit_val(text[0]); 72017987Speter else if (text[0] == '-' && text[1] == '\0') 72117987Speter n->ndup.dupfd = -1; 72217987Speter else { 72320425Ssteve 72417987Speter if (err) 72517987Speter synerror("Bad fd number"); 72617987Speter else 
72717987Speter n->ndup.vname = makename(); 72817987Speter } 72917987Speter} 73017987Speter 73117987Speter 732213811Sobrienstatic void 73390111Simpparsefname(void) 73490111Simp{ 7351556Srgrimes union node *n = redirnode; 7361556Srgrimes 7371556Srgrimes if (readtoken() != TWORD) 7381556Srgrimes synexpect(-1); 7391556Srgrimes if (n->type == NHERE) { 7401556Srgrimes struct heredoc *here = heredoc; 7411556Srgrimes struct heredoc *p; 7421556Srgrimes int i; 7431556Srgrimes 7441556Srgrimes if (quoteflag == 0) 7451556Srgrimes n->type = NXHERE; 7461556Srgrimes TRACE(("Here document %d\n", n->type)); 7471556Srgrimes if (here->striptabs) { 7481556Srgrimes while (*wordtext == '\t') 7491556Srgrimes wordtext++; 7501556Srgrimes } 7511556Srgrimes if (! noexpand(wordtext) || (i = strlen(wordtext)) == 0 || i > EOFMARKLEN) 7521556Srgrimes synerror("Illegal eof marker for << redirection"); 7531556Srgrimes rmescapes(wordtext); 7541556Srgrimes here->eofmark = wordtext; 7551556Srgrimes here->next = NULL; 7561556Srgrimes if (heredoclist == NULL) 7571556Srgrimes heredoclist = here; 7581556Srgrimes else { 7591556Srgrimes for (p = heredoclist ; p->next ; p = p->next); 7601556Srgrimes p->next = here; 7611556Srgrimes } 7621556Srgrimes } else if (n->type == NTOFD || n->type == NFROMFD) { 76317987Speter fixredir(n, wordtext, 0); 7641556Srgrimes } else { 76517987Speter n->nfile.fname = makename(); 7661556Srgrimes } 7671556Srgrimes} 7681556Srgrimes 7691556Srgrimes 7701556Srgrimes/* 7711556Srgrimes * Input any here documents. 
7721556Srgrimes */ 7731556Srgrimes 774213811Sobrienstatic void 77590111Simpparseheredoc(void) 77690111Simp{ 7771556Srgrimes struct heredoc *here; 7781556Srgrimes union node *n; 7791556Srgrimes 7801556Srgrimes while (heredoclist) { 7811556Srgrimes here = heredoclist; 7821556Srgrimes heredoclist = here->next; 7831556Srgrimes if (needprompt) { 7841556Srgrimes setprompt(2); 7851556Srgrimes needprompt = 0; 7861556Srgrimes } 7871556Srgrimes readtoken1(pgetc(), here->here->type == NHERE? SQSYNTAX : DQSYNTAX, 7881556Srgrimes here->eofmark, here->striptabs); 7891556Srgrimes n = (union node *)stalloc(sizeof (struct narg)); 7901556Srgrimes n->narg.type = NARG; 7911556Srgrimes n->narg.next = NULL; 7921556Srgrimes n->narg.text = wordtext; 7931556Srgrimes n->narg.backquote = backquotelist; 7941556Srgrimes here->here->nhere.doc = n; 7951556Srgrimes } 7961556Srgrimes} 7971556Srgrimes 798213811Sobrienstatic int 79990111Simppeektoken(void) 80090111Simp{ 8011556Srgrimes int t; 8021556Srgrimes 8031556Srgrimes t = readtoken(); 8041556Srgrimes tokpushback++; 8051556Srgrimes return (t); 8061556Srgrimes} 8071556Srgrimes 808213811Sobrienstatic int 80990111Simpreadtoken(void) 81090111Simp{ 8111556Srgrimes int t; 8121556Srgrimes struct alias *ap; 8131556Srgrimes#ifdef DEBUG 8141556Srgrimes int alreadyseen = tokpushback; 8151556Srgrimes#endif 8168855Srgrimes 8171556Srgrimes top: 8181556Srgrimes t = xxreadtoken(); 8191556Srgrimes 820214709Sjilles /* 821214709Sjilles * eat newlines 822214709Sjilles */ 823214709Sjilles if (checkkwd & CHKNL) { 824214709Sjilles while (t == TNL) { 825214709Sjilles parseheredoc(); 826214709Sjilles t = xxreadtoken(); 827214709Sjilles } 828214709Sjilles } 8291556Srgrimes 830214709Sjilles /* 831214709Sjilles * check for keywords and aliases 832214709Sjilles */ 833214709Sjilles if (t == TWORD && !quoteflag) 834214709Sjilles { 835214709Sjilles const char * const *pp; 836214709Sjilles 837214709Sjilles if (checkkwd & CHKKWD) 83898463Sjmallett for (pp = parsekwd; *pp; pp++) 
{ 83920425Ssteve if (**pp == *wordtext && equal(*pp, wordtext)) 84017987Speter { 8411556Srgrimes lasttoken = t = pp - parsekwd + KWDOFFSET; 8421556Srgrimes TRACE(("keyword %s recognized\n", tokname[t])); 8431556Srgrimes goto out; 8441556Srgrimes } 8451556Srgrimes } 846214709Sjilles if (checkkwd & CHKALIAS && 847214709Sjilles (ap = lookupalias(wordtext, 1)) != NULL) { 848214709Sjilles pushstring(ap->val, strlen(ap->val), ap); 849214709Sjilles goto top; 8501556Srgrimes } 851214709Sjilles } 8521556Srgrimesout: 853214709Sjilles if (t != TNOT) 854214709Sjilles checkkwd = 0; 855214709Sjilles 8561556Srgrimes#ifdef DEBUG 8571556Srgrimes if (!alreadyseen) 8581556Srgrimes TRACE(("token %s %s\n", tokname[t], t == TWORD ? wordtext : "")); 8591556Srgrimes else 8601556Srgrimes TRACE(("reread token %s %s\n", tokname[t], t == TWORD ? wordtext : "")); 8611556Srgrimes#endif 8621556Srgrimes return (t); 8631556Srgrimes} 8641556Srgrimes 8651556Srgrimes 8661556Srgrimes/* 8671556Srgrimes * Read the next input token. 8681556Srgrimes * If the token is a word, we set backquotelist to the list of cmds in 8691556Srgrimes * backquotes. We set quoteflag to true if any part of the word was 8701556Srgrimes * quoted. 8711556Srgrimes * If the token is TREDIR, then we set redirnode to a structure containing 8721556Srgrimes * the redirection. 8731556Srgrimes * In all cases, the variable startlinno is set to the number of the line 8741556Srgrimes * on which the token starts. 8751556Srgrimes * 8761556Srgrimes * [Change comment: here documents and internal procedures] 8771556Srgrimes * [Readtoken shouldn't have any arguments. Perhaps we should make the 8781556Srgrimes * word parsing code into a separate routine. In this case, readtoken 8791556Srgrimes * doesn't need to have any internal procedures, but parseword does. 8801556Srgrimes * We could also make parseoperator in essence the main routine, and 8811556Srgrimes * have parseword (readtoken1?) handle both words and redirection.] 
8821556Srgrimes */ 8831556Srgrimes 8841556Srgrimes#define RETURN(token) return lasttoken = token 8851556Srgrimes 886213811Sobrienstatic int 88790111Simpxxreadtoken(void) 88890111Simp{ 88925230Ssteve int c; 8901556Srgrimes 8911556Srgrimes if (tokpushback) { 8921556Srgrimes tokpushback = 0; 8931556Srgrimes return lasttoken; 8941556Srgrimes } 8951556Srgrimes if (needprompt) { 8961556Srgrimes setprompt(2); 8971556Srgrimes needprompt = 0; 8981556Srgrimes } 8991556Srgrimes startlinno = plinno; 9001556Srgrimes for (;;) { /* until token or start of word found */ 9011556Srgrimes c = pgetc_macro(); 9021556Srgrimes switch (c) { 9031556Srgrimes case ' ': case '\t': 9041556Srgrimes continue; 9051556Srgrimes case '#': 9061556Srgrimes while ((c = pgetc()) != '\n' && c != PEOF); 9071556Srgrimes pungetc(); 9081556Srgrimes continue; 9091556Srgrimes case '\\': 9101556Srgrimes if (pgetc() == '\n') { 9111556Srgrimes startlinno = ++plinno; 9121556Srgrimes if (doprompt) 9131556Srgrimes setprompt(2); 9141556Srgrimes else 9151556Srgrimes setprompt(0); 9161556Srgrimes continue; 9171556Srgrimes } 9181556Srgrimes pungetc(); 9191556Srgrimes goto breakloop; 9201556Srgrimes case '\n': 9211556Srgrimes plinno++; 9221556Srgrimes needprompt = doprompt; 9231556Srgrimes RETURN(TNL); 9241556Srgrimes case PEOF: 9251556Srgrimes RETURN(TEOF); 9261556Srgrimes case '&': 9271556Srgrimes if (pgetc() == '&') 9281556Srgrimes RETURN(TAND); 9291556Srgrimes pungetc(); 9301556Srgrimes RETURN(TBACKGND); 9311556Srgrimes case '|': 9321556Srgrimes if (pgetc() == '|') 9331556Srgrimes RETURN(TOR); 9341556Srgrimes pungetc(); 9351556Srgrimes RETURN(TPIPE); 9361556Srgrimes case ';': 937223186Sjilles c = pgetc(); 938223186Sjilles if (c == ';') 9391556Srgrimes RETURN(TENDCASE); 940223186Sjilles else if (c == '&') 941223186Sjilles RETURN(TFALLTHRU); 9421556Srgrimes pungetc(); 9431556Srgrimes RETURN(TSEMI); 9441556Srgrimes case '(': 9451556Srgrimes RETURN(TLP); 9461556Srgrimes case ')': 9471556Srgrimes RETURN(TRP); 
9481556Srgrimes default: 9491556Srgrimes goto breakloop; 9501556Srgrimes } 9511556Srgrimes } 9521556Srgrimesbreakloop: 9531556Srgrimes return readtoken1(c, BASESYNTAX, (char *)NULL, 0); 9541556Srgrimes#undef RETURN 9551556Srgrimes} 9561556Srgrimes 9571556Srgrimes 958213811Sobrien#define MAXNEST_static 8 959206145Sjillesstruct tokenstate 960206145Sjilles{ 961206145Sjilles const char *syntax; /* *SYNTAX */ 962206145Sjilles int parenlevel; /* levels of parentheses in arithmetic */ 963206145Sjilles enum tokenstate_category 964206145Sjilles { 965206145Sjilles TSTATE_TOP, 966206145Sjilles TSTATE_VAR_OLD, /* ${var+-=?}, inherits dquotes */ 967206145Sjilles TSTATE_VAR_NEW, /* other ${var...}, own dquote state */ 968206145Sjilles TSTATE_ARITH 969206145Sjilles } category; 970206145Sjilles}; 971206145Sjilles 972206145Sjilles 973205130Sjilles/* 974205130Sjilles * Called to parse command substitutions. 975205130Sjilles */ 9761556Srgrimes 977213811Sobrienstatic char * 978205130Sjillesparsebackq(char *out, struct nodelist **pbqlist, 979205130Sjilles int oldstyle, int dblquote, int quoted) 980205130Sjilles{ 981205130Sjilles struct nodelist **nlpp; 982205130Sjilles union node *n; 983205130Sjilles char *volatile str; 984205130Sjilles struct jmploc jmploc; 985205130Sjilles struct jmploc *const savehandler = handler; 986248980Sjilles size_t savelen; 987205130Sjilles int saveprompt; 988205130Sjilles const int bq_startlinno = plinno; 989205130Sjilles char *volatile ostr = NULL; 990205130Sjilles struct parsefile *const savetopfile = getcurrentfile(); 991208655Sjilles struct heredoc *const saveheredoclist = heredoclist; 992208655Sjilles struct heredoc *here; 993205130Sjilles 994205130Sjilles str = NULL; 995205130Sjilles if (setjmp(jmploc.loc)) { 996205130Sjilles popfilesupto(savetopfile); 997205130Sjilles if (str) 998205130Sjilles ckfree(str); 999205130Sjilles if (ostr) 1000205130Sjilles ckfree(ostr); 1001208655Sjilles heredoclist = saveheredoclist; 1002205130Sjilles handler = 
savehandler; 1003205130Sjilles if (exception == EXERROR) { 1004205130Sjilles startlinno = bq_startlinno; 1005205130Sjilles synerror("Error in command substitution"); 1006205130Sjilles } 1007205130Sjilles longjmp(handler->loc, 1); 1008205130Sjilles } 1009205130Sjilles INTOFF; 1010205130Sjilles savelen = out - stackblock(); 1011205130Sjilles if (savelen > 0) { 1012205130Sjilles str = ckmalloc(savelen); 1013205130Sjilles memcpy(str, stackblock(), savelen); 1014205130Sjilles } 1015205130Sjilles handler = &jmploc; 1016208655Sjilles heredoclist = NULL; 1017205130Sjilles INTON; 1018205130Sjilles if (oldstyle) { 1019205130Sjilles /* We must read until the closing backquote, giving special 1020205130Sjilles treatment to some slashes, and then push the string and 1021205130Sjilles reread it as input, interpreting it normally. */ 1022205130Sjilles char *oout; 1023205130Sjilles int c; 1024205130Sjilles int olen; 1025205130Sjilles 1026205130Sjilles 1027205130Sjilles STARTSTACKSTR(oout); 1028205130Sjilles for (;;) { 1029205130Sjilles if (needprompt) { 1030205130Sjilles setprompt(2); 1031205130Sjilles needprompt = 0; 1032205130Sjilles } 1033215783Sjilles CHECKSTRSPACE(2, oout); 1034205130Sjilles switch (c = pgetc()) { 1035205130Sjilles case '`': 1036205130Sjilles goto done; 1037205130Sjilles 1038205130Sjilles case '\\': 1039205130Sjilles if ((c = pgetc()) == '\n') { 1040205130Sjilles plinno++; 1041205130Sjilles if (doprompt) 1042205130Sjilles setprompt(2); 1043205130Sjilles else 1044205130Sjilles setprompt(0); 1045205130Sjilles /* 1046205130Sjilles * If eating a newline, avoid putting 1047205130Sjilles * the newline into the new character 1048215783Sjilles * stream (via the USTPUTC after the 1049205130Sjilles * switch). 
1050205130Sjilles */ 1051205130Sjilles continue; 1052205130Sjilles } 1053205130Sjilles if (c != '\\' && c != '`' && c != '$' 1054205130Sjilles && (!dblquote || c != '"')) 1055215783Sjilles USTPUTC('\\', oout); 1056205130Sjilles break; 1057205130Sjilles 1058205130Sjilles case '\n': 1059205130Sjilles plinno++; 1060205130Sjilles needprompt = doprompt; 1061205130Sjilles break; 1062205130Sjilles 1063205130Sjilles case PEOF: 1064205130Sjilles startlinno = plinno; 1065205130Sjilles synerror("EOF in backquote substitution"); 1066205130Sjilles break; 1067205130Sjilles 1068205130Sjilles default: 1069205130Sjilles break; 1070205130Sjilles } 1071215783Sjilles USTPUTC(c, oout); 1072205130Sjilles } 1073205130Sjillesdone: 1074215783Sjilles USTPUTC('\0', oout); 1075205130Sjilles olen = oout - stackblock(); 1076205130Sjilles INTOFF; 1077205130Sjilles ostr = ckmalloc(olen); 1078205130Sjilles memcpy(ostr, stackblock(), olen); 1079205130Sjilles setinputstring(ostr, 1); 1080205130Sjilles INTON; 1081205130Sjilles } 1082205130Sjilles nlpp = pbqlist; 1083205130Sjilles while (*nlpp) 1084205130Sjilles nlpp = &(*nlpp)->next; 1085205130Sjilles *nlpp = (struct nodelist *)stalloc(sizeof (struct nodelist)); 1086205130Sjilles (*nlpp)->next = NULL; 1087205130Sjilles 1088205130Sjilles if (oldstyle) { 1089205130Sjilles saveprompt = doprompt; 1090205130Sjilles doprompt = 0; 1091205130Sjilles } 1092205130Sjilles 1093214525Sjilles n = list(0, oldstyle); 1094205130Sjilles 1095205130Sjilles if (oldstyle) 1096205130Sjilles doprompt = saveprompt; 1097205130Sjilles else { 1098205130Sjilles if (readtoken() != TRP) 1099205130Sjilles synexpect(TRP); 1100205130Sjilles } 1101205130Sjilles 1102205130Sjilles (*nlpp)->n = n; 1103205130Sjilles if (oldstyle) { 1104205130Sjilles /* 1105205130Sjilles * Start reading from old file again, ignoring any pushed back 1106205130Sjilles * tokens left from the backquote parsing 1107205130Sjilles */ 1108205130Sjilles popfile(); 1109205130Sjilles tokpushback = 0; 
1110205130Sjilles } 1111205130Sjilles STARTSTACKSTR(out); 1112216706Sjilles CHECKSTRSPACE(savelen + 1, out); 1113208655Sjilles INTOFF; 1114205130Sjilles if (str) { 1115205130Sjilles memcpy(out, str, savelen); 1116205130Sjilles STADJUST(savelen, out); 1117205130Sjilles ckfree(str); 1118205130Sjilles str = NULL; 1119205130Sjilles } 1120205130Sjilles if (ostr) { 1121205130Sjilles ckfree(ostr); 1122205130Sjilles ostr = NULL; 1123205130Sjilles } 1124208655Sjilles here = saveheredoclist; 1125208655Sjilles if (here != NULL) { 1126208655Sjilles while (here->next != NULL) 1127208655Sjilles here = here->next; 1128208655Sjilles here->next = heredoclist; 1129208655Sjilles heredoclist = saveheredoclist; 1130208655Sjilles } 1131205130Sjilles handler = savehandler; 1132208655Sjilles INTON; 1133205130Sjilles if (quoted) 1134205130Sjilles USTPUTC(CTLBACKQ | CTLQUOTE, out); 1135205130Sjilles else 1136205130Sjilles USTPUTC(CTLBACKQ, out); 1137205130Sjilles return out; 1138205130Sjilles} 1139205130Sjilles 1140205130Sjilles 11411556Srgrimes/* 1142221513Sjilles * Called to parse a backslash escape sequence inside $'...'. 1143221513Sjilles * The backslash has already been read. 
1144221513Sjilles */ 1145221513Sjillesstatic char * 1146221513Sjillesreadcstyleesc(char *out) 1147221513Sjilles{ 1148221513Sjilles int c, v, i, n; 1149221513Sjilles 1150221513Sjilles c = pgetc(); 1151221513Sjilles switch (c) { 1152221513Sjilles case '\0': 1153221513Sjilles synerror("Unterminated quoted string"); 1154221513Sjilles case '\n': 1155221513Sjilles plinno++; 1156221513Sjilles if (doprompt) 1157221513Sjilles setprompt(2); 1158221513Sjilles else 1159221513Sjilles setprompt(0); 1160221513Sjilles return out; 1161221513Sjilles case '\\': 1162221513Sjilles case '\'': 1163221513Sjilles case '"': 1164221513Sjilles v = c; 1165221513Sjilles break; 1166221513Sjilles case 'a': v = '\a'; break; 1167221513Sjilles case 'b': v = '\b'; break; 1168221513Sjilles case 'e': v = '\033'; break; 1169221513Sjilles case 'f': v = '\f'; break; 1170221513Sjilles case 'n': v = '\n'; break; 1171221513Sjilles case 'r': v = '\r'; break; 1172221513Sjilles case 't': v = '\t'; break; 1173221513Sjilles case 'v': v = '\v'; break; 1174221513Sjilles case 'x': 1175221513Sjilles v = 0; 1176221513Sjilles for (;;) { 1177221513Sjilles c = pgetc(); 1178221513Sjilles if (c >= '0' && c <= '9') 1179221513Sjilles v = (v << 4) + c - '0'; 1180221513Sjilles else if (c >= 'A' && c <= 'F') 1181221513Sjilles v = (v << 4) + c - 'A' + 10; 1182221513Sjilles else if (c >= 'a' && c <= 'f') 1183221513Sjilles v = (v << 4) + c - 'a' + 10; 1184221513Sjilles else 1185221513Sjilles break; 1186221513Sjilles } 1187221513Sjilles pungetc(); 1188221513Sjilles break; 1189221513Sjilles case '0': case '1': case '2': case '3': 1190221513Sjilles case '4': case '5': case '6': case '7': 1191221513Sjilles v = c - '0'; 1192221513Sjilles c = pgetc(); 1193221513Sjilles if (c >= '0' && c <= '7') { 1194221513Sjilles v <<= 3; 1195221513Sjilles v += c - '0'; 1196221513Sjilles c = pgetc(); 1197221513Sjilles if (c >= '0' && c <= '7') { 1198221513Sjilles v <<= 3; 1199221513Sjilles v += c - '0'; 1200221513Sjilles } else 1201221513Sjilles 
pungetc(); 1202221513Sjilles } else 1203221513Sjilles pungetc(); 1204221513Sjilles break; 1205221513Sjilles case 'c': 1206221513Sjilles c = pgetc(); 1207221513Sjilles if (c < 0x3f || c > 0x7a || c == 0x60) 1208221513Sjilles synerror("Bad escape sequence"); 1209221513Sjilles if (c == '\\' && pgetc() != '\\') 1210221513Sjilles synerror("Bad escape sequence"); 1211221513Sjilles if (c == '?') 1212221513Sjilles v = 127; 1213221513Sjilles else 1214221513Sjilles v = c & 0x1f; 1215221513Sjilles break; 1216221513Sjilles case 'u': 1217221513Sjilles case 'U': 1218221513Sjilles n = c == 'U' ? 8 : 4; 1219221513Sjilles v = 0; 1220221513Sjilles for (i = 0; i < n; i++) { 1221221513Sjilles c = pgetc(); 1222221513Sjilles if (c >= '0' && c <= '9') 1223221513Sjilles v = (v << 4) + c - '0'; 1224221513Sjilles else if (c >= 'A' && c <= 'F') 1225221513Sjilles v = (v << 4) + c - 'A' + 10; 1226221513Sjilles else if (c >= 'a' && c <= 'f') 1227221513Sjilles v = (v << 4) + c - 'a' + 10; 1228221513Sjilles else 1229221513Sjilles synerror("Bad escape sequence"); 1230221513Sjilles } 1231221513Sjilles if (v == 0 || (v >= 0xd800 && v <= 0xdfff)) 1232221513Sjilles synerror("Bad escape sequence"); 1233221513Sjilles /* We really need iconv here. */ 1234221669Sjilles if (initial_localeisutf8 && v > 127) { 1235221669Sjilles CHECKSTRSPACE(4, out); 1236221669Sjilles /* 1237221669Sjilles * We cannot use wctomb() as the locale may have 1238221669Sjilles * changed. 
1239221669Sjilles */ 1240221669Sjilles if (v <= 0x7ff) { 1241221669Sjilles USTPUTC(0xc0 | v >> 6, out); 1242221669Sjilles USTPUTC(0x80 | (v & 0x3f), out); 1243221669Sjilles return out; 1244221669Sjilles } else if (v <= 0xffff) { 1245221669Sjilles USTPUTC(0xe0 | v >> 12, out); 1246221669Sjilles USTPUTC(0x80 | ((v >> 6) & 0x3f), out); 1247221669Sjilles USTPUTC(0x80 | (v & 0x3f), out); 1248221669Sjilles return out; 1249221669Sjilles } else if (v <= 0x10ffff) { 1250221669Sjilles USTPUTC(0xf0 | v >> 18, out); 1251221669Sjilles USTPUTC(0x80 | ((v >> 12) & 0x3f), out); 1252221669Sjilles USTPUTC(0x80 | ((v >> 6) & 0x3f), out); 1253221669Sjilles USTPUTC(0x80 | (v & 0x3f), out); 1254221669Sjilles return out; 1255221669Sjilles } 1256221669Sjilles } 1257221513Sjilles if (v > 127) 1258221513Sjilles v = '?'; 1259221513Sjilles break; 1260221513Sjilles default: 1261221513Sjilles synerror("Bad escape sequence"); 1262221513Sjilles } 1263221513Sjilles v = (char)v; 1264221513Sjilles /* 1265221513Sjilles * We can't handle NUL bytes. 1266221513Sjilles * POSIX says we should skip till the closing quote. 1267221513Sjilles */ 1268221513Sjilles if (v == '\0') { 1269221513Sjilles while ((c = pgetc()) != '\'') { 1270221513Sjilles if (c == '\\') 1271221513Sjilles c = pgetc(); 1272221513Sjilles if (c == PEOF) 1273221513Sjilles synerror("Unterminated quoted string"); 1274221513Sjilles } 1275221513Sjilles pungetc(); 1276221513Sjilles return out; 1277221513Sjilles } 1278221513Sjilles if (SQSYNTAX[v] == CCTL) 1279221513Sjilles USTPUTC(CTLESC, out); 1280221513Sjilles USTPUTC(v, out); 1281221513Sjilles return out; 1282221513Sjilles} 1283221513Sjilles 1284221513Sjilles 1285221513Sjilles/* 12861556Srgrimes * If eofmark is NULL, read a word or a redirection symbol. If eofmark 12871556Srgrimes * is not NULL, read a here document. 
In the latter case, eofmark is the 12881556Srgrimes * word which marks the end of the document and striptabs is true if 12891556Srgrimes * leading tabs should be stripped from the document. The argument firstc 12901556Srgrimes * is the first character of the input token or document. 12911556Srgrimes * 12921556Srgrimes * Because C does not have internal subroutines, I have simulated them 12931556Srgrimes * using goto's to implement the subroutine linkage. The following macros 12941556Srgrimes * will run code that appears at the end of readtoken1. 12951556Srgrimes */ 12961556Srgrimes 12971556Srgrimes#define CHECKEND() {goto checkend; checkend_return:;} 12981556Srgrimes#define PARSEREDIR() {goto parseredir; parseredir_return:;} 12991556Srgrimes#define PARSESUB() {goto parsesub; parsesub_return:;} 13001556Srgrimes#define PARSEARITH() {goto parsearith; parsearith_return:;} 13011556Srgrimes 1302213811Sobrienstatic int 1303248980Sjillesreadtoken1(int firstc, char const *initialsyntax, const char *eofmark, 1304248980Sjilles int striptabs) 130590111Simp{ 130617987Speter int c = firstc; 130717987Speter char *out; 13081556Srgrimes int len; 13091556Srgrimes char line[EOFMARKLEN + 1]; 13101556Srgrimes struct nodelist *bqlist; 13111556Srgrimes int quotef; 1312206145Sjilles int newvarnest; 1313206145Sjilles int level; 131454679Scracauer int synentry; 1315213811Sobrien struct tokenstate state_static[MAXNEST_static]; 1316213811Sobrien int maxnest = MAXNEST_static; 1317206145Sjilles struct tokenstate *state = state_static; 1318221513Sjilles int sqiscstyle = 0; 13191556Srgrimes 13201556Srgrimes startlinno = plinno; 13211556Srgrimes quotef = 0; 13221556Srgrimes bqlist = NULL; 1323206145Sjilles newvarnest = 0; 1324206145Sjilles level = 0; 1325206145Sjilles state[level].syntax = initialsyntax; 1326206145Sjilles state[level].parenlevel = 0; 1327206145Sjilles state[level].category = TSTATE_TOP; 13281556Srgrimes 13291556Srgrimes STARTSTACKSTR(out); 13301556Srgrimes loop: { /* for each 
line, until end of word */ 13311556Srgrimes CHECKEND(); /* set c to PEOF if at end of here document */ 13321556Srgrimes for (;;) { /* until end of line or end of word */ 1333214512Sjilles CHECKSTRSPACE(4, out); /* permit 4 calls to USTPUTC */ 133454679Scracauer 1335206145Sjilles synentry = state[level].syntax[c]; 133654679Scracauer 133754679Scracauer switch(synentry) { 13381556Srgrimes case CNL: /* '\n' */ 1339206145Sjilles if (state[level].syntax == BASESYNTAX) 13401556Srgrimes goto endword; /* exit outer loop */ 13411556Srgrimes USTPUTC(c, out); 13421556Srgrimes plinno++; 13431556Srgrimes if (doprompt) 13441556Srgrimes setprompt(2); 13451556Srgrimes else 13461556Srgrimes setprompt(0); 13471556Srgrimes c = pgetc(); 13481556Srgrimes goto loop; /* continue outer loop */ 1349221513Sjilles case CSBACK: 1350221513Sjilles if (sqiscstyle) { 1351221513Sjilles out = readcstyleesc(out); 1352221513Sjilles break; 1353221513Sjilles } 1354221513Sjilles /* FALLTHROUGH */ 13551556Srgrimes case CWORD: 13561556Srgrimes USTPUTC(c, out); 13571556Srgrimes break; 13581556Srgrimes case CCTL: 1359206145Sjilles if (eofmark == NULL || initialsyntax != SQSYNTAX) 13601556Srgrimes USTPUTC(CTLESC, out); 13611556Srgrimes USTPUTC(c, out); 13621556Srgrimes break; 13631556Srgrimes case CBACK: /* backslash */ 13641556Srgrimes c = pgetc(); 13651556Srgrimes if (c == PEOF) { 13661556Srgrimes USTPUTC('\\', out); 13671556Srgrimes pungetc(); 13681556Srgrimes } else if (c == '\n') { 1369160849Syar plinno++; 13701556Srgrimes if (doprompt) 13711556Srgrimes setprompt(2); 13721556Srgrimes else 13731556Srgrimes setprompt(0); 13741556Srgrimes } else { 1375206145Sjilles if (state[level].syntax == DQSYNTAX && 1376206145Sjilles c != '\\' && c != '`' && c != '$' && 1377206145Sjilles (c != '"' || (eofmark != NULL && 1378206145Sjilles newvarnest == 0)) && 1379206145Sjilles (c != '}' || state[level].category != TSTATE_VAR_OLD)) 13801556Srgrimes USTPUTC('\\', out); 1381214512Sjilles if ((eofmark == NULL || 
1382214512Sjilles newvarnest > 0) && 1383214512Sjilles state[level].syntax == BASESYNTAX) 1384214512Sjilles USTPUTC(CTLQUOTEMARK, out); 138583675Stegge if (SQSYNTAX[c] == CCTL) 13861556Srgrimes USTPUTC(CTLESC, out); 13871556Srgrimes USTPUTC(c, out); 1388214512Sjilles if ((eofmark == NULL || 1389214512Sjilles newvarnest > 0) && 1390214512Sjilles state[level].syntax == BASESYNTAX && 1391214512Sjilles state[level].category == TSTATE_VAR_OLD) 1392214512Sjilles USTPUTC(CTLQUOTEEND, out); 13931556Srgrimes quotef++; 13941556Srgrimes } 13951556Srgrimes break; 13961556Srgrimes case CSQUOTE: 1397206145Sjilles USTPUTC(CTLQUOTEMARK, out); 1398206145Sjilles state[level].syntax = SQSYNTAX; 1399221513Sjilles sqiscstyle = 0; 14001556Srgrimes break; 14011556Srgrimes case CDQUOTE: 1402206145Sjilles USTPUTC(CTLQUOTEMARK, out); 1403206145Sjilles state[level].syntax = DQSYNTAX; 14041556Srgrimes break; 14051556Srgrimes case CENDQUOTE: 1406206145Sjilles if (eofmark != NULL && newvarnest == 0) 14071556Srgrimes USTPUTC(c, out); 1408206145Sjilles else { 1409214512Sjilles if (state[level].category == TSTATE_VAR_OLD) 1410214512Sjilles USTPUTC(CTLQUOTEEND, out); 1411214305Sjilles state[level].syntax = BASESYNTAX; 14121556Srgrimes quotef++; 14131556Srgrimes } 14141556Srgrimes break; 14151556Srgrimes case CVAR: /* '$' */ 14161556Srgrimes PARSESUB(); /* parse substitution */ 14171556Srgrimes break; 14181556Srgrimes case CENDVAR: /* '}' */ 1419206145Sjilles if (level > 0 && 1420214492Sjilles ((state[level].category == TSTATE_VAR_OLD && 1421214492Sjilles state[level].syntax == 1422214492Sjilles state[level - 1].syntax) || 1423214490Sjilles (state[level].category == TSTATE_VAR_NEW && 1424214490Sjilles state[level].syntax == BASESYNTAX))) { 1425214492Sjilles if (state[level].category == TSTATE_VAR_NEW) 1426206145Sjilles newvarnest--; 1427206145Sjilles level--; 14281556Srgrimes USTPUTC(CTLENDVAR, out); 14291556Srgrimes } else { 14301556Srgrimes USTPUTC(c, out); 14311556Srgrimes } 14321556Srgrimes 
break; 14331556Srgrimes case CLP: /* '(' in arithmetic */ 1434206145Sjilles state[level].parenlevel++; 14351556Srgrimes USTPUTC(c, out); 14361556Srgrimes break; 14371556Srgrimes case CRP: /* ')' in arithmetic */ 1438206145Sjilles if (state[level].parenlevel > 0) { 14391556Srgrimes USTPUTC(c, out); 1440206145Sjilles --state[level].parenlevel; 14411556Srgrimes } else { 14421556Srgrimes if (pgetc() == ')') { 1443206145Sjilles if (level > 0 && 1444206145Sjilles state[level].category == TSTATE_ARITH) { 1445206145Sjilles level--; 14461556Srgrimes USTPUTC(CTLENDARI, out); 14471556Srgrimes } else 14481556Srgrimes USTPUTC(')', out); 14491556Srgrimes } else { 14508855Srgrimes /* 14511556Srgrimes * unbalanced parens 14521556Srgrimes * (don't 2nd guess - no error) 14531556Srgrimes */ 14541556Srgrimes pungetc(); 14551556Srgrimes USTPUTC(')', out); 14561556Srgrimes } 14571556Srgrimes } 14581556Srgrimes break; 14591556Srgrimes case CBQUOTE: /* '`' */ 1460206145Sjilles out = parsebackq(out, &bqlist, 1, 1461206145Sjilles state[level].syntax == DQSYNTAX && 1462206145Sjilles (eofmark == NULL || newvarnest > 0), 1463206145Sjilles state[level].syntax == DQSYNTAX || state[level].syntax == ARISYNTAX); 14641556Srgrimes break; 14651556Srgrimes case CEOF: 14661556Srgrimes goto endword; /* exit outer loop */ 1467214305Sjilles case CIGN: 1468214305Sjilles break; 14691556Srgrimes default: 1470206145Sjilles if (level == 0) 14711556Srgrimes goto endword; /* exit outer loop */ 14721556Srgrimes USTPUTC(c, out); 14731556Srgrimes } 14741556Srgrimes c = pgetc_macro(); 14751556Srgrimes } 14761556Srgrimes } 14771556Srgrimesendword: 1478206145Sjilles if (state[level].syntax == ARISYNTAX) 14791556Srgrimes synerror("Missing '))'"); 1480206145Sjilles if (state[level].syntax != BASESYNTAX && eofmark == NULL) 14811556Srgrimes synerror("Unterminated quoted string"); 1482206145Sjilles if (state[level].category == TSTATE_VAR_OLD || 1483206145Sjilles state[level].category == TSTATE_VAR_NEW) { 14841556Srgrimes 
startlinno = plinno; 14851556Srgrimes synerror("Missing '}'"); 14861556Srgrimes } 1487206145Sjilles if (state != state_static) 1488206145Sjilles parser_temp_free_upto(state); 14891556Srgrimes USTPUTC('\0', out); 14901556Srgrimes len = out - stackblock(); 14911556Srgrimes out = stackblock(); 14921556Srgrimes if (eofmark == NULL) { 14931556Srgrimes if ((c == '>' || c == '<') 14941556Srgrimes && quotef == 0 14951556Srgrimes && len <= 2 14961556Srgrimes && (*out == '\0' || is_digit(*out))) { 14971556Srgrimes PARSEREDIR(); 14981556Srgrimes return lasttoken = TREDIR; 14991556Srgrimes } else { 15001556Srgrimes pungetc(); 15011556Srgrimes } 15021556Srgrimes } 15031556Srgrimes quoteflag = quotef; 15041556Srgrimes backquotelist = bqlist; 15051556Srgrimes grabstackblock(len); 15061556Srgrimes wordtext = out; 15071556Srgrimes return lasttoken = TWORD; 15081556Srgrimes/* end of readtoken routine */ 15091556Srgrimes 15101556Srgrimes 15111556Srgrimes/* 15121556Srgrimes * Check to see whether we are at the end of the here document. When this 15131556Srgrimes * is called, c is set to the first character of the next input line. If 15141556Srgrimes * we are at the end of the here document, this routine sets the c to PEOF. 
15151556Srgrimes */ 15161556Srgrimes 15171556Srgrimescheckend: { 15181556Srgrimes if (eofmark) { 15191556Srgrimes if (striptabs) { 15201556Srgrimes while (c == '\t') 15211556Srgrimes c = pgetc(); 15221556Srgrimes } 15231556Srgrimes if (c == *eofmark) { 15241556Srgrimes if (pfgets(line, sizeof line) != NULL) { 1525248980Sjilles const char *p, *q; 15261556Srgrimes 15271556Srgrimes p = line; 15281556Srgrimes for (q = eofmark + 1 ; *q && *p == *q ; p++, q++); 1529222134Sjilles if ((*p == '\0' || *p == '\n') && *q == '\0') { 15301556Srgrimes c = PEOF; 1531222134Sjilles if (*p == '\n') { 1532222134Sjilles plinno++; 1533222134Sjilles needprompt = doprompt; 1534222134Sjilles } 15351556Srgrimes } else { 15361556Srgrimes pushstring(line, strlen(line), NULL); 15371556Srgrimes } 15381556Srgrimes } 15391556Srgrimes } 15401556Srgrimes } 15411556Srgrimes goto checkend_return; 15421556Srgrimes} 15431556Srgrimes 15441556Srgrimes 15451556Srgrimes/* 15461556Srgrimes * Parse a redirection operator. The variable "out" points to a string 15471556Srgrimes * specifying the fd to be redirected. The variable "c" contains the 15481556Srgrimes * first character of the redirection operator. 
15491556Srgrimes */ 15501556Srgrimes 15511556Srgrimesparseredir: { 15521556Srgrimes char fd = *out; 15531556Srgrimes union node *np; 15541556Srgrimes 15551556Srgrimes np = (union node *)stalloc(sizeof (struct nfile)); 15561556Srgrimes if (c == '>') { 15571556Srgrimes np->nfile.fd = 1; 15581556Srgrimes c = pgetc(); 15591556Srgrimes if (c == '>') 15601556Srgrimes np->type = NAPPEND; 15611556Srgrimes else if (c == '&') 15621556Srgrimes np->type = NTOFD; 156396922Stjr else if (c == '|') 156496922Stjr np->type = NCLOBBER; 15651556Srgrimes else { 15661556Srgrimes np->type = NTO; 15671556Srgrimes pungetc(); 15681556Srgrimes } 15691556Srgrimes } else { /* c == '<' */ 15701556Srgrimes np->nfile.fd = 0; 15711556Srgrimes c = pgetc(); 15721556Srgrimes if (c == '<') { 15731556Srgrimes if (sizeof (struct nfile) != sizeof (struct nhere)) { 15741556Srgrimes np = (union node *)stalloc(sizeof (struct nhere)); 15751556Srgrimes np->nfile.fd = 0; 15761556Srgrimes } 15771556Srgrimes np->type = NHERE; 15781556Srgrimes heredoc = (struct heredoc *)stalloc(sizeof (struct heredoc)); 15791556Srgrimes heredoc->here = np; 15801556Srgrimes if ((c = pgetc()) == '-') { 15811556Srgrimes heredoc->striptabs = 1; 15821556Srgrimes } else { 15831556Srgrimes heredoc->striptabs = 0; 15841556Srgrimes pungetc(); 15851556Srgrimes } 15861556Srgrimes } else if (c == '&') 15871556Srgrimes np->type = NFROMFD; 158866612Sbrian else if (c == '>') 158966612Sbrian np->type = NFROMTO; 15901556Srgrimes else { 15911556Srgrimes np->type = NFROM; 15921556Srgrimes pungetc(); 15931556Srgrimes } 15941556Srgrimes } 15951556Srgrimes if (fd != '\0') 15961556Srgrimes np->nfile.fd = digit_val(fd); 15971556Srgrimes redirnode = np; 15981556Srgrimes goto parseredir_return; 15991556Srgrimes} 16001556Srgrimes 16011556Srgrimes 16021556Srgrimes/* 16031556Srgrimes * Parse a substitution. At this point, we have read the dollar sign 16041556Srgrimes * and nothing else. 
16051556Srgrimes */ 16061556Srgrimes 16071556Srgrimesparsesub: { 1608179022Sstefanf char buf[10]; 16091556Srgrimes int subtype; 16101556Srgrimes int typeloc; 16111556Srgrimes int flags; 16121556Srgrimes char *p; 16131556Srgrimes static const char types[] = "}-+?="; 1614179022Sstefanf int bracketed_name = 0; /* used to handle ${[0-9]*} variables */ 1615179022Sstefanf int linno; 1616179387Sstefanf int length; 1617219623Sjilles int c1; 16181556Srgrimes 16191556Srgrimes c = pgetc(); 1620221513Sjilles if (c == '(') { /* $(command) or $((arith)) */ 16211556Srgrimes if (pgetc() == '(') { 16221556Srgrimes PARSEARITH(); 16231556Srgrimes } else { 16241556Srgrimes pungetc(); 1625206145Sjilles out = parsebackq(out, &bqlist, 0, 1626206145Sjilles state[level].syntax == DQSYNTAX && 1627206145Sjilles (eofmark == NULL || newvarnest > 0), 1628206145Sjilles state[level].syntax == DQSYNTAX || 1629206145Sjilles state[level].syntax == ARISYNTAX); 16301556Srgrimes } 1631221513Sjilles } else if (c == '{' || is_name(c) || is_special(c)) { 16321556Srgrimes USTPUTC(CTLVAR, out); 16331556Srgrimes typeloc = out - stackblock(); 16341556Srgrimes USTPUTC(VSNORMAL, out); 16351556Srgrimes subtype = VSNORMAL; 1636179022Sstefanf flags = 0; 16371556Srgrimes if (c == '{') { 163818202Speter bracketed_name = 1; 16391556Srgrimes c = pgetc(); 1640219623Sjilles subtype = 0; 16411556Srgrimes } 1642219623Sjillesvarname: 1643149026Sstefanf if (!is_eof(c) && is_name(c)) { 1644179387Sstefanf length = 0; 16451556Srgrimes do { 16461556Srgrimes STPUTC(c, out); 16471556Srgrimes c = pgetc(); 1648179387Sstefanf length++; 1649149026Sstefanf } while (!is_eof(c) && is_in_name(c)); 1650179387Sstefanf if (length == 6 && 1651179387Sstefanf strncmp(out - length, "LINENO", length) == 0) { 1652179022Sstefanf /* Replace the variable name with the 1653179022Sstefanf * current line number. 
*/ 1654179022Sstefanf linno = plinno; 1655179022Sstefanf if (funclinno != 0) 1656179022Sstefanf linno -= funclinno - 1; 1657179022Sstefanf snprintf(buf, sizeof(buf), "%d", linno); 1658179022Sstefanf STADJUST(-6, out); 1659215783Sjilles STPUTS(buf, out); 1660179022Sstefanf flags |= VSLINENO; 1661179022Sstefanf } 166218202Speter } else if (is_digit(c)) { 166318202Speter if (bracketed_name) { 166418202Speter do { 166518202Speter STPUTC(c, out); 166618202Speter c = pgetc(); 166718202Speter } while (is_digit(c)); 166818202Speter } else { 166918202Speter STPUTC(c, out); 167018202Speter c = pgetc(); 167118202Speter } 1672219623Sjilles } else if (is_special(c)) { 1673219623Sjilles c1 = c; 1674219623Sjilles c = pgetc(); 1675219623Sjilles if (subtype == 0 && c1 == '#') { 1676219623Sjilles subtype = VSLENGTH; 1677219623Sjilles if (strchr(types, c) == NULL && c != ':' && 1678219623Sjilles c != '#' && c != '%') 1679219623Sjilles goto varname; 1680219623Sjilles c1 = c; 1681219623Sjilles c = pgetc(); 1682219623Sjilles if (c1 != '}' && c == '}') { 1683219623Sjilles pungetc(); 1684219623Sjilles c = c1; 1685219623Sjilles goto varname; 1686219623Sjilles } 1687219623Sjilles pungetc(); 1688219623Sjilles c = c1; 1689219623Sjilles c1 = '#'; 1690219623Sjilles subtype = 0; 1691219623Sjilles } 1692219623Sjilles USTPUTC(c1, out); 16931556Srgrimes } else { 1694219623Sjilles subtype = VSERROR; 1695219623Sjilles if (c == '}') 1696219623Sjilles pungetc(); 1697219623Sjilles else if (c == '\n' || c == PEOF) 1698219623Sjilles synerror("Unexpected end of line in substitution"); 1699219623Sjilles else 1700164003Sstefanf USTPUTC(c, out); 17011556Srgrimes } 17021556Srgrimes if (subtype == 0) { 170317987Speter switch (c) { 170417987Speter case ':': 1705179022Sstefanf flags |= VSNUL; 17061556Srgrimes c = pgetc(); 170717987Speter /*FALLTHROUGH*/ 170817987Speter default: 170917987Speter p = strchr(types, c); 1710164003Sstefanf if (p == NULL) { 1711206144Sjilles if (c == '\n' || c == PEOF) 1712206144Sjilles 
synerror("Unexpected end of line in substitution"); 1713164003Sstefanf if (flags == VSNUL) 1714164003Sstefanf STPUTC(':', out); 1715164003Sstefanf STPUTC(c, out); 1716164003Sstefanf subtype = VSERROR; 1717164003Sstefanf } else 1718164003Sstefanf subtype = p - types + VSNORMAL; 171917987Speter break; 172017987Speter case '%': 172120425Ssteve case '#': 172217987Speter { 172317987Speter int cc = c; 172417987Speter subtype = c == '#' ? VSTRIMLEFT : 172517987Speter VSTRIMRIGHT; 172617987Speter c = pgetc(); 172717987Speter if (c == cc) 172817987Speter subtype++; 172917987Speter else 173017987Speter pungetc(); 173117987Speter break; 173217987Speter } 17331556Srgrimes } 1734164003Sstefanf } else if (subtype != VSERROR) { 1735221461Sjilles if (subtype == VSLENGTH && c != '}') 1736221461Sjilles subtype = VSERROR; 17371556Srgrimes pungetc(); 17381556Srgrimes } 1739164003Sstefanf STPUTC('=', out); 1740220903Sjilles if (state[level].syntax == DQSYNTAX || 1741220903Sjilles state[level].syntax == ARISYNTAX) 17421556Srgrimes flags |= VSQUOTE; 17431556Srgrimes *(stackblock() + typeloc) = subtype | flags; 1744206145Sjilles if (subtype != VSNORMAL) { 1745206145Sjilles if (level + 1 >= maxnest) { 1746206145Sjilles maxnest *= 2; 1747206145Sjilles if (state == state_static) { 1748206145Sjilles state = parser_temp_alloc( 1749206145Sjilles maxnest * sizeof(*state)); 1750206145Sjilles memcpy(state, state_static, 1751213811Sobrien MAXNEST_static * sizeof(*state)); 1752206145Sjilles } else 1753206145Sjilles state = parser_temp_realloc(state, 1754206145Sjilles maxnest * sizeof(*state)); 1755206145Sjilles } 1756206145Sjilles level++; 1757206145Sjilles state[level].parenlevel = 0; 1758206145Sjilles if (subtype == VSMINUS || subtype == VSPLUS || 1759206145Sjilles subtype == VSQUESTION || subtype == VSASSIGN) { 1760206145Sjilles /* 1761206145Sjilles * For operators that were in the Bourne shell, 1762206145Sjilles * inherit the double-quote state. 
1763206145Sjilles */ 1764206145Sjilles state[level].syntax = state[level - 1].syntax; 1765206145Sjilles state[level].category = TSTATE_VAR_OLD; 1766206145Sjilles } else { 1767206145Sjilles /* 1768206145Sjilles * The other operators take a pattern, 1769206145Sjilles * so go to BASESYNTAX. 1770206145Sjilles * Also, ' and " are now special, even 1771206145Sjilles * in here documents. 1772206145Sjilles */ 1773206145Sjilles state[level].syntax = BASESYNTAX; 1774206145Sjilles state[level].category = TSTATE_VAR_NEW; 1775206145Sjilles newvarnest++; 1776206145Sjilles } 1777206145Sjilles } 1778221513Sjilles } else if (c == '\'' && state[level].syntax == BASESYNTAX) { 1779221513Sjilles /* $'cstylequotes' */ 1780221513Sjilles USTPUTC(CTLQUOTEMARK, out); 1781221513Sjilles state[level].syntax = SQSYNTAX; 1782221513Sjilles sqiscstyle = 1; 1783221513Sjilles } else { 1784221513Sjilles USTPUTC('$', out); 1785221513Sjilles pungetc(); 17861556Srgrimes } 17871556Srgrimes goto parsesub_return; 17881556Srgrimes} 17891556Srgrimes 17901556Srgrimes 17911556Srgrimes/* 17921556Srgrimes * Parse an arithmetic expansion (indicate start of one and set state) 17931556Srgrimes */ 17941556Srgrimesparsearith: { 17951556Srgrimes 1796206145Sjilles if (level + 1 >= maxnest) { 1797206145Sjilles maxnest *= 2; 1798206145Sjilles if (state == state_static) { 1799206145Sjilles state = parser_temp_alloc( 1800206145Sjilles maxnest * sizeof(*state)); 1801206145Sjilles memcpy(state, state_static, 1802213811Sobrien MAXNEST_static * sizeof(*state)); 1803206145Sjilles } else 1804206145Sjilles state = parser_temp_realloc(state, 1805206145Sjilles maxnest * sizeof(*state)); 18061556Srgrimes } 1807206145Sjilles level++; 1808206145Sjilles state[level].syntax = ARISYNTAX; 1809206145Sjilles state[level].parenlevel = 0; 1810206145Sjilles state[level].category = TSTATE_ARITH; 1811206145Sjilles USTPUTC(CTLARI, out); 1812206145Sjilles if (state[level - 1].syntax == DQSYNTAX) 1813206145Sjilles USTPUTC('"',out); 
1814206145Sjilles else 1815206145Sjilles USTPUTC(' ',out); 18161556Srgrimes goto parsearith_return; 18171556Srgrimes} 18181556Srgrimes 18191556Srgrimes} /* end of readtoken */ 18201556Srgrimes 18211556Srgrimes 1822253650Sjillesvoid 1823253650Sjillesresetparser(void) 1824253650Sjilles{ 18251556Srgrimes tokpushback = 0; 18261556Srgrimes checkkwd = 0; 18271556Srgrimes} 18281556Srgrimes 1829253650Sjilles 18301556Srgrimes/* 18311556Srgrimes * Returns true if the text contains nothing to expand (no dollar signs 18321556Srgrimes * or backquotes). 18331556Srgrimes */ 18341556Srgrimes 1835213811Sobrienstatic int 183690111Simpnoexpand(char *text) 183790111Simp{ 183825230Ssteve char *p; 183925230Ssteve char c; 18401556Srgrimes 18411556Srgrimes p = text; 18421556Srgrimes while ((c = *p++) != '\0') { 184339137Stegge if ( c == CTLQUOTEMARK) 184439137Stegge continue; 18451556Srgrimes if (c == CTLESC) 18461556Srgrimes p++; 184783675Stegge else if (BASESYNTAX[(int)c] == CCTL) 18481556Srgrimes return 0; 18491556Srgrimes } 18501556Srgrimes return 1; 18511556Srgrimes} 18521556Srgrimes 18531556Srgrimes 18541556Srgrimes/* 18551556Srgrimes * Return true if the argument is a legal variable name (a letter or 18561556Srgrimes * underscore followed by zero or more letters, underscores, and digits). 18571556Srgrimes */ 18581556Srgrimes 18591556Srgrimesint 1860200956Sjillesgoodname(const char *name) 186190111Simp{ 1862200956Sjilles const char *p; 18631556Srgrimes 18641556Srgrimes p = name; 18651556Srgrimes if (! is_name(*p)) 18661556Srgrimes return 0; 18671556Srgrimes while (*++p) { 18681556Srgrimes if (! 
is_in_name(*p)) 18691556Srgrimes return 0; 18701556Srgrimes } 18711556Srgrimes return 1; 18721556Srgrimes} 18731556Srgrimes 18741556Srgrimes 1875222165Sjillesint 1876222165Sjillesisassignment(const char *p) 1877222165Sjilles{ 1878222165Sjilles if (!is_name(*p)) 1879222165Sjilles return 0; 1880222165Sjilles p++; 1881222165Sjilles for (;;) { 1882222165Sjilles if (*p == '=') 1883222165Sjilles return 1; 1884222165Sjilles else if (!is_in_name(*p)) 1885222165Sjilles return 0; 1886222165Sjilles p++; 1887222165Sjilles } 1888222165Sjilles} 1889222165Sjilles 1890222165Sjilles 18911556Srgrimes/* 18921556Srgrimes * Called when an unexpected token is read during the parse. The argument 18931556Srgrimes * is the token that is expected, or -1 if more than one type of token can 18941556Srgrimes * occur at this point. 18951556Srgrimes */ 18961556Srgrimes 1897213811Sobrienstatic void 189890111Simpsynexpect(int token) 189917987Speter{ 19001556Srgrimes char msg[64]; 19011556Srgrimes 19021556Srgrimes if (token >= 0) { 19031556Srgrimes fmtstr(msg, 64, "%s unexpected (expecting %s)", 19041556Srgrimes tokname[lasttoken], tokname[token]); 19051556Srgrimes } else { 19061556Srgrimes fmtstr(msg, 64, "%s unexpected", tokname[lasttoken]); 19071556Srgrimes } 19081556Srgrimes synerror(msg); 19091556Srgrimes} 19101556Srgrimes 19111556Srgrimes 1912213811Sobrienstatic void 1913201053Sjillessynerror(const char *msg) 191490111Simp{ 19151556Srgrimes if (commandname) 1916201366Sjilles outfmt(out2, "%s: %d: ", commandname, startlinno); 1917201366Sjilles outfmt(out2, "Syntax error: %s\n", msg); 19181556Srgrimes error((char *)NULL); 19191556Srgrimes} 19201556Srgrimes 1921213811Sobrienstatic void 192290111Simpsetprompt(int which) 192390111Simp{ 19241556Srgrimes whichprompt = which; 19251556Srgrimes 192617987Speter#ifndef NO_HISTORY 19271556Srgrimes if (!el) 192817987Speter#endif 1929199629Sjilles { 19301556Srgrimes out2str(getprompt(NULL)); 1931199629Sjilles flushout(out2); 1932199629Sjilles } 
19331556Srgrimes} 19341556Srgrimes 19351556Srgrimes/* 19361556Srgrimes * called by editline -- any expansions to the prompt 19371556Srgrimes * should be added here. 19381556Srgrimes */ 19391556Srgrimeschar * 194090111Simpgetprompt(void *unused __unused) 194125905Ssteve{ 1942142845Sobrien static char ps[PROMPTLEN]; 1943142845Sobrien char *fmt; 1944209653Sjilles const char *pwd; 1945209653Sjilles int i, trim; 1946214538Sjilles static char internal_error[] = "??"; 1947142845Sobrien 1948142845Sobrien /* 1949142845Sobrien * Select prompt format. 1950142845Sobrien */ 19511556Srgrimes switch (whichprompt) { 19521556Srgrimes case 0: 1953201053Sjilles fmt = nullstr; 1954142845Sobrien break; 19551556Srgrimes case 1: 1956142845Sobrien fmt = ps1val(); 1957142845Sobrien break; 19581556Srgrimes case 2: 1959142845Sobrien fmt = ps2val(); 1960142845Sobrien break; 19611556Srgrimes default: 1962201053Sjilles return internal_error; 19631556Srgrimes } 1964142845Sobrien 1965142845Sobrien /* 1966142845Sobrien * Format prompt string. 1967142845Sobrien */ 1968142845Sobrien for (i = 0; (i < 127) && (*fmt != '\0'); i++, fmt++) 1969142845Sobrien if (*fmt == '\\') 1970142845Sobrien switch (*++fmt) { 1971142845Sobrien 1972142845Sobrien /* 1973142845Sobrien * Hostname. 1974142845Sobrien * 1975142845Sobrien * \h specifies just the local hostname, 1976142845Sobrien * \H specifies fully-qualified hostname. 1977142845Sobrien */ 1978142845Sobrien case 'h': 1979142845Sobrien case 'H': 1980149024Sstefanf ps[i] = '\0'; 1981142845Sobrien gethostname(&ps[i], PROMPTLEN - i); 1982142845Sobrien /* Skip to end of hostname. */ 1983142845Sobrien trim = (*fmt == 'h') ? '.' : '\0'; 1984142845Sobrien while ((ps[i+1] != '\0') && (ps[i+1] != trim)) 1985142845Sobrien i++; 1986142845Sobrien break; 1987142845Sobrien 1988142845Sobrien /* 1989142845Sobrien * Working directory. 1990142845Sobrien * 1991142845Sobrien * \W specifies just the final component, 1992142845Sobrien * \w specifies the entire path. 
1993142845Sobrien */ 1994142845Sobrien case 'W': 1995142845Sobrien case 'w': 1996209653Sjilles pwd = lookupvar("PWD"); 1997209653Sjilles if (pwd == NULL) 1998209653Sjilles pwd = "?"; 1999209653Sjilles if (*fmt == 'W' && 2000209653Sjilles *pwd == '/' && pwd[1] != '\0') 2001209653Sjilles strlcpy(&ps[i], strrchr(pwd, '/') + 1, 2002209653Sjilles PROMPTLEN - i); 2003209653Sjilles else 2004209653Sjilles strlcpy(&ps[i], pwd, PROMPTLEN - i); 2005142845Sobrien /* Skip to end of path. */ 2006142845Sobrien while (ps[i + 1] != '\0') 2007142845Sobrien i++; 2008142845Sobrien break; 2009142845Sobrien 2010142845Sobrien /* 2011142845Sobrien * Superuser status. 2012142845Sobrien * 2013142845Sobrien * '$' for normal users, '#' for root. 2014142845Sobrien */ 2015142845Sobrien case '$': 2016142845Sobrien ps[i] = (geteuid() != 0) ? '$' : '#'; 2017142845Sobrien break; 2018142845Sobrien 2019142845Sobrien /* 2020142845Sobrien * A literal \. 2021142845Sobrien */ 2022142845Sobrien case '\\': 2023142845Sobrien ps[i] = '\\'; 2024142845Sobrien break; 2025142845Sobrien 2026142845Sobrien /* 2027142845Sobrien * Emit unrecognized formats verbatim. 
2028142845Sobrien */ 2029142845Sobrien default: 2030142845Sobrien ps[i++] = '\\'; 2031142845Sobrien ps[i] = *fmt; 2032142845Sobrien break; 2033142845Sobrien } 2034142845Sobrien else 2035142845Sobrien ps[i] = *fmt; 2036142845Sobrien ps[i] = '\0'; 2037142845Sobrien return (ps); 20381556Srgrimes} 2039222907Sjilles 2040222907Sjilles 2041222907Sjillesconst char * 2042248980Sjillesexpandstr(const char *ps) 2043222907Sjilles{ 2044222907Sjilles union node n; 2045222907Sjilles struct jmploc jmploc; 2046222907Sjilles struct jmploc *const savehandler = handler; 2047222907Sjilles const int saveprompt = doprompt; 2048222907Sjilles struct parsefile *const savetopfile = getcurrentfile(); 2049222907Sjilles struct parser_temp *const saveparser_temp = parser_temp; 2050222907Sjilles const char *result = NULL; 2051222907Sjilles 2052222907Sjilles if (!setjmp(jmploc.loc)) { 2053222907Sjilles handler = &jmploc; 2054222907Sjilles parser_temp = NULL; 2055222907Sjilles setinputstring(ps, 1); 2056222907Sjilles doprompt = 0; 2057222907Sjilles readtoken1(pgetc(), DQSYNTAX, "\n\n", 0); 2058222907Sjilles if (backquotelist != NULL) 2059222907Sjilles error("Command substitution not allowed here"); 2060222907Sjilles 2061222907Sjilles n.narg.type = NARG; 2062222907Sjilles n.narg.next = NULL; 2063222907Sjilles n.narg.text = wordtext; 2064222907Sjilles n.narg.backquote = backquotelist; 2065222907Sjilles 2066222907Sjilles expandarg(&n, NULL, 0); 2067222907Sjilles result = stackblock(); 2068222907Sjilles INTOFF; 2069222907Sjilles } 2070222907Sjilles handler = savehandler; 2071222907Sjilles doprompt = saveprompt; 2072222907Sjilles popfilesupto(savetopfile); 2073222907Sjilles if (parser_temp != saveparser_temp) { 2074222907Sjilles parser_temp_free_all(); 2075222907Sjilles parser_temp = saveparser_temp; 2076222907Sjilles } 2077222907Sjilles if (result != NULL) { 2078222907Sjilles INTON; 2079222907Sjilles } else if (exception == EXINT) 2080222907Sjilles raise(SIGINT); 2081222907Sjilles return result; 
2082222907Sjilles} 2083