parser.c revision 254843
11556Srgrimes/*- 21556Srgrimes * Copyright (c) 1991, 1993 31556Srgrimes * The Regents of the University of California. All rights reserved. 41556Srgrimes * 51556Srgrimes * This code is derived from software contributed to Berkeley by 61556Srgrimes * Kenneth Almquist. 71556Srgrimes * 81556Srgrimes * Redistribution and use in source and binary forms, with or without 91556Srgrimes * modification, are permitted provided that the following conditions 101556Srgrimes * are met: 111556Srgrimes * 1. Redistributions of source code must retain the above copyright 121556Srgrimes * notice, this list of conditions and the following disclaimer. 131556Srgrimes * 2. Redistributions in binary form must reproduce the above copyright 141556Srgrimes * notice, this list of conditions and the following disclaimer in the 151556Srgrimes * documentation and/or other materials provided with the distribution. 161556Srgrimes * 4. Neither the name of the University nor the names of its contributors 171556Srgrimes * may be used to endorse or promote products derived from this software 181556Srgrimes * without specific prior written permission. 191556Srgrimes * 201556Srgrimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 211556Srgrimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 221556Srgrimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 231556Srgrimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 241556Srgrimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 251556Srgrimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 261556Srgrimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 271556Srgrimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 281556Srgrimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 291556Srgrimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 301556Srgrimes * SUCH DAMAGE. 311556Srgrimes */ 321556Srgrimes 331556Srgrimes#ifndef lint 3436150Scharnier#if 0 3536150Scharnierstatic char sccsid[] = "@(#)parser.c 8.7 (Berkeley) 5/16/95"; 3636150Scharnier#endif 371556Srgrimes#endif /* not lint */ 3899110Sobrien#include <sys/cdefs.h> 3999110Sobrien__FBSDID("$FreeBSD: head/bin/sh/parser.c 254843 2013-08-25 10:57:48Z jilles $"); 401556Srgrimes 4117987Speter#include <stdlib.h> 42149017Sstefanf#include <unistd.h> 43209337Sjilles#include <stdio.h> 4417987Speter 451556Srgrimes#include "shell.h" 461556Srgrimes#include "parser.h" 471556Srgrimes#include "nodes.h" 481556Srgrimes#include "expand.h" /* defines rmescapes() */ 491556Srgrimes#include "syntax.h" 501556Srgrimes#include "options.h" 511556Srgrimes#include "input.h" 521556Srgrimes#include "output.h" 531556Srgrimes#include "var.h" 541556Srgrimes#include "error.h" 551556Srgrimes#include "memalloc.h" 561556Srgrimes#include "mystring.h" 571556Srgrimes#include "alias.h" 5817987Speter#include "show.h" 5959436Scracauer#include "eval.h" 60214304Sjilles#include "exec.h" /* to check for special builtins */ 6117987Speter#ifndef NO_HISTORY 621556Srgrimes#include "myhistedit.h" 6317987Speter#endif 641556Srgrimes 651556Srgrimes/* 661556Srgrimes * Shell command parser. 671556Srgrimes */ 681556Srgrimes 69142845Sobrien#define EOFMARKLEN 79 70142845Sobrien#define PROMPTLEN 128 711556Srgrimes 72214709Sjilles/* values of checkkwd variable */ 73214709Sjilles#define CHKALIAS 0x1 74214709Sjilles#define CHKKWD 0x2 75214709Sjilles#define CHKNL 0x4 76214709Sjilles 771556Srgrimes/* values returned by readtoken */ 7817987Speter#include "token.h" 791556Srgrimes 801556Srgrimes 811556Srgrimes 821556Srgrimesstruct heredoc { 831556Srgrimes struct heredoc *next; /* next here document in list */ 841556Srgrimes union node *here; /* redirection node */ 851556Srgrimes char *eofmark; /* string indicating end of input */ 861556Srgrimes int striptabs; /* if set, strip leading tabs */ 871556Srgrimes}; 881556Srgrimes 89206145Sjillesstruct parser_temp { 90206145Sjilles struct parser_temp *next; 91206145Sjilles void *data; 92206145Sjilles}; 931556Srgrimes 941556Srgrimes 95213760Sobrienstatic struct heredoc *heredoclist; /* list of here documents to read */ 96213760Sobrienstatic int doprompt; /* if set, prompt the user */ 97213760Sobrienstatic int needprompt; /* true if interactive and at start of line */ 98213760Sobrienstatic int lasttoken; /* last token read */ 99253658Sjillesint tokpushback; /* last token pushed back */ 100213760Sobrienstatic char *wordtext; /* text of last word returned by readtoken */ 101253659Sjillesstatic int checkkwd; 102213760Sobrienstatic struct nodelist *backquotelist; 103213760Sobrienstatic union node *redirnode; 104213760Sobrienstatic struct heredoc *heredoc; 105213760Sobrienstatic int quoteflag; /* set if (part of) last token was quoted */ 106213760Sobrienstatic int startlinno; /* line # where last token started */ 107213760Sobrienstatic int funclinno; /* line # where the current function started */ 108213760Sobrienstatic struct parser_temp *parser_temp; 1091556Srgrimes 1101556Srgrimes 111214525Sjillesstatic union node *list(int, int); 112213811Sobrienstatic union node *andor(void); 113213811Sobrienstatic union node *pipeline(void); 114213811Sobrienstatic union node *command(void); 115213811Sobrienstatic union node *simplecmd(union node **, union node *); 116213811Sobrienstatic union node *makename(void); 117213811Sobrienstatic void parsefname(void); 118213811Sobrienstatic void parseheredoc(void); 119213811Sobrienstatic int peektoken(void); 120213811Sobrienstatic int readtoken(void); 121213811Sobrienstatic int xxreadtoken(void); 122248980Sjillesstatic int readtoken1(int, const char *, const char *, int); 123213811Sobrienstatic int noexpand(char *); 124213811Sobrienstatic void synexpect(int) __dead2; 125213811Sobrienstatic void synerror(const char *) __dead2; 126213811Sobrienstatic void setprompt(int); 1271556Srgrimes 12817987Speter 129213811Sobrienstatic void * 130206145Sjillesparser_temp_alloc(size_t len) 131206145Sjilles{ 132206145Sjilles struct parser_temp *t; 133206145Sjilles 134206145Sjilles INTOFF; 135206145Sjilles t = ckmalloc(sizeof(*t)); 136206145Sjilles t->data = NULL; 137206145Sjilles t->next = parser_temp; 138206145Sjilles parser_temp = t; 139206145Sjilles t->data = ckmalloc(len); 140206145Sjilles INTON; 141206145Sjilles return t->data; 142206145Sjilles} 143206145Sjilles 144206145Sjilles 145213811Sobrienstatic void * 146206145Sjillesparser_temp_realloc(void *ptr, size_t len) 147206145Sjilles{ 148206145Sjilles struct parser_temp *t; 149206145Sjilles 150206145Sjilles INTOFF; 151206145Sjilles t = parser_temp; 152206145Sjilles if (ptr != t->data) 153206145Sjilles error("bug: parser_temp_realloc misused"); 154206145Sjilles t->data = ckrealloc(t->data, len); 155206145Sjilles INTON; 156206145Sjilles return t->data; 157206145Sjilles} 158206145Sjilles 159206145Sjilles 160213811Sobrienstatic void 161206145Sjillesparser_temp_free_upto(void *ptr) 162206145Sjilles{ 163206145Sjilles struct parser_temp *t; 164206145Sjilles int done = 0; 165206145Sjilles 166206145Sjilles INTOFF; 167206145Sjilles while (parser_temp != NULL && !done) { 168206145Sjilles t = parser_temp; 169206145Sjilles parser_temp = t->next; 170206145Sjilles done = t->data == ptr; 171206145Sjilles ckfree(t->data); 172206145Sjilles ckfree(t); 173206145Sjilles } 174206145Sjilles INTON; 175206145Sjilles if (!done) 176206145Sjilles error("bug: parser_temp_free_upto misused"); 177206145Sjilles} 178206145Sjilles 179206145Sjilles 180213811Sobrienstatic void 181206145Sjillesparser_temp_free_all(void) 182206145Sjilles{ 183206145Sjilles struct parser_temp *t; 184206145Sjilles 185206145Sjilles INTOFF; 186206145Sjilles while (parser_temp != NULL) { 187206145Sjilles t = parser_temp; 188206145Sjilles parser_temp = t->next; 189206145Sjilles ckfree(t->data); 190206145Sjilles ckfree(t); 191206145Sjilles } 192206145Sjilles INTON; 193206145Sjilles} 194206145Sjilles 195206145Sjilles 1961556Srgrimes/* 1971556Srgrimes * Read and parse a command. Returns NEOF on end of file. (NULL is a 1981556Srgrimes * valid parse tree indicating a blank line.) 1991556Srgrimes */ 2001556Srgrimes 2011556Srgrimesunion node * 20290111Simpparsecmd(int interact) 20317987Speter{ 2041556Srgrimes int t; 2051556Srgrimes 206206145Sjilles /* This assumes the parser is not re-entered, 207206145Sjilles * which could happen if we add command substitution on PS1/PS2. 208206145Sjilles */ 209206145Sjilles parser_temp_free_all(); 210208656Sjilles heredoclist = NULL; 211206145Sjilles 21260593Scracauer tokpushback = 0; 213254426Sjilles checkkwd = 0; 2141556Srgrimes doprompt = interact; 2151556Srgrimes if (doprompt) 2161556Srgrimes setprompt(1); 2171556Srgrimes else 2181556Srgrimes setprompt(0); 2191556Srgrimes needprompt = 0; 2201556Srgrimes t = readtoken(); 2211556Srgrimes if (t == TEOF) 2221556Srgrimes return NEOF; 2231556Srgrimes if (t == TNL) 2241556Srgrimes return NULL; 2251556Srgrimes tokpushback++; 226214531Sjilles return list(1, 1); 2271556Srgrimes} 2281556Srgrimes 2291556Srgrimes 230213811Sobrienstatic union node * 231214525Sjilleslist(int nlflag, int erflag) 23217987Speter{ 233214599Sjilles union node *ntop, *n1, *n2, *n3; 23417987Speter int tok; 2351556Srgrimes 236214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 237214531Sjilles if (!nlflag && !erflag && tokendlist[peektoken()]) 2381556Srgrimes return NULL; 239214599Sjilles ntop = n1 = NULL; 2401556Srgrimes for (;;) { 24117987Speter n2 = andor(); 24217987Speter tok = readtoken(); 24317987Speter if (tok == TBACKGND) { 244245382Sjilles if (n2 != NULL && n2->type == NPIPE) { 245223282Sjilles n2->npipe.backgnd = 1; 246245382Sjilles } else if (n2 != NULL && n2->type == NREDIR) { 24717987Speter n2->type = NBACKGND; 24817987Speter } else { 24917987Speter n3 = (union node *)stalloc(sizeof (struct nredir)); 25017987Speter n3->type = NBACKGND; 25117987Speter n3->nredir.n = n2; 25217987Speter n3->nredir.redirect = NULL; 25317987Speter n2 = n3; 25417987Speter } 25517987Speter } 256214599Sjilles if (ntop == NULL) 257214599Sjilles ntop = n2; 258214599Sjilles else if (n1 == NULL) { 259214599Sjilles n1 = (union node *)stalloc(sizeof (struct nbinary)); 260214599Sjilles n1->type = NSEMI; 261214599Sjilles n1->nbinary.ch1 = ntop; 262214599Sjilles n1->nbinary.ch2 = n2; 263214599Sjilles ntop = n1; 26417987Speter } 26517987Speter else { 26617987Speter n3 = (union node *)stalloc(sizeof (struct nbinary)); 26717987Speter n3->type = NSEMI; 268214599Sjilles n3->nbinary.ch1 = n1->nbinary.ch2; 26917987Speter n3->nbinary.ch2 = n2; 270214599Sjilles n1->nbinary.ch2 = n3; 27117987Speter n1 = n3; 27217987Speter } 27317987Speter switch (tok) { 27413882Sjoerg case TBACKGND: 27517987Speter case TSEMI: 27617987Speter tok = readtoken(); 277102410Scharnier /* FALLTHROUGH */ 2781556Srgrimes case TNL: 27917987Speter if (tok == TNL) { 28017987Speter parseheredoc(); 28117987Speter if (nlflag) 282214599Sjilles return ntop; 283210488Sjilles } else if (tok == TEOF && nlflag) { 284210488Sjilles parseheredoc(); 285214599Sjilles return ntop; 28617987Speter } else { 28717987Speter tokpushback++; 28817987Speter } 289214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 290245381Sjilles if (!nlflag && (erflag ? peektoken() == TEOF : 291245381Sjilles tokendlist[peektoken()])) 292214599Sjilles return ntop; 2931556Srgrimes break; 2941556Srgrimes case TEOF: 2951556Srgrimes if (heredoclist) 2961556Srgrimes parseheredoc(); 2971556Srgrimes else 2981556Srgrimes pungetc(); /* push back EOF on input */ 299214599Sjilles return ntop; 3001556Srgrimes default: 301214525Sjilles if (nlflag || erflag) 3021556Srgrimes synexpect(-1); 3031556Srgrimes tokpushback++; 304214599Sjilles return ntop; 3051556Srgrimes } 3061556Srgrimes } 3071556Srgrimes} 3081556Srgrimes 3091556Srgrimes 3101556Srgrimes 311213811Sobrienstatic union node * 31290111Simpandor(void) 31390111Simp{ 3141556Srgrimes union node *n1, *n2, *n3; 3151556Srgrimes int t; 3161556Srgrimes 3171556Srgrimes n1 = pipeline(); 3181556Srgrimes for (;;) { 3191556Srgrimes if ((t = readtoken()) == TAND) { 3201556Srgrimes t = NAND; 3211556Srgrimes } else if (t == TOR) { 3221556Srgrimes t = NOR; 3231556Srgrimes } else { 3241556Srgrimes tokpushback++; 3251556Srgrimes return n1; 3261556Srgrimes } 3271556Srgrimes n2 = pipeline(); 3281556Srgrimes n3 = (union node *)stalloc(sizeof (struct nbinary)); 3291556Srgrimes n3->type = t; 3301556Srgrimes n3->nbinary.ch1 = n1; 3311556Srgrimes n3->nbinary.ch2 = n2; 3321556Srgrimes n1 = n3; 3331556Srgrimes } 3341556Srgrimes} 3351556Srgrimes 3361556Srgrimes 3371556Srgrimes 338213811Sobrienstatic union node * 33990111Simppipeline(void) 34090111Simp{ 34175336Sbrian union node *n1, *n2, *pipenode; 3421556Srgrimes struct nodelist *lp, *prev; 343214281Sjilles int negate, t; 3441556Srgrimes 34575336Sbrian negate = 0; 346214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 3471556Srgrimes TRACE(("pipeline: entered\n")); 34875336Sbrian while (readtoken() == TNOT) 34975336Sbrian negate = !negate; 35075336Sbrian tokpushback++; 3511556Srgrimes n1 = command(); 3521556Srgrimes if (readtoken() == TPIPE) { 3531556Srgrimes pipenode = (union node *)stalloc(sizeof (struct npipe)); 3541556Srgrimes pipenode->type = NPIPE; 3551556Srgrimes pipenode->npipe.backgnd = 0; 3561556Srgrimes lp = (struct nodelist *)stalloc(sizeof (struct nodelist)); 3571556Srgrimes pipenode->npipe.cmdlist = lp; 3581556Srgrimes lp->n = n1; 3591556Srgrimes do { 3601556Srgrimes prev = lp; 3611556Srgrimes lp = (struct nodelist *)stalloc(sizeof (struct nodelist)); 362214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 363214281Sjilles t = readtoken(); 364214281Sjilles tokpushback++; 365214281Sjilles if (t == TNOT) 366214281Sjilles lp->n = pipeline(); 367214281Sjilles else 368214281Sjilles lp->n = command(); 3691556Srgrimes prev->next = lp; 3701556Srgrimes } while (readtoken() == TPIPE); 3711556Srgrimes lp->next = NULL; 3721556Srgrimes n1 = pipenode; 3731556Srgrimes } 3741556Srgrimes tokpushback++; 37575336Sbrian if (negate) { 37675336Sbrian n2 = (union node *)stalloc(sizeof (struct nnot)); 37775336Sbrian n2->type = NNOT; 37875336Sbrian n2->nnot.com = n1; 37975336Sbrian return n2; 38075336Sbrian } else 38175336Sbrian return n1; 3821556Srgrimes} 3831556Srgrimes 3841556Srgrimes 3851556Srgrimes 386213811Sobrienstatic union node * 38790111Simpcommand(void) 38890111Simp{ 3891556Srgrimes union node *n1, *n2; 3901556Srgrimes union node *ap, **app; 3911556Srgrimes union node *cp, **cpp; 3921556Srgrimes union node *redir, **rpp; 393214281Sjilles int t; 394218325Sjilles int is_subshell; 3951556Srgrimes 396214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 397218325Sjilles is_subshell = 0; 39817987Speter redir = NULL; 39917987Speter n1 = NULL; 4001556Srgrimes rpp = &redir; 40120425Ssteve 4021556Srgrimes /* Check for redirection which may precede command */ 4031556Srgrimes while (readtoken() == TREDIR) { 4041556Srgrimes *rpp = n2 = redirnode; 4051556Srgrimes rpp = &n2->nfile.next; 4061556Srgrimes parsefname(); 4071556Srgrimes } 4081556Srgrimes tokpushback++; 4091556Srgrimes 4101556Srgrimes switch (readtoken()) { 4111556Srgrimes case TIF: 4121556Srgrimes n1 = (union node *)stalloc(sizeof (struct nif)); 4131556Srgrimes n1->type = NIF; 414214525Sjilles if ((n1->nif.test = list(0, 0)) == NULL) 415104554Stjr synexpect(-1); 4161556Srgrimes if (readtoken() != TTHEN) 4171556Srgrimes synexpect(TTHEN); 418214525Sjilles n1->nif.ifpart = list(0, 0); 4191556Srgrimes n2 = n1; 4201556Srgrimes while (readtoken() == TELIF) { 4211556Srgrimes n2->nif.elsepart = (union node *)stalloc(sizeof (struct nif)); 4221556Srgrimes n2 = n2->nif.elsepart; 4231556Srgrimes n2->type = NIF; 424214525Sjilles if ((n2->nif.test = list(0, 0)) == NULL) 425104554Stjr synexpect(-1); 4261556Srgrimes if (readtoken() != TTHEN) 4271556Srgrimes synexpect(TTHEN); 428214525Sjilles n2->nif.ifpart = list(0, 0); 4291556Srgrimes } 4301556Srgrimes if (lasttoken == TELSE) 431214525Sjilles n2->nif.elsepart = list(0, 0); 4321556Srgrimes else { 4331556Srgrimes n2->nif.elsepart = NULL; 4341556Srgrimes tokpushback++; 4351556Srgrimes } 4361556Srgrimes if (readtoken() != TFI) 4371556Srgrimes synexpect(TFI); 438214709Sjilles checkkwd = CHKKWD | CHKALIAS; 4391556Srgrimes break; 4401556Srgrimes case TWHILE: 4411556Srgrimes case TUNTIL: { 4421556Srgrimes int got; 4431556Srgrimes n1 = (union node *)stalloc(sizeof (struct nbinary)); 4441556Srgrimes n1->type = (lasttoken == TWHILE)? NWHILE : NUNTIL; 445214525Sjilles if ((n1->nbinary.ch1 = list(0, 0)) == NULL) 446104554Stjr synexpect(-1); 4471556Srgrimes if ((got=readtoken()) != TDO) { 4481556SrgrimesTRACE(("expecting DO got %s %s\n", tokname[got], got == TWORD ? wordtext : "")); 4491556Srgrimes synexpect(TDO); 4501556Srgrimes } 451214525Sjilles n1->nbinary.ch2 = list(0, 0); 4521556Srgrimes if (readtoken() != TDONE) 4531556Srgrimes synexpect(TDONE); 454214709Sjilles checkkwd = CHKKWD | CHKALIAS; 4551556Srgrimes break; 4561556Srgrimes } 4571556Srgrimes case TFOR: 4581556Srgrimes if (readtoken() != TWORD || quoteflag || ! goodname(wordtext)) 4591556Srgrimes synerror("Bad for loop variable"); 4601556Srgrimes n1 = (union node *)stalloc(sizeof (struct nfor)); 4611556Srgrimes n1->type = NFOR; 4621556Srgrimes n1->nfor.var = wordtext; 463199282Sjilles while (readtoken() == TNL) 464199282Sjilles ; 465199282Sjilles if (lasttoken == TWORD && ! quoteflag && equal(wordtext, "in")) { 4661556Srgrimes app = ≈ 4671556Srgrimes while (readtoken() == TWORD) { 4681556Srgrimes n2 = (union node *)stalloc(sizeof (struct narg)); 4691556Srgrimes n2->type = NARG; 4701556Srgrimes n2->narg.text = wordtext; 4711556Srgrimes n2->narg.backquote = backquotelist; 4721556Srgrimes *app = n2; 4731556Srgrimes app = &n2->narg.next; 4741556Srgrimes } 4751556Srgrimes *app = NULL; 4761556Srgrimes n1->nfor.args = ap; 4771556Srgrimes if (lasttoken != TNL && lasttoken != TSEMI) 4781556Srgrimes synexpect(-1); 4791556Srgrimes } else { 480149096Sstefanf static char argvars[5] = { 481149096Sstefanf CTLVAR, VSNORMAL|VSQUOTE, '@', '=', '\0' 482149096Sstefanf }; 4831556Srgrimes n2 = (union node *)stalloc(sizeof (struct narg)); 4841556Srgrimes n2->type = NARG; 485149096Sstefanf n2->narg.text = argvars; 4861556Srgrimes n2->narg.backquote = NULL; 4871556Srgrimes n2->narg.next = NULL; 4881556Srgrimes n1->nfor.args = n2; 4891556Srgrimes /* 4901556Srgrimes * Newline or semicolon here is optional (but note 4911556Srgrimes * that the original Bourne shell only allowed NL). 4921556Srgrimes */ 4931556Srgrimes if (lasttoken != TNL && lasttoken != TSEMI) 4941556Srgrimes tokpushback++; 4951556Srgrimes } 496214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 4971556Srgrimes if ((t = readtoken()) == TDO) 4981556Srgrimes t = TDONE; 4991556Srgrimes else if (t == TBEGIN) 5001556Srgrimes t = TEND; 5011556Srgrimes else 5021556Srgrimes synexpect(-1); 503214525Sjilles n1->nfor.body = list(0, 0); 5041556Srgrimes if (readtoken() != t) 5051556Srgrimes synexpect(t); 506214709Sjilles checkkwd = CHKKWD | CHKALIAS; 5071556Srgrimes break; 5081556Srgrimes case TCASE: 5091556Srgrimes n1 = (union node *)stalloc(sizeof (struct ncase)); 5101556Srgrimes n1->type = NCASE; 5111556Srgrimes if (readtoken() != TWORD) 5121556Srgrimes synexpect(TWORD); 5131556Srgrimes n1->ncase.expr = n2 = (union node *)stalloc(sizeof (struct narg)); 5141556Srgrimes n2->type = NARG; 5151556Srgrimes n2->narg.text = wordtext; 5161556Srgrimes n2->narg.backquote = backquotelist; 5171556Srgrimes n2->narg.next = NULL; 5181556Srgrimes while (readtoken() == TNL); 5191556Srgrimes if (lasttoken != TWORD || ! equal(wordtext, "in")) 5201556Srgrimes synerror("expecting \"in\""); 5211556Srgrimes cpp = &n1->ncase.cases; 522214709Sjilles checkkwd = CHKNL | CHKKWD, readtoken(); 523104202Stjr while (lasttoken != TESAC) { 5241556Srgrimes *cpp = cp = (union node *)stalloc(sizeof (struct nclist)); 5251556Srgrimes cp->type = NCLIST; 5261556Srgrimes app = &cp->nclist.pattern; 527104207Stjr if (lasttoken == TLP) 528104207Stjr readtoken(); 5291556Srgrimes for (;;) { 5301556Srgrimes *app = ap = (union node *)stalloc(sizeof (struct narg)); 5311556Srgrimes ap->type = NARG; 5321556Srgrimes ap->narg.text = wordtext; 5331556Srgrimes ap->narg.backquote = backquotelist; 534214709Sjilles checkkwd = CHKNL | CHKKWD; 535214709Sjilles if (readtoken() != TPIPE) 5361556Srgrimes break; 5371556Srgrimes app = &ap->narg.next; 5382760Ssef readtoken(); 5391556Srgrimes } 5401556Srgrimes ap->narg.next = NULL; 5411556Srgrimes if (lasttoken != TRP) 542214709Sjilles synexpect(TRP); 543214525Sjilles cp->nclist.body = list(0, 0); 5442760Ssef 545214709Sjilles checkkwd = CHKNL | CHKKWD | CHKALIAS; 5462760Ssef if ((t = readtoken()) != TESAC) { 547223186Sjilles if (t == TENDCASE) 548223186Sjilles ; 549223186Sjilles else if (t == TFALLTHRU) 550223186Sjilles cp->type = NCLISTFALLTHRU; 551223186Sjilles else 552214709Sjilles synexpect(TENDCASE); 553223186Sjilles checkkwd = CHKNL | CHKKWD, readtoken(); 5542760Ssef } 5551556Srgrimes cpp = &cp->nclist.next; 556104202Stjr } 5571556Srgrimes *cpp = NULL; 558214709Sjilles checkkwd = CHKKWD | CHKALIAS; 5591556Srgrimes break; 5601556Srgrimes case TLP: 5611556Srgrimes n1 = (union node *)stalloc(sizeof (struct nredir)); 5621556Srgrimes n1->type = NSUBSHELL; 563214525Sjilles n1->nredir.n = list(0, 0); 5641556Srgrimes n1->nredir.redirect = NULL; 5651556Srgrimes if (readtoken() != TRP) 5661556Srgrimes synexpect(TRP); 567214709Sjilles checkkwd = CHKKWD | CHKALIAS; 568218325Sjilles is_subshell = 1; 5691556Srgrimes break; 5701556Srgrimes case TBEGIN: 571214525Sjilles n1 = list(0, 0); 5721556Srgrimes if (readtoken() != TEND) 5731556Srgrimes synexpect(TEND); 574214709Sjilles checkkwd = CHKKWD | CHKALIAS; 5751556Srgrimes break; 576254843Sjilles /* A simple command must have at least one redirection or word. */ 577210221Sjilles case TBACKGND: 57817987Speter case TSEMI: 579101662Stjr case TAND: 580101662Stjr case TOR: 581254335Sjilles case TPIPE: 582254335Sjilles case TENDCASE: 583254335Sjilles case TFALLTHRU: 584254843Sjilles case TEOF: 585254843Sjilles case TNL: 586254843Sjilles case TRP: 58717987Speter if (!redir) 58817987Speter synexpect(-1); 5891556Srgrimes case TWORD: 5901556Srgrimes tokpushback++; 59175160Sbrian n1 = simplecmd(rpp, redir); 592214281Sjilles return n1; 5931556Srgrimes default: 5941556Srgrimes synexpect(-1); 5951556Srgrimes } 5961556Srgrimes 5971556Srgrimes /* Now check for redirection which may follow command */ 5981556Srgrimes while (readtoken() == TREDIR) { 5991556Srgrimes *rpp = n2 = redirnode; 6001556Srgrimes rpp = &n2->nfile.next; 6011556Srgrimes parsefname(); 6021556Srgrimes } 6031556Srgrimes tokpushback++; 6041556Srgrimes *rpp = NULL; 6051556Srgrimes if (redir) { 606218325Sjilles if (!is_subshell) { 6071556Srgrimes n2 = (union node *)stalloc(sizeof (struct nredir)); 6081556Srgrimes n2->type = NREDIR; 6091556Srgrimes n2->nredir.n = n1; 6101556Srgrimes n1 = n2; 6111556Srgrimes } 6121556Srgrimes n1->nredir.redirect = redir; 6131556Srgrimes } 61475160Sbrian 615214281Sjilles return n1; 6161556Srgrimes} 6171556Srgrimes 6181556Srgrimes 619213811Sobrienstatic union node * 62090111Simpsimplecmd(union node **rpp, union node *redir) 62190111Simp{ 6221556Srgrimes union node *args, **app; 6231556Srgrimes union node **orig_rpp = rpp; 624210087Sjilles union node *n = NULL; 625214304Sjilles int special; 626222165Sjilles int savecheckkwd; 6271556Srgrimes 6281556Srgrimes /* If we don't have any redirections already, then we must reset */ 6291556Srgrimes /* rpp to be the address of the local redir variable. */ 6301556Srgrimes if (redir == 0) 6311556Srgrimes rpp = &redir; 6321556Srgrimes 6331556Srgrimes args = NULL; 6341556Srgrimes app = &args; 6358855Srgrimes /* 6361556Srgrimes * We save the incoming value, because we need this for shell 6371556Srgrimes * functions. There can not be a redirect or an argument between 6388855Srgrimes * the function name and the open parenthesis. 6391556Srgrimes */ 6401556Srgrimes orig_rpp = rpp; 6411556Srgrimes 642222165Sjilles savecheckkwd = CHKALIAS; 643222165Sjilles 6441556Srgrimes for (;;) { 645222165Sjilles checkkwd = savecheckkwd; 6461556Srgrimes if (readtoken() == TWORD) { 6471556Srgrimes n = (union node *)stalloc(sizeof (struct narg)); 6481556Srgrimes n->type = NARG; 6491556Srgrimes n->narg.text = wordtext; 6501556Srgrimes n->narg.backquote = backquotelist; 6511556Srgrimes *app = n; 6521556Srgrimes app = &n->narg.next; 653222165Sjilles if (savecheckkwd != 0 && !isassignment(wordtext)) 654222165Sjilles savecheckkwd = 0; 6551556Srgrimes } else if (lasttoken == TREDIR) { 6561556Srgrimes *rpp = n = redirnode; 6571556Srgrimes rpp = &n->nfile.next; 6581556Srgrimes parsefname(); /* read name of redirection file */ 6591556Srgrimes } else if (lasttoken == TLP && app == &args->narg.next 6601556Srgrimes && rpp == orig_rpp) { 6611556Srgrimes /* We have a function */ 6621556Srgrimes if (readtoken() != TRP) 6631556Srgrimes synexpect(TRP); 664179022Sstefanf funclinno = plinno; 665214291Sjilles /* 666214291Sjilles * - Require plain text. 667214291Sjilles * - Functions with '/' cannot be called. 668214534Sjilles * - Reject name=(). 669214534Sjilles * - Reject ksh extended glob patterns. 670214291Sjilles */ 671214291Sjilles if (!noexpand(n->narg.text) || quoteflag || 672214534Sjilles strchr(n->narg.text, '/') || 673214534Sjilles strchr("!%*+-=?@}~", 674214534Sjilles n->narg.text[strlen(n->narg.text) - 1])) 6751556Srgrimes synerror("Bad function name"); 676214291Sjilles rmescapes(n->narg.text); 677214304Sjilles if (find_builtin(n->narg.text, &special) >= 0 && 678214304Sjilles special) 679214304Sjilles synerror("Cannot override a special builtin with a function"); 6801556Srgrimes n->type = NDEFUN; 6811556Srgrimes n->narg.next = command(); 682179022Sstefanf funclinno = 0; 683210087Sjilles return n; 6841556Srgrimes } else { 6851556Srgrimes tokpushback++; 6861556Srgrimes break; 6871556Srgrimes } 6881556Srgrimes } 6891556Srgrimes *app = NULL; 6901556Srgrimes *rpp = NULL; 6911556Srgrimes n = (union node *)stalloc(sizeof (struct ncmd)); 6921556Srgrimes n->type = NCMD; 6931556Srgrimes n->ncmd.args = args; 6941556Srgrimes n->ncmd.redirect = redir; 695210087Sjilles return n; 6961556Srgrimes} 6971556Srgrimes 698213811Sobrienstatic union node * 69990111Simpmakename(void) 70090111Simp{ 70117987Speter union node *n; 7021556Srgrimes 70317987Speter n = (union node *)stalloc(sizeof (struct narg)); 70417987Speter n->type = NARG; 70517987Speter n->narg.next = NULL; 70617987Speter n->narg.text = wordtext; 70717987Speter n->narg.backquote = backquotelist; 70817987Speter return n; 70917987Speter} 71017987Speter 711213760Sobrienvoid 712213760Sobrienfixredir(union node *n, const char *text, int err) 71390111Simp{ 71417987Speter TRACE(("Fix redir %s %d\n", text, err)); 71517987Speter if (!err) 71617987Speter n->ndup.vname = NULL; 71717987Speter 71817987Speter if (is_digit(text[0]) && text[1] == '\0') 71917987Speter n->ndup.dupfd = digit_val(text[0]); 72017987Speter else if (text[0] == '-' && text[1] == '\0') 72117987Speter n->ndup.dupfd = -1; 72217987Speter else { 72320425Ssteve 72417987Speter if (err) 72517987Speter synerror("Bad fd number"); 72617987Speter else 72717987Speter n->ndup.vname = makename(); 72817987Speter } 72917987Speter} 73017987Speter 73117987Speter 732213811Sobrienstatic void 73390111Simpparsefname(void) 73490111Simp{ 7351556Srgrimes union node *n = redirnode; 7361556Srgrimes 7371556Srgrimes if (readtoken() != TWORD) 7381556Srgrimes synexpect(-1); 7391556Srgrimes if (n->type == NHERE) { 7401556Srgrimes struct heredoc *here = heredoc; 7411556Srgrimes struct heredoc *p; 7421556Srgrimes int i; 7431556Srgrimes 7441556Srgrimes if (quoteflag == 0) 7451556Srgrimes n->type = NXHERE; 7461556Srgrimes TRACE(("Here document %d\n", n->type)); 7471556Srgrimes if (here->striptabs) { 7481556Srgrimes while (*wordtext == '\t') 7491556Srgrimes wordtext++; 7501556Srgrimes } 7511556Srgrimes if (! noexpand(wordtext) || (i = strlen(wordtext)) == 0 || i > EOFMARKLEN) 7521556Srgrimes synerror("Illegal eof marker for << redirection"); 7531556Srgrimes rmescapes(wordtext); 7541556Srgrimes here->eofmark = wordtext; 7551556Srgrimes here->next = NULL; 7561556Srgrimes if (heredoclist == NULL) 7571556Srgrimes heredoclist = here; 7581556Srgrimes else { 7591556Srgrimes for (p = heredoclist ; p->next ; p = p->next); 7601556Srgrimes p->next = here; 7611556Srgrimes } 7621556Srgrimes } else if (n->type == NTOFD || n->type == NFROMFD) { 76317987Speter fixredir(n, wordtext, 0); 7641556Srgrimes } else { 76517987Speter n->nfile.fname = makename(); 7661556Srgrimes } 7671556Srgrimes} 7681556Srgrimes 7691556Srgrimes 7701556Srgrimes/* 7711556Srgrimes * Input any here documents. 7721556Srgrimes */ 7731556Srgrimes 774213811Sobrienstatic void 77590111Simpparseheredoc(void) 77690111Simp{ 7771556Srgrimes struct heredoc *here; 7781556Srgrimes union node *n; 7791556Srgrimes 7801556Srgrimes while (heredoclist) { 7811556Srgrimes here = heredoclist; 7821556Srgrimes heredoclist = here->next; 7831556Srgrimes if (needprompt) { 7841556Srgrimes setprompt(2); 7851556Srgrimes needprompt = 0; 7861556Srgrimes } 7871556Srgrimes readtoken1(pgetc(), here->here->type == NHERE? SQSYNTAX : DQSYNTAX, 7881556Srgrimes here->eofmark, here->striptabs); 7891556Srgrimes n = (union node *)stalloc(sizeof (struct narg)); 7901556Srgrimes n->narg.type = NARG; 7911556Srgrimes n->narg.next = NULL; 7921556Srgrimes n->narg.text = wordtext; 7931556Srgrimes n->narg.backquote = backquotelist; 7941556Srgrimes here->here->nhere.doc = n; 7951556Srgrimes } 7961556Srgrimes} 7971556Srgrimes 798213811Sobrienstatic int 79990111Simppeektoken(void) 80090111Simp{ 8011556Srgrimes int t; 8021556Srgrimes 8031556Srgrimes t = readtoken(); 8041556Srgrimes tokpushback++; 8051556Srgrimes return (t); 8061556Srgrimes} 8071556Srgrimes 808213811Sobrienstatic int 80990111Simpreadtoken(void) 81090111Simp{ 8111556Srgrimes int t; 8121556Srgrimes struct alias *ap; 8131556Srgrimes#ifdef DEBUG 8141556Srgrimes int alreadyseen = tokpushback; 8151556Srgrimes#endif 8168855Srgrimes 8171556Srgrimes top: 8181556Srgrimes t = xxreadtoken(); 8191556Srgrimes 820214709Sjilles /* 821214709Sjilles * eat newlines 822214709Sjilles */ 823214709Sjilles if (checkkwd & CHKNL) { 824214709Sjilles while (t == TNL) { 825214709Sjilles parseheredoc(); 826214709Sjilles t = xxreadtoken(); 827214709Sjilles } 828214709Sjilles } 8291556Srgrimes 830214709Sjilles /* 831214709Sjilles * check for keywords and aliases 832214709Sjilles */ 833214709Sjilles if (t == TWORD && !quoteflag) 834214709Sjilles { 835214709Sjilles const char * const *pp; 836214709Sjilles 837214709Sjilles if (checkkwd & CHKKWD) 83898463Sjmallett for (pp = parsekwd; *pp; pp++) { 83920425Ssteve if (**pp == *wordtext && equal(*pp, wordtext)) 84017987Speter { 8411556Srgrimes lasttoken = t = pp - parsekwd + KWDOFFSET; 8421556Srgrimes TRACE(("keyword %s recognized\n", tokname[t])); 8431556Srgrimes goto out; 8441556Srgrimes } 8451556Srgrimes } 846214709Sjilles if (checkkwd & CHKALIAS && 847214709Sjilles (ap = lookupalias(wordtext, 1)) != NULL) { 848214709Sjilles pushstring(ap->val, strlen(ap->val), ap); 849214709Sjilles goto top; 8501556Srgrimes } 851214709Sjilles } 8521556Srgrimesout: 853214709Sjilles if (t != TNOT) 854214709Sjilles checkkwd = 0; 855214709Sjilles 8561556Srgrimes#ifdef DEBUG 8571556Srgrimes if (!alreadyseen) 8581556Srgrimes TRACE(("token %s %s\n", tokname[t], t == TWORD ? wordtext : "")); 8591556Srgrimes else 8601556Srgrimes TRACE(("reread token %s %s\n", tokname[t], t == TWORD ? wordtext : "")); 8611556Srgrimes#endif 8621556Srgrimes return (t); 8631556Srgrimes} 8641556Srgrimes 8651556Srgrimes 8661556Srgrimes/* 8671556Srgrimes * Read the next input token. 8681556Srgrimes * If the token is a word, we set backquotelist to the list of cmds in 8691556Srgrimes * backquotes. We set quoteflag to true if any part of the word was 8701556Srgrimes * quoted. 8711556Srgrimes * If the token is TREDIR, then we set redirnode to a structure containing 8721556Srgrimes * the redirection. 8731556Srgrimes * In all cases, the variable startlinno is set to the number of the line 8741556Srgrimes * on which the token starts. 8751556Srgrimes * 8761556Srgrimes * [Change comment: here documents and internal procedures] 8771556Srgrimes * [Readtoken shouldn't have any arguments. Perhaps we should make the 8781556Srgrimes * word parsing code into a separate routine. In this case, readtoken 8791556Srgrimes * doesn't need to have any internal procedures, but parseword does. 8801556Srgrimes * We could also make parseoperator in essence the main routine, and 8811556Srgrimes * have parseword (readtoken1?) handle both words and redirection.] 8821556Srgrimes */ 8831556Srgrimes 8841556Srgrimes#define RETURN(token) return lasttoken = token 8851556Srgrimes 886213811Sobrienstatic int 88790111Simpxxreadtoken(void) 88890111Simp{ 88925230Ssteve int c; 8901556Srgrimes 8911556Srgrimes if (tokpushback) { 8921556Srgrimes tokpushback = 0; 8931556Srgrimes return lasttoken; 8941556Srgrimes } 8951556Srgrimes if (needprompt) { 8961556Srgrimes setprompt(2); 8971556Srgrimes needprompt = 0; 8981556Srgrimes } 8991556Srgrimes startlinno = plinno; 9001556Srgrimes for (;;) { /* until token or start of word found */ 9011556Srgrimes c = pgetc_macro(); 9021556Srgrimes switch (c) { 9031556Srgrimes case ' ': case '\t': 9041556Srgrimes continue; 9051556Srgrimes case '#': 9061556Srgrimes while ((c = pgetc()) != '\n' && c != PEOF); 9071556Srgrimes pungetc(); 9081556Srgrimes continue; 9091556Srgrimes case '\\': 9101556Srgrimes if (pgetc() == '\n') { 9111556Srgrimes startlinno = ++plinno; 9121556Srgrimes if (doprompt) 9131556Srgrimes setprompt(2); 9141556Srgrimes else 9151556Srgrimes setprompt(0); 9161556Srgrimes continue; 9171556Srgrimes } 9181556Srgrimes pungetc(); 9191556Srgrimes goto breakloop; 9201556Srgrimes case '\n': 9211556Srgrimes plinno++; 9221556Srgrimes needprompt = doprompt; 9231556Srgrimes RETURN(TNL); 9241556Srgrimes case PEOF: 9251556Srgrimes RETURN(TEOF); 9261556Srgrimes case '&': 9271556Srgrimes if (pgetc() == '&') 9281556Srgrimes RETURN(TAND); 9291556Srgrimes pungetc(); 9301556Srgrimes RETURN(TBACKGND); 9311556Srgrimes case '|': 9321556Srgrimes if (pgetc() == '|') 9331556Srgrimes RETURN(TOR); 9341556Srgrimes pungetc(); 9351556Srgrimes RETURN(TPIPE); 9361556Srgrimes case ';': 937223186Sjilles c = pgetc(); 938223186Sjilles if (c == ';') 9391556Srgrimes RETURN(TENDCASE); 940223186Sjilles else if (c == '&') 941223186Sjilles RETURN(TFALLTHRU); 9421556Srgrimes pungetc(); 9431556Srgrimes RETURN(TSEMI); 9441556Srgrimes case '(': 9451556Srgrimes RETURN(TLP); 9461556Srgrimes case ')': 9471556Srgrimes RETURN(TRP); 9481556Srgrimes default: 9491556Srgrimes goto breakloop; 9501556Srgrimes } 9511556Srgrimes } 9521556Srgrimesbreakloop: 9531556Srgrimes return readtoken1(c, BASESYNTAX, (char *)NULL, 0); 9541556Srgrimes#undef RETURN 9551556Srgrimes} 9561556Srgrimes 9571556Srgrimes 958213811Sobrien#define MAXNEST_static 8 959206145Sjillesstruct tokenstate 960206145Sjilles{ 961206145Sjilles const char *syntax; /* *SYNTAX */ 962206145Sjilles int parenlevel; /* levels of parentheses in arithmetic */ 963206145Sjilles enum tokenstate_category 964206145Sjilles { 965206145Sjilles TSTATE_TOP, 966206145Sjilles TSTATE_VAR_OLD, /* ${var+-=?}, inherits dquotes */ 967206145Sjilles TSTATE_VAR_NEW, /* other ${var...}, own dquote state */ 968206145Sjilles TSTATE_ARITH 969206145Sjilles } category; 970206145Sjilles}; 971206145Sjilles 972206145Sjilles 973205130Sjilles/* 974205130Sjilles * Called to parse command substitutions. 975205130Sjilles */ 9761556Srgrimes 977213811Sobrienstatic char * 978205130Sjillesparsebackq(char *out, struct nodelist **pbqlist, 979205130Sjilles int oldstyle, int dblquote, int quoted) 980205130Sjilles{ 981205130Sjilles struct nodelist **nlpp; 982205130Sjilles union node *n; 983205130Sjilles char *volatile str; 984205130Sjilles struct jmploc jmploc; 985205130Sjilles struct jmploc *const savehandler = handler; 986248980Sjilles size_t savelen; 987205130Sjilles int saveprompt; 988205130Sjilles const int bq_startlinno = plinno; 989205130Sjilles char *volatile ostr = NULL; 990205130Sjilles struct parsefile *const savetopfile = getcurrentfile(); 991208655Sjilles struct heredoc *const saveheredoclist = heredoclist; 992208655Sjilles struct heredoc *here; 993205130Sjilles 994205130Sjilles str = NULL; 995205130Sjilles if (setjmp(jmploc.loc)) { 996205130Sjilles popfilesupto(savetopfile); 997205130Sjilles if (str) 998205130Sjilles ckfree(str); 999205130Sjilles if (ostr) 1000205130Sjilles ckfree(ostr); 1001208655Sjilles heredoclist = saveheredoclist; 1002205130Sjilles handler = savehandler; 1003205130Sjilles if (exception == EXERROR) { 1004205130Sjilles startlinno = bq_startlinno; 1005205130Sjilles synerror("Error in command substitution"); 1006205130Sjilles } 1007205130Sjilles longjmp(handler->loc, 1); 1008205130Sjilles } 1009205130Sjilles INTOFF; 1010205130Sjilles savelen = out - stackblock(); 1011205130Sjilles if (savelen > 0) { 1012205130Sjilles str = ckmalloc(savelen); 1013205130Sjilles memcpy(str, stackblock(), savelen); 1014205130Sjilles } 1015205130Sjilles handler = &jmploc; 1016208655Sjilles heredoclist = NULL; 1017205130Sjilles INTON; 1018205130Sjilles if (oldstyle) { 1019205130Sjilles /* We must read until the closing backquote, giving special 1020205130Sjilles treatment to some slashes, and then push the string and 1021205130Sjilles reread it as input, interpreting it normally. */ 1022205130Sjilles char *oout; 1023205130Sjilles int c; 1024205130Sjilles int olen; 1025205130Sjilles 1026205130Sjilles 1027205130Sjilles STARTSTACKSTR(oout); 1028205130Sjilles for (;;) { 1029205130Sjilles if (needprompt) { 1030205130Sjilles setprompt(2); 1031205130Sjilles needprompt = 0; 1032205130Sjilles } 1033215783Sjilles CHECKSTRSPACE(2, oout); 1034205130Sjilles switch (c = pgetc()) { 1035205130Sjilles case '`': 1036205130Sjilles goto done; 1037205130Sjilles 1038205130Sjilles case '\\': 1039205130Sjilles if ((c = pgetc()) == '\n') { 1040205130Sjilles plinno++; 1041205130Sjilles if (doprompt) 1042205130Sjilles setprompt(2); 1043205130Sjilles else 1044205130Sjilles setprompt(0); 1045205130Sjilles /* 1046205130Sjilles * If eating a newline, avoid putting 1047205130Sjilles * the newline into the new character 1048215783Sjilles * stream (via the USTPUTC after the 1049205130Sjilles * switch). 1050205130Sjilles */ 1051205130Sjilles continue; 1052205130Sjilles } 1053205130Sjilles if (c != '\\' && c != '`' && c != '$' 1054205130Sjilles && (!dblquote || c != '"')) 1055215783Sjilles USTPUTC('\\', oout); 1056205130Sjilles break; 1057205130Sjilles 1058205130Sjilles case '\n': 1059205130Sjilles plinno++; 1060205130Sjilles needprompt = doprompt; 1061205130Sjilles break; 1062205130Sjilles 1063205130Sjilles case PEOF: 1064205130Sjilles startlinno = plinno; 1065205130Sjilles synerror("EOF in backquote substitution"); 1066205130Sjilles break; 1067205130Sjilles 1068205130Sjilles default: 1069205130Sjilles break; 1070205130Sjilles } 1071215783Sjilles USTPUTC(c, oout); 1072205130Sjilles } 1073205130Sjillesdone: 1074215783Sjilles USTPUTC('\0', oout); 1075205130Sjilles olen = oout - stackblock(); 1076205130Sjilles INTOFF; 1077205130Sjilles ostr = ckmalloc(olen); 1078205130Sjilles memcpy(ostr, stackblock(), olen); 1079205130Sjilles setinputstring(ostr, 1); 1080205130Sjilles INTON; 1081205130Sjilles } 1082205130Sjilles nlpp = pbqlist; 1083205130Sjilles while (*nlpp) 1084205130Sjilles nlpp = &(*nlpp)->next; 1085205130Sjilles *nlpp = (struct nodelist *)stalloc(sizeof (struct nodelist)); 1086205130Sjilles (*nlpp)->next = NULL; 1087205130Sjilles 1088205130Sjilles if (oldstyle) { 1089205130Sjilles saveprompt = doprompt; 1090205130Sjilles doprompt = 0; 1091205130Sjilles } 1092205130Sjilles 1093214525Sjilles n = list(0, oldstyle); 1094205130Sjilles 1095205130Sjilles if (oldstyle) 1096205130Sjilles doprompt = saveprompt; 1097205130Sjilles else { 1098205130Sjilles if (readtoken() != TRP) 1099205130Sjilles synexpect(TRP); 1100205130Sjilles } 1101205130Sjilles 1102205130Sjilles (*nlpp)->n = n; 1103205130Sjilles if (oldstyle) { 1104205130Sjilles /* 1105205130Sjilles * Start reading from old file again, ignoring any pushed back 1106205130Sjilles * tokens left from the backquote parsing 1107205130Sjilles */ 1108205130Sjilles popfile(); 1109205130Sjilles tokpushback = 0; 1110205130Sjilles } 1111205130Sjilles STARTSTACKSTR(out); 1112216706Sjilles CHECKSTRSPACE(savelen + 1, out); 1113208655Sjilles INTOFF; 1114205130Sjilles if (str) { 1115205130Sjilles memcpy(out, str, savelen); 1116205130Sjilles STADJUST(savelen, out); 1117205130Sjilles ckfree(str); 1118205130Sjilles str = NULL; 1119205130Sjilles } 1120205130Sjilles if (ostr) { 1121205130Sjilles ckfree(ostr); 1122205130Sjilles ostr = NULL; 1123205130Sjilles } 1124208655Sjilles here = saveheredoclist; 1125208655Sjilles if (here != NULL) { 1126208655Sjilles while (here->next != NULL) 1127208655Sjilles here = here->next; 1128208655Sjilles here->next = heredoclist; 1129208655Sjilles heredoclist = saveheredoclist; 1130208655Sjilles } 1131205130Sjilles handler = savehandler; 1132208655Sjilles INTON; 1133205130Sjilles if (quoted) 1134205130Sjilles USTPUTC(CTLBACKQ | CTLQUOTE, out); 1135205130Sjilles else 1136205130Sjilles USTPUTC(CTLBACKQ, out); 1137205130Sjilles return out; 1138205130Sjilles} 1139205130Sjilles 1140205130Sjilles 11411556Srgrimes/* 1142221513Sjilles * Called to parse a backslash escape sequence inside $'...'. 1143221513Sjilles * The backslash has already been read. 1144221513Sjilles */ 1145221513Sjillesstatic char * 1146221513Sjillesreadcstyleesc(char *out) 1147221513Sjilles{ 1148221513Sjilles int c, v, i, n; 1149221513Sjilles 1150221513Sjilles c = pgetc(); 1151221513Sjilles switch (c) { 1152221513Sjilles case '\0': 1153221513Sjilles synerror("Unterminated quoted string"); 1154221513Sjilles case '\n': 1155221513Sjilles plinno++; 1156221513Sjilles if (doprompt) 1157221513Sjilles setprompt(2); 1158221513Sjilles else 1159221513Sjilles setprompt(0); 1160221513Sjilles return out; 1161221513Sjilles case '\\': 1162221513Sjilles case '\'': 1163221513Sjilles case '"': 1164221513Sjilles v = c; 1165221513Sjilles break; 1166221513Sjilles case 'a': v = '\a'; break; 1167221513Sjilles case 'b': v = '\b'; break; 1168221513Sjilles case 'e': v = '\033'; break; 1169221513Sjilles case 'f': v = '\f'; break; 1170221513Sjilles case 'n': v = '\n'; break; 1171221513Sjilles case 'r': v = '\r'; break; 1172221513Sjilles case 't': v = '\t'; break; 1173221513Sjilles case 'v': v = '\v'; break; 1174221513Sjilles case 'x': 1175221513Sjilles v = 0; 1176221513Sjilles for (;;) { 1177221513Sjilles c = pgetc(); 1178221513Sjilles if (c >= '0' && c <= '9') 1179221513Sjilles v = (v << 4) + c - '0'; 1180221513Sjilles else if (c >= 'A' && c <= 'F') 1181221513Sjilles v = (v << 4) + c - 'A' + 10; 1182221513Sjilles else if (c >= 'a' && c <= 'f') 1183221513Sjilles v = (v << 4) + c - 'a' + 10; 1184221513Sjilles else 1185221513Sjilles break; 1186221513Sjilles } 1187221513Sjilles pungetc(); 1188221513Sjilles break; 1189221513Sjilles case '0': case '1': case '2': case '3': 1190221513Sjilles case '4': case '5': case '6': case '7': 1191221513Sjilles v = c - '0'; 1192221513Sjilles c = pgetc(); 1193221513Sjilles if (c >= '0' && c <= '7') { 1194221513Sjilles v <<= 3; 1195221513Sjilles v += c - '0'; 1196221513Sjilles c = pgetc(); 1197221513Sjilles if (c >= '0' && c <= '7') { 1198221513Sjilles v <<= 3; 1199221513Sjilles v += c - '0'; 1200221513Sjilles } else 1201221513Sjilles pungetc(); 1202221513Sjilles } else 1203221513Sjilles pungetc(); 1204221513Sjilles break; 1205221513Sjilles case 'c': 1206221513Sjilles c = pgetc(); 1207221513Sjilles if (c < 0x3f || c > 0x7a || c == 0x60) 1208221513Sjilles synerror("Bad escape sequence"); 1209221513Sjilles if (c == '\\' && pgetc() != '\\') 1210221513Sjilles synerror("Bad escape sequence"); 1211221513Sjilles if (c == '?') 1212221513Sjilles v = 127; 1213221513Sjilles else 1214221513Sjilles v = c & 0x1f; 1215221513Sjilles break; 1216221513Sjilles case 'u': 1217221513Sjilles case 'U': 1218221513Sjilles n = c == 'U' ? 8 : 4; 1219221513Sjilles v = 0; 1220221513Sjilles for (i = 0; i < n; i++) { 1221221513Sjilles c = pgetc(); 1222221513Sjilles if (c >= '0' && c <= '9') 1223221513Sjilles v = (v << 4) + c - '0'; 1224221513Sjilles else if (c >= 'A' && c <= 'F') 1225221513Sjilles v = (v << 4) + c - 'A' + 10; 1226221513Sjilles else if (c >= 'a' && c <= 'f') 1227221513Sjilles v = (v << 4) + c - 'a' + 10; 1228221513Sjilles else 1229221513Sjilles synerror("Bad escape sequence"); 1230221513Sjilles } 1231221513Sjilles if (v == 0 || (v >= 0xd800 && v <= 0xdfff)) 1232221513Sjilles synerror("Bad escape sequence"); 1233221513Sjilles /* We really need iconv here. */ 1234221669Sjilles if (initial_localeisutf8 && v > 127) { 1235221669Sjilles CHECKSTRSPACE(4, out); 1236221669Sjilles /* 1237221669Sjilles * We cannot use wctomb() as the locale may have 1238221669Sjilles * changed. 1239221669Sjilles */ 1240221669Sjilles if (v <= 0x7ff) { 1241221669Sjilles USTPUTC(0xc0 | v >> 6, out); 1242221669Sjilles USTPUTC(0x80 | (v & 0x3f), out); 1243221669Sjilles return out; 1244221669Sjilles } else if (v <= 0xffff) { 1245221669Sjilles USTPUTC(0xe0 | v >> 12, out); 1246221669Sjilles USTPUTC(0x80 | ((v >> 6) & 0x3f), out); 1247221669Sjilles USTPUTC(0x80 | (v & 0x3f), out); 1248221669Sjilles return out; 1249221669Sjilles } else if (v <= 0x10ffff) { 1250221669Sjilles USTPUTC(0xf0 | v >> 18, out); 1251221669Sjilles USTPUTC(0x80 | ((v >> 12) & 0x3f), out); 1252221669Sjilles USTPUTC(0x80 | ((v >> 6) & 0x3f), out); 1253221669Sjilles USTPUTC(0x80 | (v & 0x3f), out); 1254221669Sjilles return out; 1255221669Sjilles } 1256221669Sjilles } 1257221513Sjilles if (v > 127) 1258221513Sjilles v = '?'; 1259221513Sjilles break; 1260221513Sjilles default: 1261221513Sjilles synerror("Bad escape sequence"); 1262221513Sjilles } 1263221513Sjilles v = (char)v; 1264221513Sjilles /* 1265221513Sjilles * We can't handle NUL bytes. 1266221513Sjilles * POSIX says we should skip till the closing quote. 1267221513Sjilles */ 1268221513Sjilles if (v == '\0') { 1269221513Sjilles while ((c = pgetc()) != '\'') { 1270221513Sjilles if (c == '\\') 1271221513Sjilles c = pgetc(); 1272221513Sjilles if (c == PEOF) 1273221513Sjilles synerror("Unterminated quoted string"); 1274221513Sjilles } 1275221513Sjilles pungetc(); 1276221513Sjilles return out; 1277221513Sjilles } 1278221513Sjilles if (SQSYNTAX[v] == CCTL) 1279221513Sjilles USTPUTC(CTLESC, out); 1280221513Sjilles USTPUTC(v, out); 1281221513Sjilles return out; 1282221513Sjilles} 1283221513Sjilles 1284221513Sjilles 1285221513Sjilles/* 12861556Srgrimes * If eofmark is NULL, read a word or a redirection symbol. If eofmark 12871556Srgrimes * is not NULL, read a here document. In the latter case, eofmark is the 12881556Srgrimes * word which marks the end of the document and striptabs is true if 12891556Srgrimes * leading tabs should be stripped from the document. The argument firstc 12901556Srgrimes * is the first character of the input token or document. 12911556Srgrimes * 12921556Srgrimes * Because C does not have internal subroutines, I have simulated them 12931556Srgrimes * using goto's to implement the subroutine linkage. The following macros 12941556Srgrimes * will run code that appears at the end of readtoken1. 12951556Srgrimes */ 12961556Srgrimes 12971556Srgrimes#define CHECKEND() {goto checkend; checkend_return:;} 12981556Srgrimes#define PARSEREDIR() {goto parseredir; parseredir_return:;} 12991556Srgrimes#define PARSESUB() {goto parsesub; parsesub_return:;} 13001556Srgrimes#define PARSEARITH() {goto parsearith; parsearith_return:;} 13011556Srgrimes 1302213811Sobrienstatic int 1303248980Sjillesreadtoken1(int firstc, char const *initialsyntax, const char *eofmark, 1304248980Sjilles int striptabs) 130590111Simp{ 130617987Speter int c = firstc; 130717987Speter char *out; 13081556Srgrimes int len; 13091556Srgrimes char line[EOFMARKLEN + 1]; 13101556Srgrimes struct nodelist *bqlist; 13111556Srgrimes int quotef; 1312206145Sjilles int newvarnest; 1313206145Sjilles int level; 131454679Scracauer int synentry; 1315213811Sobrien struct tokenstate state_static[MAXNEST_static]; 1316213811Sobrien int maxnest = MAXNEST_static; 1317206145Sjilles struct tokenstate *state = state_static; 1318221513Sjilles int sqiscstyle = 0; 13191556Srgrimes 13201556Srgrimes startlinno = plinno; 13211556Srgrimes quotef = 0; 13221556Srgrimes bqlist = NULL; 1323206145Sjilles newvarnest = 0; 1324206145Sjilles level = 0; 1325206145Sjilles state[level].syntax = initialsyntax; 1326206145Sjilles state[level].parenlevel = 0; 1327206145Sjilles state[level].category = TSTATE_TOP; 13281556Srgrimes 13291556Srgrimes STARTSTACKSTR(out); 13301556Srgrimes loop: { /* for each line, until end of word */ 13311556Srgrimes CHECKEND(); /* set c to PEOF if at end of here document */ 13321556Srgrimes for (;;) { /* until end of line or end of word */ 1333214512Sjilles CHECKSTRSPACE(4, out); /* permit 4 calls to USTPUTC */ 133454679Scracauer 1335206145Sjilles synentry = state[level].syntax[c]; 133654679Scracauer 133754679Scracauer switch(synentry) { 13381556Srgrimes case CNL: /* '\n' */ 1339206145Sjilles if (state[level].syntax == BASESYNTAX) 13401556Srgrimes goto endword; /* exit outer loop */ 13411556Srgrimes USTPUTC(c, out); 13421556Srgrimes plinno++; 13431556Srgrimes if (doprompt) 13441556Srgrimes setprompt(2); 13451556Srgrimes else 13461556Srgrimes setprompt(0); 13471556Srgrimes c = pgetc(); 13481556Srgrimes goto loop; /* continue outer loop */ 1349221513Sjilles case CSBACK: 1350221513Sjilles if (sqiscstyle) { 1351221513Sjilles out = readcstyleesc(out); 1352221513Sjilles break; 1353221513Sjilles } 1354221513Sjilles /* FALLTHROUGH */ 13551556Srgrimes case CWORD: 13561556Srgrimes USTPUTC(c, out); 13571556Srgrimes break; 13581556Srgrimes case CCTL: 1359206145Sjilles if (eofmark == NULL || initialsyntax != SQSYNTAX) 13601556Srgrimes USTPUTC(CTLESC, out); 13611556Srgrimes USTPUTC(c, out); 13621556Srgrimes break; 13631556Srgrimes case CBACK: /* backslash */ 13641556Srgrimes c = pgetc(); 13651556Srgrimes if (c == PEOF) { 13661556Srgrimes USTPUTC('\\', out); 13671556Srgrimes pungetc(); 13681556Srgrimes } else if (c == '\n') { 1369160849Syar plinno++; 13701556Srgrimes if (doprompt) 13711556Srgrimes setprompt(2); 13721556Srgrimes else 13731556Srgrimes setprompt(0); 13741556Srgrimes } else { 1375206145Sjilles if (state[level].syntax == DQSYNTAX && 1376206145Sjilles c != '\\' && c != '`' && c != '$' && 1377206145Sjilles (c != '"' || (eofmark != NULL && 1378206145Sjilles newvarnest == 0)) && 1379206145Sjilles (c != '}' || state[level].category != TSTATE_VAR_OLD)) 13801556Srgrimes USTPUTC('\\', out); 1381214512Sjilles if ((eofmark == NULL || 1382214512Sjilles newvarnest > 0) && 1383214512Sjilles state[level].syntax == BASESYNTAX) 1384214512Sjilles USTPUTC(CTLQUOTEMARK, out); 138583675Stegge if (SQSYNTAX[c] == CCTL) 13861556Srgrimes USTPUTC(CTLESC, out); 13871556Srgrimes USTPUTC(c, out); 1388214512Sjilles if ((eofmark == NULL || 1389214512Sjilles newvarnest > 0) && 1390214512Sjilles state[level].syntax == BASESYNTAX && 1391214512Sjilles state[level].category == TSTATE_VAR_OLD) 1392214512Sjilles USTPUTC(CTLQUOTEEND, out); 13931556Srgrimes quotef++; 13941556Srgrimes } 13951556Srgrimes break; 13961556Srgrimes case CSQUOTE: 1397206145Sjilles USTPUTC(CTLQUOTEMARK, out); 1398206145Sjilles state[level].syntax = SQSYNTAX; 1399221513Sjilles sqiscstyle = 0; 14001556Srgrimes break; 14011556Srgrimes case CDQUOTE: 1402206145Sjilles USTPUTC(CTLQUOTEMARK, out); 1403206145Sjilles state[level].syntax = DQSYNTAX; 14041556Srgrimes break; 14051556Srgrimes case CENDQUOTE: 1406206145Sjilles if (eofmark != NULL && newvarnest == 0) 14071556Srgrimes USTPUTC(c, out); 1408206145Sjilles else { 1409214512Sjilles if (state[level].category == TSTATE_VAR_OLD) 1410214512Sjilles USTPUTC(CTLQUOTEEND, out); 1411214305Sjilles state[level].syntax = BASESYNTAX; 14121556Srgrimes quotef++; 14131556Srgrimes } 14141556Srgrimes break; 14151556Srgrimes case CVAR: /* '$' */ 14161556Srgrimes PARSESUB(); /* parse substitution */ 14171556Srgrimes break; 14181556Srgrimes case CENDVAR: /* '}' */ 1419206145Sjilles if (level > 0 && 1420214492Sjilles ((state[level].category == TSTATE_VAR_OLD && 1421214492Sjilles state[level].syntax == 1422214492Sjilles state[level - 1].syntax) || 1423214490Sjilles (state[level].category == TSTATE_VAR_NEW && 1424214490Sjilles state[level].syntax == BASESYNTAX))) { 1425214492Sjilles if (state[level].category == TSTATE_VAR_NEW) 1426206145Sjilles newvarnest--; 1427206145Sjilles level--; 14281556Srgrimes USTPUTC(CTLENDVAR, out); 14291556Srgrimes } else { 14301556Srgrimes USTPUTC(c, out); 14311556Srgrimes } 14321556Srgrimes break; 14331556Srgrimes case CLP: /* '(' in arithmetic */ 1434206145Sjilles state[level].parenlevel++; 14351556Srgrimes USTPUTC(c, out); 14361556Srgrimes break; 14371556Srgrimes case CRP: /* ')' in arithmetic */ 1438206145Sjilles if (state[level].parenlevel > 0) { 14391556Srgrimes USTPUTC(c, out); 1440206145Sjilles --state[level].parenlevel; 14411556Srgrimes } else { 14421556Srgrimes if (pgetc() == ')') { 1443206145Sjilles if (level > 0 && 1444206145Sjilles state[level].category == TSTATE_ARITH) { 1445206145Sjilles level--; 14461556Srgrimes USTPUTC(CTLENDARI, out); 14471556Srgrimes } else 14481556Srgrimes USTPUTC(')', out); 14491556Srgrimes } else { 14508855Srgrimes /* 14511556Srgrimes * unbalanced parens 14521556Srgrimes * (don't 2nd guess - no error) 14531556Srgrimes */ 14541556Srgrimes pungetc(); 14551556Srgrimes USTPUTC(')', out); 14561556Srgrimes } 14571556Srgrimes } 14581556Srgrimes break; 14591556Srgrimes case CBQUOTE: /* '`' */ 1460206145Sjilles out = parsebackq(out, &bqlist, 1, 1461206145Sjilles state[level].syntax == DQSYNTAX && 1462206145Sjilles (eofmark == NULL || newvarnest > 0), 1463206145Sjilles state[level].syntax == DQSYNTAX || state[level].syntax == ARISYNTAX); 14641556Srgrimes break; 14651556Srgrimes case CEOF: 14661556Srgrimes goto endword; /* exit outer loop */ 1467214305Sjilles case CIGN: 1468214305Sjilles break; 14691556Srgrimes default: 1470206145Sjilles if (level == 0) 14711556Srgrimes goto endword; /* exit outer loop */ 14721556Srgrimes USTPUTC(c, out); 14731556Srgrimes } 14741556Srgrimes c = pgetc_macro(); 14751556Srgrimes } 14761556Srgrimes } 14771556Srgrimesendword: 1478206145Sjilles if (state[level].syntax == ARISYNTAX) 14791556Srgrimes synerror("Missing '))'"); 1480206145Sjilles if (state[level].syntax != BASESYNTAX && eofmark == NULL) 14811556Srgrimes synerror("Unterminated quoted string"); 1482206145Sjilles if (state[level].category == TSTATE_VAR_OLD || 1483206145Sjilles state[level].category == TSTATE_VAR_NEW) { 14841556Srgrimes startlinno = plinno; 14851556Srgrimes synerror("Missing '}'"); 14861556Srgrimes } 1487206145Sjilles if (state != state_static) 1488206145Sjilles parser_temp_free_upto(state); 14891556Srgrimes USTPUTC('\0', out); 14901556Srgrimes len = out - stackblock(); 14911556Srgrimes out = stackblock(); 14921556Srgrimes if (eofmark == NULL) { 14931556Srgrimes if ((c == '>' || c == '<') 14941556Srgrimes && quotef == 0 14951556Srgrimes && len <= 2 14961556Srgrimes && (*out == '\0' || is_digit(*out))) { 14971556Srgrimes PARSEREDIR(); 14981556Srgrimes return lasttoken = TREDIR; 14991556Srgrimes } else { 15001556Srgrimes pungetc(); 15011556Srgrimes } 15021556Srgrimes } 15031556Srgrimes quoteflag = quotef; 15041556Srgrimes backquotelist = bqlist; 15051556Srgrimes grabstackblock(len); 15061556Srgrimes wordtext = out; 15071556Srgrimes return lasttoken = TWORD; 15081556Srgrimes/* end of readtoken routine */ 15091556Srgrimes 15101556Srgrimes 15111556Srgrimes/* 15121556Srgrimes * Check to see whether we are at the end of the here document. When this 15131556Srgrimes * is called, c is set to the first character of the next input line. If 15141556Srgrimes * we are at the end of the here document, this routine sets the c to PEOF. 15151556Srgrimes */ 15161556Srgrimes 15171556Srgrimescheckend: { 15181556Srgrimes if (eofmark) { 15191556Srgrimes if (striptabs) { 15201556Srgrimes while (c == '\t') 15211556Srgrimes c = pgetc(); 15221556Srgrimes } 15231556Srgrimes if (c == *eofmark) { 15241556Srgrimes if (pfgets(line, sizeof line) != NULL) { 1525248980Sjilles const char *p, *q; 15261556Srgrimes 15271556Srgrimes p = line; 15281556Srgrimes for (q = eofmark + 1 ; *q && *p == *q ; p++, q++); 1529222134Sjilles if ((*p == '\0' || *p == '\n') && *q == '\0') { 15301556Srgrimes c = PEOF; 1531222134Sjilles if (*p == '\n') { 1532222134Sjilles plinno++; 1533222134Sjilles needprompt = doprompt; 1534222134Sjilles } 15351556Srgrimes } else { 15361556Srgrimes pushstring(line, strlen(line), NULL); 15371556Srgrimes } 15381556Srgrimes } 15391556Srgrimes } 15401556Srgrimes } 15411556Srgrimes goto checkend_return; 15421556Srgrimes} 15431556Srgrimes 15441556Srgrimes 15451556Srgrimes/* 15461556Srgrimes * Parse a redirection operator. The variable "out" points to a string 15471556Srgrimes * specifying the fd to be redirected. The variable "c" contains the 15481556Srgrimes * first character of the redirection operator. 15491556Srgrimes */ 15501556Srgrimes 15511556Srgrimesparseredir: { 15521556Srgrimes char fd = *out; 15531556Srgrimes union node *np; 15541556Srgrimes 15551556Srgrimes np = (union node *)stalloc(sizeof (struct nfile)); 15561556Srgrimes if (c == '>') { 15571556Srgrimes np->nfile.fd = 1; 15581556Srgrimes c = pgetc(); 15591556Srgrimes if (c == '>') 15601556Srgrimes np->type = NAPPEND; 15611556Srgrimes else if (c == '&') 15621556Srgrimes np->type = NTOFD; 156396922Stjr else if (c == '|') 156496922Stjr np->type = NCLOBBER; 15651556Srgrimes else { 15661556Srgrimes np->type = NTO; 15671556Srgrimes pungetc(); 15681556Srgrimes } 15691556Srgrimes } else { /* c == '<' */ 15701556Srgrimes np->nfile.fd = 0; 15711556Srgrimes c = pgetc(); 15721556Srgrimes if (c == '<') { 15731556Srgrimes if (sizeof (struct nfile) != sizeof (struct nhere)) { 15741556Srgrimes np = (union node *)stalloc(sizeof (struct nhere)); 15751556Srgrimes np->nfile.fd = 0; 15761556Srgrimes } 15771556Srgrimes np->type = NHERE; 15781556Srgrimes heredoc = (struct heredoc *)stalloc(sizeof (struct heredoc)); 15791556Srgrimes heredoc->here = np; 15801556Srgrimes if ((c = pgetc()) == '-') { 15811556Srgrimes heredoc->striptabs = 1; 15821556Srgrimes } else { 15831556Srgrimes heredoc->striptabs = 0; 15841556Srgrimes pungetc(); 15851556Srgrimes } 15861556Srgrimes } else if (c == '&') 15871556Srgrimes np->type = NFROMFD; 158866612Sbrian else if (c == '>') 158966612Sbrian np->type = NFROMTO; 15901556Srgrimes else { 15911556Srgrimes np->type = NFROM; 15921556Srgrimes pungetc(); 15931556Srgrimes } 15941556Srgrimes } 15951556Srgrimes if (fd != '\0') 15961556Srgrimes np->nfile.fd = digit_val(fd); 15971556Srgrimes redirnode = np; 15981556Srgrimes goto parseredir_return; 15991556Srgrimes} 16001556Srgrimes 16011556Srgrimes 16021556Srgrimes/* 16031556Srgrimes * Parse a substitution. At this point, we have read the dollar sign 16041556Srgrimes * and nothing else. 16051556Srgrimes */ 16061556Srgrimes 16071556Srgrimesparsesub: { 1608179022Sstefanf char buf[10]; 16091556Srgrimes int subtype; 16101556Srgrimes int typeloc; 16111556Srgrimes int flags; 16121556Srgrimes char *p; 16131556Srgrimes static const char types[] = "}-+?="; 1614179022Sstefanf int bracketed_name = 0; /* used to handle ${[0-9]*} variables */ 1615179022Sstefanf int linno; 1616179387Sstefanf int length; 1617219623Sjilles int c1; 16181556Srgrimes 16191556Srgrimes c = pgetc(); 1620221513Sjilles if (c == '(') { /* $(command) or $((arith)) */ 16211556Srgrimes if (pgetc() == '(') { 16221556Srgrimes PARSEARITH(); 16231556Srgrimes } else { 16241556Srgrimes pungetc(); 1625206145Sjilles out = parsebackq(out, &bqlist, 0, 1626206145Sjilles state[level].syntax == DQSYNTAX && 1627206145Sjilles (eofmark == NULL || newvarnest > 0), 1628206145Sjilles state[level].syntax == DQSYNTAX || 1629206145Sjilles state[level].syntax == ARISYNTAX); 16301556Srgrimes } 1631221513Sjilles } else if (c == '{' || is_name(c) || is_special(c)) { 16321556Srgrimes USTPUTC(CTLVAR, out); 16331556Srgrimes typeloc = out - stackblock(); 16341556Srgrimes USTPUTC(VSNORMAL, out); 16351556Srgrimes subtype = VSNORMAL; 1636179022Sstefanf flags = 0; 16371556Srgrimes if (c == '{') { 163818202Speter bracketed_name = 1; 16391556Srgrimes c = pgetc(); 1640219623Sjilles subtype = 0; 16411556Srgrimes } 1642219623Sjillesvarname: 1643149026Sstefanf if (!is_eof(c) && is_name(c)) { 1644179387Sstefanf length = 0; 16451556Srgrimes do { 16461556Srgrimes STPUTC(c, out); 16471556Srgrimes c = pgetc(); 1648179387Sstefanf length++; 1649149026Sstefanf } while (!is_eof(c) && is_in_name(c)); 1650179387Sstefanf if (length == 6 && 1651179387Sstefanf strncmp(out - length, "LINENO", length) == 0) { 1652179022Sstefanf /* Replace the variable name with the 1653179022Sstefanf * current line number. */ 1654179022Sstefanf linno = plinno; 1655179022Sstefanf if (funclinno != 0) 1656179022Sstefanf linno -= funclinno - 1; 1657179022Sstefanf snprintf(buf, sizeof(buf), "%d", linno); 1658179022Sstefanf STADJUST(-6, out); 1659215783Sjilles STPUTS(buf, out); 1660179022Sstefanf flags |= VSLINENO; 1661179022Sstefanf } 166218202Speter } else if (is_digit(c)) { 166318202Speter if (bracketed_name) { 166418202Speter do { 166518202Speter STPUTC(c, out); 166618202Speter c = pgetc(); 166718202Speter } while (is_digit(c)); 166818202Speter } else { 166918202Speter STPUTC(c, out); 167018202Speter c = pgetc(); 167118202Speter } 1672219623Sjilles } else if (is_special(c)) { 1673219623Sjilles c1 = c; 1674219623Sjilles c = pgetc(); 1675219623Sjilles if (subtype == 0 && c1 == '#') { 1676219623Sjilles subtype = VSLENGTH; 1677219623Sjilles if (strchr(types, c) == NULL && c != ':' && 1678219623Sjilles c != '#' && c != '%') 1679219623Sjilles goto varname; 1680219623Sjilles c1 = c; 1681219623Sjilles c = pgetc(); 1682219623Sjilles if (c1 != '}' && c == '}') { 1683219623Sjilles pungetc(); 1684219623Sjilles c = c1; 1685219623Sjilles goto varname; 1686219623Sjilles } 1687219623Sjilles pungetc(); 1688219623Sjilles c = c1; 1689219623Sjilles c1 = '#'; 1690219623Sjilles subtype = 0; 1691219623Sjilles } 1692219623Sjilles USTPUTC(c1, out); 16931556Srgrimes } else { 1694219623Sjilles subtype = VSERROR; 1695219623Sjilles if (c == '}') 1696219623Sjilles pungetc(); 1697219623Sjilles else if (c == '\n' || c == PEOF) 1698219623Sjilles synerror("Unexpected end of line in substitution"); 1699219623Sjilles else 1700164003Sstefanf USTPUTC(c, out); 17011556Srgrimes } 17021556Srgrimes if (subtype == 0) { 170317987Speter switch (c) { 170417987Speter case ':': 1705179022Sstefanf flags |= VSNUL; 17061556Srgrimes c = pgetc(); 170717987Speter /*FALLTHROUGH*/ 170817987Speter default: 170917987Speter p = strchr(types, c); 1710164003Sstefanf if (p == NULL) { 1711206144Sjilles if (c == '\n' || c == PEOF) 1712206144Sjilles synerror("Unexpected end of line in substitution"); 1713164003Sstefanf if (flags == VSNUL) 1714164003Sstefanf STPUTC(':', out); 1715164003Sstefanf STPUTC(c, out); 1716164003Sstefanf subtype = VSERROR; 1717164003Sstefanf } else 1718164003Sstefanf subtype = p - types + VSNORMAL; 171917987Speter break; 172017987Speter case '%': 172120425Ssteve case '#': 172217987Speter { 172317987Speter int cc = c; 172417987Speter subtype = c == '#' ? VSTRIMLEFT : 172517987Speter VSTRIMRIGHT; 172617987Speter c = pgetc(); 172717987Speter if (c == cc) 172817987Speter subtype++; 172917987Speter else 173017987Speter pungetc(); 173117987Speter break; 173217987Speter } 17331556Srgrimes } 1734164003Sstefanf } else if (subtype != VSERROR) { 1735221461Sjilles if (subtype == VSLENGTH && c != '}') 1736221461Sjilles subtype = VSERROR; 17371556Srgrimes pungetc(); 17381556Srgrimes } 1739164003Sstefanf STPUTC('=', out); 1740220903Sjilles if (state[level].syntax == DQSYNTAX || 1741220903Sjilles state[level].syntax == ARISYNTAX) 17421556Srgrimes flags |= VSQUOTE; 17431556Srgrimes *(stackblock() + typeloc) = subtype | flags; 1744206145Sjilles if (subtype != VSNORMAL) { 1745206145Sjilles if (level + 1 >= maxnest) { 1746206145Sjilles maxnest *= 2; 1747206145Sjilles if (state == state_static) { 1748206145Sjilles state = parser_temp_alloc( 1749206145Sjilles maxnest * sizeof(*state)); 1750206145Sjilles memcpy(state, state_static, 1751213811Sobrien MAXNEST_static * sizeof(*state)); 1752206145Sjilles } else 1753206145Sjilles state = parser_temp_realloc(state, 1754206145Sjilles maxnest * sizeof(*state)); 1755206145Sjilles } 1756206145Sjilles level++; 1757206145Sjilles state[level].parenlevel = 0; 1758206145Sjilles if (subtype == VSMINUS || subtype == VSPLUS || 1759206145Sjilles subtype == VSQUESTION || subtype == VSASSIGN) { 1760206145Sjilles /* 1761206145Sjilles * For operators that were in the Bourne shell, 1762206145Sjilles * inherit the double-quote state. 1763206145Sjilles */ 1764206145Sjilles state[level].syntax = state[level - 1].syntax; 1765206145Sjilles state[level].category = TSTATE_VAR_OLD; 1766206145Sjilles } else { 1767206145Sjilles /* 1768206145Sjilles * The other operators take a pattern, 1769206145Sjilles * so go to BASESYNTAX. 1770206145Sjilles * Also, ' and " are now special, even 1771206145Sjilles * in here documents. 1772206145Sjilles */ 1773206145Sjilles state[level].syntax = BASESYNTAX; 1774206145Sjilles state[level].category = TSTATE_VAR_NEW; 1775206145Sjilles newvarnest++; 1776206145Sjilles } 1777206145Sjilles } 1778221513Sjilles } else if (c == '\'' && state[level].syntax == BASESYNTAX) { 1779221513Sjilles /* $'cstylequotes' */ 1780221513Sjilles USTPUTC(CTLQUOTEMARK, out); 1781221513Sjilles state[level].syntax = SQSYNTAX; 1782221513Sjilles sqiscstyle = 1; 1783221513Sjilles } else { 1784221513Sjilles USTPUTC('$', out); 1785221513Sjilles pungetc(); 17861556Srgrimes } 17871556Srgrimes goto parsesub_return; 17881556Srgrimes} 17891556Srgrimes 17901556Srgrimes 17911556Srgrimes/* 17921556Srgrimes * Parse an arithmetic expansion (indicate start of one and set state) 17931556Srgrimes */ 17941556Srgrimesparsearith: { 17951556Srgrimes 1796206145Sjilles if (level + 1 >= maxnest) { 1797206145Sjilles maxnest *= 2; 1798206145Sjilles if (state == state_static) { 1799206145Sjilles state = parser_temp_alloc( 1800206145Sjilles maxnest * sizeof(*state)); 1801206145Sjilles memcpy(state, state_static, 1802213811Sobrien MAXNEST_static * sizeof(*state)); 1803206145Sjilles } else 1804206145Sjilles state = parser_temp_realloc(state, 1805206145Sjilles maxnest * sizeof(*state)); 18061556Srgrimes } 1807206145Sjilles level++; 1808206145Sjilles state[level].syntax = ARISYNTAX; 1809206145Sjilles state[level].parenlevel = 0; 1810206145Sjilles state[level].category = TSTATE_ARITH; 1811206145Sjilles USTPUTC(CTLARI, out); 1812206145Sjilles if (state[level - 1].syntax == DQSYNTAX) 1813206145Sjilles USTPUTC('"',out); 1814206145Sjilles else 1815206145Sjilles USTPUTC(' ',out); 18161556Srgrimes goto parsearith_return; 18171556Srgrimes} 18181556Srgrimes 18191556Srgrimes} /* end of readtoken */ 18201556Srgrimes 18211556Srgrimes 18221556Srgrimes/* 18231556Srgrimes * Returns true if the text contains nothing to expand (no dollar signs 18241556Srgrimes * or backquotes). 18251556Srgrimes */ 18261556Srgrimes 1827213811Sobrienstatic int 182890111Simpnoexpand(char *text) 182990111Simp{ 183025230Ssteve char *p; 183125230Ssteve char c; 18321556Srgrimes 18331556Srgrimes p = text; 18341556Srgrimes while ((c = *p++) != '\0') { 183539137Stegge if ( c == CTLQUOTEMARK) 183639137Stegge continue; 18371556Srgrimes if (c == CTLESC) 18381556Srgrimes p++; 183983675Stegge else if (BASESYNTAX[(int)c] == CCTL) 18401556Srgrimes return 0; 18411556Srgrimes } 18421556Srgrimes return 1; 18431556Srgrimes} 18441556Srgrimes 18451556Srgrimes 18461556Srgrimes/* 18471556Srgrimes * Return true if the argument is a legal variable name (a letter or 18481556Srgrimes * underscore followed by zero or more letters, underscores, and digits). 18491556Srgrimes */ 18501556Srgrimes 18511556Srgrimesint 1852200956Sjillesgoodname(const char *name) 185390111Simp{ 1854200956Sjilles const char *p; 18551556Srgrimes 18561556Srgrimes p = name; 18571556Srgrimes if (! is_name(*p)) 18581556Srgrimes return 0; 18591556Srgrimes while (*++p) { 18601556Srgrimes if (! is_in_name(*p)) 18611556Srgrimes return 0; 18621556Srgrimes } 18631556Srgrimes return 1; 18641556Srgrimes} 18651556Srgrimes 18661556Srgrimes 1867222165Sjillesint 1868222165Sjillesisassignment(const char *p) 1869222165Sjilles{ 1870222165Sjilles if (!is_name(*p)) 1871222165Sjilles return 0; 1872222165Sjilles p++; 1873222165Sjilles for (;;) { 1874222165Sjilles if (*p == '=') 1875222165Sjilles return 1; 1876222165Sjilles else if (!is_in_name(*p)) 1877222165Sjilles return 0; 1878222165Sjilles p++; 1879222165Sjilles } 1880222165Sjilles} 1881222165Sjilles 1882222165Sjilles 18831556Srgrimes/* 18841556Srgrimes * Called when an unexpected token is read during the parse. The argument 18851556Srgrimes * is the token that is expected, or -1 if more than one type of token can 18861556Srgrimes * occur at this point. 18871556Srgrimes */ 18881556Srgrimes 1889213811Sobrienstatic void 189090111Simpsynexpect(int token) 189117987Speter{ 18921556Srgrimes char msg[64]; 18931556Srgrimes 18941556Srgrimes if (token >= 0) { 18951556Srgrimes fmtstr(msg, 64, "%s unexpected (expecting %s)", 18961556Srgrimes tokname[lasttoken], tokname[token]); 18971556Srgrimes } else { 18981556Srgrimes fmtstr(msg, 64, "%s unexpected", tokname[lasttoken]); 18991556Srgrimes } 19001556Srgrimes synerror(msg); 19011556Srgrimes} 19021556Srgrimes 19031556Srgrimes 1904213811Sobrienstatic void 1905201053Sjillessynerror(const char *msg) 190690111Simp{ 19071556Srgrimes if (commandname) 1908201366Sjilles outfmt(out2, "%s: %d: ", commandname, startlinno); 1909201366Sjilles outfmt(out2, "Syntax error: %s\n", msg); 19101556Srgrimes error((char *)NULL); 19111556Srgrimes} 19121556Srgrimes 1913213811Sobrienstatic void 191490111Simpsetprompt(int which) 191590111Simp{ 19161556Srgrimes whichprompt = which; 19171556Srgrimes 191817987Speter#ifndef NO_HISTORY 19191556Srgrimes if (!el) 192017987Speter#endif 1921199629Sjilles { 19221556Srgrimes out2str(getprompt(NULL)); 1923199629Sjilles flushout(out2); 1924199629Sjilles } 19251556Srgrimes} 19261556Srgrimes 19271556Srgrimes/* 19281556Srgrimes * called by editline -- any expansions to the prompt 19291556Srgrimes * should be added here. 19301556Srgrimes */ 19311556Srgrimeschar * 193290111Simpgetprompt(void *unused __unused) 193325905Ssteve{ 1934142845Sobrien static char ps[PROMPTLEN]; 1935142845Sobrien char *fmt; 1936209653Sjilles const char *pwd; 1937209653Sjilles int i, trim; 1938214538Sjilles static char internal_error[] = "??"; 1939142845Sobrien 1940142845Sobrien /* 1941142845Sobrien * Select prompt format. 1942142845Sobrien */ 19431556Srgrimes switch (whichprompt) { 19441556Srgrimes case 0: 1945201053Sjilles fmt = nullstr; 1946142845Sobrien break; 19471556Srgrimes case 1: 1948142845Sobrien fmt = ps1val(); 1949142845Sobrien break; 19501556Srgrimes case 2: 1951142845Sobrien fmt = ps2val(); 1952142845Sobrien break; 19531556Srgrimes default: 1954201053Sjilles return internal_error; 19551556Srgrimes } 1956142845Sobrien 1957142845Sobrien /* 1958142845Sobrien * Format prompt string. 1959142845Sobrien */ 1960142845Sobrien for (i = 0; (i < 127) && (*fmt != '\0'); i++, fmt++) 1961142845Sobrien if (*fmt == '\\') 1962142845Sobrien switch (*++fmt) { 1963142845Sobrien 1964142845Sobrien /* 1965142845Sobrien * Hostname. 1966142845Sobrien * 1967142845Sobrien * \h specifies just the local hostname, 1968142845Sobrien * \H specifies fully-qualified hostname. 1969142845Sobrien */ 1970142845Sobrien case 'h': 1971142845Sobrien case 'H': 1972149024Sstefanf ps[i] = '\0'; 1973142845Sobrien gethostname(&ps[i], PROMPTLEN - i); 1974142845Sobrien /* Skip to end of hostname. */ 1975142845Sobrien trim = (*fmt == 'h') ? '.' : '\0'; 1976142845Sobrien while ((ps[i+1] != '\0') && (ps[i+1] != trim)) 1977142845Sobrien i++; 1978142845Sobrien break; 1979142845Sobrien 1980142845Sobrien /* 1981142845Sobrien * Working directory. 1982142845Sobrien * 1983142845Sobrien * \W specifies just the final component, 1984142845Sobrien * \w specifies the entire path. 1985142845Sobrien */ 1986142845Sobrien case 'W': 1987142845Sobrien case 'w': 1988209653Sjilles pwd = lookupvar("PWD"); 1989209653Sjilles if (pwd == NULL) 1990209653Sjilles pwd = "?"; 1991209653Sjilles if (*fmt == 'W' && 1992209653Sjilles *pwd == '/' && pwd[1] != '\0') 1993209653Sjilles strlcpy(&ps[i], strrchr(pwd, '/') + 1, 1994209653Sjilles PROMPTLEN - i); 1995209653Sjilles else 1996209653Sjilles strlcpy(&ps[i], pwd, PROMPTLEN - i); 1997142845Sobrien /* Skip to end of path. */ 1998142845Sobrien while (ps[i + 1] != '\0') 1999142845Sobrien i++; 2000142845Sobrien break; 2001142845Sobrien 2002142845Sobrien /* 2003142845Sobrien * Superuser status. 2004142845Sobrien * 2005142845Sobrien * '$' for normal users, '#' for root. 2006142845Sobrien */ 2007142845Sobrien case '$': 2008142845Sobrien ps[i] = (geteuid() != 0) ? '$' : '#'; 2009142845Sobrien break; 2010142845Sobrien 2011142845Sobrien /* 2012142845Sobrien * A literal \. 2013142845Sobrien */ 2014142845Sobrien case '\\': 2015142845Sobrien ps[i] = '\\'; 2016142845Sobrien break; 2017142845Sobrien 2018142845Sobrien /* 2019142845Sobrien * Emit unrecognized formats verbatim. 2020142845Sobrien */ 2021142845Sobrien default: 2022142845Sobrien ps[i++] = '\\'; 2023142845Sobrien ps[i] = *fmt; 2024142845Sobrien break; 2025142845Sobrien } 2026142845Sobrien else 2027142845Sobrien ps[i] = *fmt; 2028142845Sobrien ps[i] = '\0'; 2029142845Sobrien return (ps); 20301556Srgrimes} 2031222907Sjilles 2032222907Sjilles 2033222907Sjillesconst char * 2034248980Sjillesexpandstr(const char *ps) 2035222907Sjilles{ 2036222907Sjilles union node n; 2037222907Sjilles struct jmploc jmploc; 2038222907Sjilles struct jmploc *const savehandler = handler; 2039222907Sjilles const int saveprompt = doprompt; 2040222907Sjilles struct parsefile *const savetopfile = getcurrentfile(); 2041222907Sjilles struct parser_temp *const saveparser_temp = parser_temp; 2042222907Sjilles const char *result = NULL; 2043222907Sjilles 2044222907Sjilles if (!setjmp(jmploc.loc)) { 2045222907Sjilles handler = &jmploc; 2046222907Sjilles parser_temp = NULL; 2047222907Sjilles setinputstring(ps, 1); 2048222907Sjilles doprompt = 0; 2049222907Sjilles readtoken1(pgetc(), DQSYNTAX, "\n\n", 0); 2050222907Sjilles if (backquotelist != NULL) 2051222907Sjilles error("Command substitution not allowed here"); 2052222907Sjilles 2053222907Sjilles n.narg.type = NARG; 2054222907Sjilles n.narg.next = NULL; 2055222907Sjilles n.narg.text = wordtext; 2056222907Sjilles n.narg.backquote = backquotelist; 2057222907Sjilles 2058222907Sjilles expandarg(&n, NULL, 0); 2059222907Sjilles result = stackblock(); 2060222907Sjilles INTOFF; 2061222907Sjilles } 2062222907Sjilles handler = savehandler; 2063222907Sjilles doprompt = saveprompt; 2064222907Sjilles popfilesupto(savetopfile); 2065222907Sjilles if (parser_temp != saveparser_temp) { 2066222907Sjilles parser_temp_free_all(); 2067222907Sjilles parser_temp = saveparser_temp; 2068222907Sjilles } 2069222907Sjilles if (result != NULL) { 2070222907Sjilles INTON; 2071222907Sjilles } else if (exception == EXINT) 2072222907Sjilles raise(SIGINT); 2073222907Sjilles return result; 2074222907Sjilles} 2075