mirror of
https://git.FreeBSD.org/src.git
synced 2024-12-03 09:00:21 +00:00
3c28a656f2
This addresses one known problem in the PR database. PR: 13921 Reported by: Jin Guojun <j_guojun@lbl.gov>
1802 lines
45 KiB
C
1802 lines
45 KiB
C
/*
|
|
* eval.c - gawk parse tree interpreter
|
|
*/
|
|
|
|
/*
|
|
* Copyright (C) 1986, 1988, 1989, 1991-2000 the Free Software Foundation, Inc.
|
|
*
|
|
* This file is part of GAWK, the GNU implementation of the
|
|
* AWK Programming Language.
|
|
*
|
|
* GAWK is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* GAWK is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA
|
|
*
|
|
* $FreeBSD$
|
|
*/
|
|
|
|
#include "awk.h"
|
|
|
|
extern double pow P((double x, double y));
|
|
extern double modf P((double x, double *yp));
|
|
extern double fmod P((double x, double y));
|
|
|
|
static int eval_condition P((NODE *tree));
|
|
static NODE *op_assign P((NODE *tree));
|
|
static NODE *func_call P((NODE *name, NODE *arg_list));
|
|
static NODE *match_op P((NODE *tree));
|
|
static void push_args P((int count, NODE *arglist, NODE **oldstack, char *func_name));
|
|
static void pop_fcall_stack P((void));
|
|
static void pop_fcall P((void));
|
|
static int in_function P((void));
|
|
char *nodetype2str P((NODETYPE type));
|
|
char *flags2str P((int flagval));
|
|
|
|
#if __GNUC__ < 2
|
|
NODE *_t; /* used as a temporary in macros */
|
|
#endif
|
|
#ifdef MSDOS
|
|
double _msc51bug; /* to get around a bug in MSC 5.1 */
|
|
#endif
|
|
NODE *ret_node;
|
|
int OFSlen;
|
|
int ORSlen;
|
|
int OFMTidx;
|
|
int CONVFMTidx;
|
|
|
|
/* Macros and variables to save and restore function and loop bindings */
|
|
/*
|
|
* the val variable allows return/continue/break-out-of-context to be
|
|
* caught and diagnosed
|
|
*/
|
|
#define PUSH_BINDING(stack, x, val) (memcpy((char *)(stack), (char *)(x), sizeof(jmp_buf)), val++)
|
|
#define RESTORE_BINDING(stack, x, val) (memcpy((char *)(x), (char *)(stack), sizeof(jmp_buf)), val--)
|
|
|
|
static jmp_buf loop_tag; /* always the current binding */
|
|
static int loop_tag_valid = FALSE; /* nonzero when loop_tag valid */
|
|
static int func_tag_valid = FALSE;
|
|
static jmp_buf func_tag;
|
|
extern int exiting, exit_val;
|
|
|
|
/* This rather ugly macro is for VMS C */
|
|
#ifdef C
|
|
#undef C
|
|
#endif
|
|
#define C(c) ((char)c)
|
|
/*
|
|
* This table is used by the regexp routines to do case independant
|
|
* matching. Basically, every ascii character maps to itself, except
|
|
* uppercase letters map to lower case ones. This table has 256
|
|
* entries, for ISO 8859-1. Note also that if the system this
|
|
* is compiled on doesn't use 7-bit ascii, casetable[] should not be
|
|
* defined to the linker, so gawk should not load.
|
|
*
|
|
* Do NOT make this array static, it is used in several spots, not
|
|
* just in this file.
|
|
*/
|
|
#if 'a' == 97 /* it's ascii */
|
|
char casetable[] = {
|
|
'\000', '\001', '\002', '\003', '\004', '\005', '\006', '\007',
|
|
'\010', '\011', '\012', '\013', '\014', '\015', '\016', '\017',
|
|
'\020', '\021', '\022', '\023', '\024', '\025', '\026', '\027',
|
|
'\030', '\031', '\032', '\033', '\034', '\035', '\036', '\037',
|
|
/* ' ' '!' '"' '#' '$' '%' '&' ''' */
|
|
'\040', '\041', '\042', '\043', '\044', '\045', '\046', '\047',
|
|
/* '(' ')' '*' '+' ',' '-' '.' '/' */
|
|
'\050', '\051', '\052', '\053', '\054', '\055', '\056', '\057',
|
|
/* '0' '1' '2' '3' '4' '5' '6' '7' */
|
|
'\060', '\061', '\062', '\063', '\064', '\065', '\066', '\067',
|
|
/* '8' '9' ':' ';' '<' '=' '>' '?' */
|
|
'\070', '\071', '\072', '\073', '\074', '\075', '\076', '\077',
|
|
/* '@' 'A' 'B' 'C' 'D' 'E' 'F' 'G' */
|
|
'\100', '\141', '\142', '\143', '\144', '\145', '\146', '\147',
|
|
/* 'H' 'I' 'J' 'K' 'L' 'M' 'N' 'O' */
|
|
'\150', '\151', '\152', '\153', '\154', '\155', '\156', '\157',
|
|
/* 'P' 'Q' 'R' 'S' 'T' 'U' 'V' 'W' */
|
|
'\160', '\161', '\162', '\163', '\164', '\165', '\166', '\167',
|
|
/* 'X' 'Y' 'Z' '[' '\' ']' '^' '_' */
|
|
'\170', '\171', '\172', '\133', '\134', '\135', '\136', '\137',
|
|
/* '`' 'a' 'b' 'c' 'd' 'e' 'f' 'g' */
|
|
'\140', '\141', '\142', '\143', '\144', '\145', '\146', '\147',
|
|
/* 'h' 'i' 'j' 'k' 'l' 'm' 'n' 'o' */
|
|
'\150', '\151', '\152', '\153', '\154', '\155', '\156', '\157',
|
|
/* 'p' 'q' 'r' 's' 't' 'u' 'v' 'w' */
|
|
'\160', '\161', '\162', '\163', '\164', '\165', '\166', '\167',
|
|
/* 'x' 'y' 'z' '{' '|' '}' '~' */
|
|
'\170', '\171', '\172', '\173', '\174', '\175', '\176', '\177',
|
|
#ifndef USE_PURE_ASCII
|
|
C('\200'), C('\201'), C('\202'), C('\203'), C('\204'), C('\205'), C('\206'), C('\207'),
|
|
C('\210'), C('\211'), C('\212'), C('\213'), C('\214'), C('\215'), C('\216'), C('\217'),
|
|
C('\220'), C('\221'), C('\222'), C('\223'), C('\224'), C('\225'), C('\226'), C('\227'),
|
|
C('\230'), C('\231'), C('\232'), C('\233'), C('\234'), C('\235'), C('\236'), C('\237'),
|
|
C('\240'), C('\241'), C('\242'), C('\243'), C('\244'), C('\245'), C('\246'), C('\247'),
|
|
C('\250'), C('\251'), C('\252'), C('\253'), C('\254'), C('\255'), C('\256'), C('\257'),
|
|
C('\260'), C('\261'), C('\262'), C('\263'), C('\264'), C('\265'), C('\266'), C('\267'),
|
|
C('\270'), C('\271'), C('\272'), C('\273'), C('\274'), C('\275'), C('\276'), C('\277'),
|
|
C('\340'), C('\341'), C('\342'), C('\343'), C('\344'), C('\345'), C('\346'), C('\347'),
|
|
C('\350'), C('\351'), C('\352'), C('\353'), C('\354'), C('\355'), C('\356'), C('\357'),
|
|
C('\360'), C('\361'), C('\362'), C('\363'), C('\364'), C('\365'), C('\366'), C('\327'),
|
|
C('\370'), C('\371'), C('\372'), C('\373'), C('\374'), C('\375'), C('\376'), C('\337'),
|
|
C('\340'), C('\341'), C('\342'), C('\343'), C('\344'), C('\345'), C('\346'), C('\347'),
|
|
C('\350'), C('\351'), C('\352'), C('\353'), C('\354'), C('\355'), C('\356'), C('\357'),
|
|
C('\360'), C('\361'), C('\362'), C('\363'), C('\364'), C('\365'), C('\366'), C('\367'),
|
|
C('\370'), C('\371'), C('\372'), C('\373'), C('\374'), C('\375'), C('\376'), C('\377'),
|
|
#else
|
|
C('\200'), C('\201'), C('\202'), C('\203'), C('\204'), C('\205'), C('\206'), C('\207'),
|
|
C('\210'), C('\211'), C('\212'), C('\213'), C('\214'), C('\215'), C('\216'), C('\217'),
|
|
C('\220'), C('\221'), C('\222'), C('\223'), C('\224'), C('\225'), C('\226'), C('\227'),
|
|
C('\230'), C('\231'), C('\232'), C('\233'), C('\234'), C('\235'), C('\236'), C('\237'),
|
|
C('\240'), C('\241'), C('\242'), C('\243'), C('\244'), C('\245'), C('\246'), C('\247'),
|
|
C('\250'), C('\251'), C('\252'), C('\253'), C('\254'), C('\255'), C('\256'), C('\257'),
|
|
C('\260'), C('\261'), C('\262'), C('\263'), C('\264'), C('\265'), C('\266'), C('\267'),
|
|
C('\270'), C('\271'), C('\272'), C('\273'), C('\274'), C('\275'), C('\276'), C('\277'),
|
|
C('\300'), C('\301'), C('\302'), C('\303'), C('\304'), C('\305'), C('\306'), C('\307'),
|
|
C('\310'), C('\311'), C('\312'), C('\313'), C('\314'), C('\315'), C('\316'), C('\317'),
|
|
C('\320'), C('\321'), C('\322'), C('\323'), C('\324'), C('\325'), C('\326'), C('\327'),
|
|
C('\330'), C('\331'), C('\332'), C('\333'), C('\334'), C('\335'), C('\336'), C('\337'),
|
|
C('\340'), C('\341'), C('\342'), C('\343'), C('\344'), C('\345'), C('\346'), C('\347'),
|
|
C('\350'), C('\351'), C('\352'), C('\353'), C('\354'), C('\355'), C('\356'), C('\357'),
|
|
C('\360'), C('\361'), C('\362'), C('\363'), C('\364'), C('\365'), C('\366'), C('\367'),
|
|
C('\370'), C('\371'), C('\372'), C('\373'), C('\374'), C('\375'), C('\376'), C('\377'),
|
|
#endif
|
|
};
|
|
#else
|
|
#include "You lose. You will need a translation table for your character set."
|
|
#endif
|
|
|
|
#undef C
|
|
|
|
/*
|
|
* This table maps node types to strings for debugging.
|
|
* KEEP IN SYNC WITH awk.h!!!!
|
|
*/
|
|
static char *nodetypes[] = {
|
|
"Node_illegal",
|
|
"Node_times",
|
|
"Node_quotient",
|
|
"Node_mod",
|
|
"Node_plus",
|
|
"Node_minus",
|
|
"Node_cond_pair",
|
|
"Node_subscript",
|
|
"Node_concat",
|
|
"Node_exp",
|
|
"Node_preincrement",
|
|
"Node_predecrement",
|
|
"Node_postincrement",
|
|
"Node_postdecrement",
|
|
"Node_unary_minus",
|
|
"Node_field_spec",
|
|
"Node_assign",
|
|
"Node_assign_times",
|
|
"Node_assign_quotient",
|
|
"Node_assign_mod",
|
|
"Node_assign_plus",
|
|
"Node_assign_minus",
|
|
"Node_assign_exp",
|
|
"Node_and",
|
|
"Node_or",
|
|
"Node_equal",
|
|
"Node_notequal",
|
|
"Node_less",
|
|
"Node_greater",
|
|
"Node_leq",
|
|
"Node_geq",
|
|
"Node_match",
|
|
"Node_nomatch",
|
|
"Node_not",
|
|
"Node_rule_list",
|
|
"Node_rule_node",
|
|
"Node_statement_list",
|
|
"Node_if_branches",
|
|
"Node_expression_list",
|
|
"Node_param_list",
|
|
"Node_K_if",
|
|
"Node_K_while",
|
|
"Node_K_for",
|
|
"Node_K_arrayfor",
|
|
"Node_K_break",
|
|
"Node_K_continue",
|
|
"Node_K_print",
|
|
"Node_K_printf",
|
|
"Node_K_next",
|
|
"Node_K_exit",
|
|
"Node_K_do",
|
|
"Node_K_return",
|
|
"Node_K_delete",
|
|
"Node_K_delete_loop",
|
|
"Node_K_getline",
|
|
"Node_K_function",
|
|
"Node_K_nextfile",
|
|
"Node_redirect_output",
|
|
"Node_redirect_append",
|
|
"Node_redirect_pipe",
|
|
"Node_redirect_pipein",
|
|
"Node_redirect_input",
|
|
"Node_var",
|
|
"Node_var_array",
|
|
"Node_val",
|
|
"Node_builtin",
|
|
"Node_line_range",
|
|
"Node_in_array",
|
|
"Node_func",
|
|
"Node_func_call",
|
|
"Node_cond_exp",
|
|
"Node_regex",
|
|
"Node_hashnode",
|
|
"Node_ahash",
|
|
"Node_array_ref",
|
|
"Node_NF",
|
|
"Node_NR",
|
|
"Node_FNR",
|
|
"Node_FS",
|
|
"Node_RS",
|
|
"Node_FIELDWIDTHS",
|
|
"Node_IGNORECASE",
|
|
"Node_OFS",
|
|
"Node_ORS",
|
|
"Node_OFMT",
|
|
"Node_CONVFMT",
|
|
"Node_final",
|
|
NULL
|
|
};
|
|
|
|
char *
|
|
nodetype2str(type)
|
|
NODETYPE type;
|
|
{
|
|
static char buf[40];
|
|
|
|
if (type >= Node_illegal && type <= Node_final)
|
|
return nodetypes[(int) type];
|
|
|
|
sprintf(buf, "unknown nodetype %d", (int) type);
|
|
return buf;
|
|
}
|
|
|
|
/* flags2str --- make a flags value readable */
|
|
|
|
char *
|
|
flags2str(flagval)
|
|
int flagval;
|
|
{
|
|
static char buffer[BUFSIZ];
|
|
char *sp;
|
|
|
|
sp = buffer;
|
|
|
|
if (flagval & MALLOC) {
|
|
strcpy(sp, "MALLOC");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & TEMP) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "TEMP");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & PERM) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "PERM");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & STRING) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "STRING");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & STR) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "STR");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & NUM) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "NUM");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & NUMBER) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "NUMBER");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & MAYBE_NUM) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "MAYBE_NUM");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & ARRAYMAXED) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "ARRAYMAXED");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & SCALAR) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "SCALAR");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & FUNC) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "FUNC");
|
|
sp += strlen(sp);
|
|
}
|
|
if (flagval & FIELD) {
|
|
if (sp != buffer)
|
|
*sp++ = '|';
|
|
strcpy(sp, "FIELD");
|
|
sp += strlen(sp);
|
|
}
|
|
|
|
return buffer;
|
|
}
|
|
|
|
/*
|
|
* interpret:
|
|
* Tree is a bunch of rules to run. Returns zero if it hit an exit()
|
|
* statement
|
|
*/
|
|
int
|
|
interpret(tree)
|
|
register NODE *volatile tree;
|
|
{
|
|
jmp_buf volatile loop_tag_stack; /* shallow binding stack for loop_tag */
|
|
static jmp_buf rule_tag; /* tag the rule currently being run, for NEXT
|
|
* and EXIT statements. It is static because
|
|
* there are no nested rules */
|
|
register NODE *volatile t = NULL; /* temporary */
|
|
NODE **volatile lhs; /* lhs == Left Hand Side for assigns, etc */
|
|
NODE *volatile stable_tree;
|
|
int volatile traverse = TRUE; /* True => loop thru tree (Node_rule_list) */
|
|
|
|
/* avoid false source indications */
|
|
source = NULL;
|
|
sourceline = 0;
|
|
|
|
if (tree == NULL)
|
|
return 1;
|
|
sourceline = tree->source_line;
|
|
source = tree->source_file;
|
|
switch (tree->type) {
|
|
case Node_rule_node:
|
|
traverse = FALSE; /* False => one for-loop iteration only */
|
|
/* FALL THROUGH */
|
|
case Node_rule_list:
|
|
for (t = tree; t != NULL; t = t->rnode) {
|
|
if (traverse)
|
|
tree = t->lnode;
|
|
sourceline = tree->source_line;
|
|
source = tree->source_file;
|
|
switch (setjmp(rule_tag)) {
|
|
case 0: /* normal non-jump */
|
|
/* test pattern, if any */
|
|
if (tree->lnode == NULL ||
|
|
eval_condition(tree->lnode))
|
|
(void) interpret(tree->rnode);
|
|
break;
|
|
case TAG_CONTINUE: /* NEXT statement */
|
|
return 1;
|
|
case TAG_BREAK:
|
|
return 0;
|
|
default:
|
|
cant_happen();
|
|
}
|
|
if (! traverse) /* case Node_rule_node */
|
|
break; /* don't loop */
|
|
}
|
|
break;
|
|
|
|
case Node_statement_list:
|
|
for (t = tree; t != NULL; t = t->rnode)
|
|
(void) interpret(t->lnode);
|
|
break;
|
|
|
|
case Node_K_if:
|
|
if (eval_condition(tree->lnode))
|
|
(void) interpret(tree->rnode->lnode);
|
|
else
|
|
(void) interpret(tree->rnode->rnode);
|
|
break;
|
|
|
|
case Node_K_while:
|
|
PUSH_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
|
|
stable_tree = tree;
|
|
while (eval_condition(stable_tree->lnode)) {
|
|
switch (setjmp(loop_tag)) {
|
|
case 0: /* normal non-jump */
|
|
(void) interpret(stable_tree->rnode);
|
|
break;
|
|
case TAG_CONTINUE: /* continue statement */
|
|
break;
|
|
case TAG_BREAK: /* break statement */
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
return 1;
|
|
default:
|
|
cant_happen();
|
|
}
|
|
}
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
break;
|
|
|
|
case Node_K_do:
|
|
PUSH_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
stable_tree = tree;
|
|
do {
|
|
switch (setjmp(loop_tag)) {
|
|
case 0: /* normal non-jump */
|
|
(void) interpret(stable_tree->rnode);
|
|
break;
|
|
case TAG_CONTINUE: /* continue statement */
|
|
break;
|
|
case TAG_BREAK: /* break statement */
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
return 1;
|
|
default:
|
|
cant_happen();
|
|
}
|
|
} while (eval_condition(stable_tree->lnode));
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
break;
|
|
|
|
case Node_K_for:
|
|
PUSH_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
(void) interpret(tree->forloop->init);
|
|
stable_tree = tree;
|
|
while (eval_condition(stable_tree->forloop->cond)) {
|
|
switch (setjmp(loop_tag)) {
|
|
case 0: /* normal non-jump */
|
|
(void) interpret(stable_tree->lnode);
|
|
/* fall through */
|
|
case TAG_CONTINUE: /* continue statement */
|
|
(void) interpret(stable_tree->forloop->incr);
|
|
break;
|
|
case TAG_BREAK: /* break statement */
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
return 1;
|
|
default:
|
|
cant_happen();
|
|
}
|
|
}
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
break;
|
|
|
|
case Node_K_arrayfor:
|
|
{
|
|
volatile struct search l; /* For array_for */
|
|
Func_ptr after_assign = NULL;
|
|
|
|
#define hakvar forloop->init
|
|
#define arrvar forloop->incr
|
|
PUSH_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
lhs = get_lhs(tree->hakvar, &after_assign);
|
|
t = tree->arrvar;
|
|
if (t->type == Node_param_list)
|
|
t = stack_ptr[t->param_cnt];
|
|
if (t->type == Node_array_ref)
|
|
t = t->orig_array;
|
|
stable_tree = tree;
|
|
if ((t->flags & SCALAR) != 0)
|
|
fatal("attempt to use scalar as array");
|
|
for (assoc_scan(t, (struct search *)&l);
|
|
l.retval;
|
|
assoc_next((struct search *)&l)) {
|
|
unref(*((NODE **) lhs));
|
|
*lhs = dupnode(l.retval);
|
|
if (after_assign)
|
|
(*after_assign)();
|
|
switch (setjmp(loop_tag)) {
|
|
case 0:
|
|
(void) interpret(stable_tree->lnode);
|
|
case TAG_CONTINUE:
|
|
break;
|
|
|
|
case TAG_BREAK:
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
return 1;
|
|
default:
|
|
cant_happen();
|
|
}
|
|
}
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, loop_tag_valid);
|
|
break;
|
|
}
|
|
|
|
case Node_K_break:
|
|
if (! loop_tag_valid) {
|
|
/*
|
|
* Old AT&T nawk treats break outside of loops like
|
|
* next. New ones catch it at parse time. Allow it if
|
|
* do_traditional is on, and complain if lint.
|
|
*/
|
|
static int warned = FALSE;
|
|
|
|
if (do_lint && ! warned) {
|
|
warning("use of `break' outside a loop is not portable");
|
|
warned = TRUE;
|
|
}
|
|
if (! do_traditional || do_posix)
|
|
fatal("use of `break' outside a loop is not allowed");
|
|
if (in_function())
|
|
pop_fcall_stack();
|
|
longjmp(rule_tag, TAG_CONTINUE);
|
|
} else
|
|
longjmp(loop_tag, TAG_BREAK);
|
|
break;
|
|
|
|
case Node_K_continue:
|
|
if (! loop_tag_valid) {
|
|
/*
|
|
* Old AT&T nawk treats continue outside of loops like
|
|
* next. New ones catch it at parse time. Allow it if
|
|
* do_traditional is on, and complain if lint.
|
|
*/
|
|
static int warned = FALSE;
|
|
|
|
if (do_lint && ! warned) {
|
|
warning("use of `continue' outside a loop is not portable");
|
|
warned = TRUE;
|
|
}
|
|
if (! do_traditional || do_posix)
|
|
fatal("use of `continue' outside a loop is not allowed");
|
|
if (in_function())
|
|
pop_fcall_stack();
|
|
longjmp(rule_tag, TAG_CONTINUE);
|
|
} else
|
|
longjmp(loop_tag, TAG_CONTINUE);
|
|
break;
|
|
|
|
case Node_K_print:
|
|
do_print(tree);
|
|
break;
|
|
|
|
case Node_K_printf:
|
|
do_printf(tree);
|
|
break;
|
|
|
|
case Node_K_delete:
|
|
do_delete(tree->lnode, tree->rnode);
|
|
break;
|
|
|
|
case Node_K_delete_loop:
|
|
do_delete_loop(tree->lnode, tree->rnode);
|
|
break;
|
|
|
|
case Node_K_next:
|
|
if (in_begin_rule)
|
|
fatal("`next' cannot be called from a BEGIN rule");
|
|
else if (in_end_rule)
|
|
fatal("`next' cannot be called from an END rule");
|
|
|
|
if (in_function())
|
|
pop_fcall_stack();
|
|
|
|
longjmp(rule_tag, TAG_CONTINUE);
|
|
break;
|
|
|
|
case Node_K_nextfile:
|
|
if (in_begin_rule)
|
|
fatal("`nextfile' cannot be called from a BEGIN rule");
|
|
else if (in_end_rule)
|
|
fatal("`nextfile' cannot be called from an END rule");
|
|
|
|
if (in_function())
|
|
pop_fcall_stack();
|
|
|
|
do_nextfile();
|
|
break;
|
|
|
|
case Node_K_exit:
|
|
/*
|
|
* In A,K,&W, p. 49, it says that an exit statement "...
|
|
* causes the program to behave as if the end of input had
|
|
* occurred; no more input is read, and the END actions, if
|
|
* any are executed." This implies that the rest of the rules
|
|
* are not done. So we immediately break out of the main loop.
|
|
*/
|
|
exiting = TRUE;
|
|
if (tree->lnode != NULL) {
|
|
t = tree_eval(tree->lnode);
|
|
exit_val = (int) force_number(t);
|
|
free_temp(t);
|
|
}
|
|
longjmp(rule_tag, TAG_BREAK);
|
|
break;
|
|
|
|
case Node_K_return:
|
|
t = tree_eval(tree->lnode);
|
|
ret_node = dupnode(t);
|
|
free_temp(t);
|
|
longjmp(func_tag, TAG_RETURN);
|
|
break;
|
|
|
|
default:
|
|
/*
|
|
* Appears to be an expression statement. Throw away the
|
|
* value.
|
|
*/
|
|
if (do_lint && tree->type == Node_var)
|
|
warning("statement has no effect");
|
|
t = tree_eval(tree);
|
|
free_temp(t);
|
|
break;
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
/* r_tree_eval --- evaluate a subtree */
|
|
|
|
NODE *
|
|
r_tree_eval(tree, iscond)
|
|
register NODE *tree;
|
|
int iscond;
|
|
{
|
|
register NODE *r, *t1, *t2; /* return value & temporary subtrees */
|
|
register NODE **lhs;
|
|
register int di;
|
|
AWKNUM x, x1, x2;
|
|
long lx;
|
|
#ifdef _CRAY
|
|
long lx2;
|
|
#endif
|
|
char namebuf[100];
|
|
|
|
#ifdef DEBUG
|
|
if (tree == NULL)
|
|
return Nnull_string;
|
|
else if (tree->type == Node_val) {
|
|
if (tree->stref <= 0)
|
|
cant_happen();
|
|
return tree;
|
|
} else if (tree->type == Node_var) {
|
|
if (tree->var_value->stref <= 0)
|
|
cant_happen();
|
|
return tree->var_value;
|
|
}
|
|
#endif
|
|
|
|
if (tree->type == Node_param_list) {
|
|
int paramnum = tree->param_cnt + 1;
|
|
|
|
if ((tree->flags & FUNC) != 0)
|
|
fatal("can't use function name `%s' as variable or array",
|
|
tree->vname);
|
|
|
|
tree = stack_ptr[tree->param_cnt];
|
|
if (tree == NULL)
|
|
return Nnull_string;
|
|
sprintf(namebuf, "parameter #%d", paramnum);
|
|
tree->vname = namebuf;
|
|
}
|
|
if (tree->type == Node_array_ref)
|
|
tree = tree->orig_array;
|
|
|
|
switch (tree->type) {
|
|
case Node_var:
|
|
return tree->var_value;
|
|
|
|
case Node_and:
|
|
return tmp_number((AWKNUM) (eval_condition(tree->lnode)
|
|
&& eval_condition(tree->rnode)));
|
|
|
|
case Node_or:
|
|
return tmp_number((AWKNUM) (eval_condition(tree->lnode)
|
|
|| eval_condition(tree->rnode)));
|
|
|
|
case Node_not:
|
|
return tmp_number((AWKNUM) ! eval_condition(tree->lnode));
|
|
|
|
/* Builtins */
|
|
case Node_builtin:
|
|
return (*tree->proc)(tree->subnode);
|
|
|
|
case Node_K_getline:
|
|
return (do_getline(tree));
|
|
|
|
case Node_in_array:
|
|
return tmp_number((AWKNUM) in_array(tree->lnode, tree->rnode));
|
|
|
|
case Node_func_call:
|
|
return func_call(tree->rnode, tree->lnode);
|
|
|
|
/* unary operations */
|
|
case Node_NR:
|
|
case Node_FNR:
|
|
case Node_NF:
|
|
case Node_FIELDWIDTHS:
|
|
case Node_FS:
|
|
case Node_RS:
|
|
case Node_field_spec:
|
|
case Node_subscript:
|
|
case Node_IGNORECASE:
|
|
case Node_OFS:
|
|
case Node_ORS:
|
|
case Node_OFMT:
|
|
case Node_CONVFMT:
|
|
lhs = get_lhs(tree, (Func_ptr *) NULL);
|
|
return *lhs;
|
|
|
|
case Node_var_array:
|
|
fatal("attempt to use array `%s' in a scalar context",
|
|
tree->vname);
|
|
|
|
case Node_unary_minus:
|
|
t1 = tree_eval(tree->subnode);
|
|
x = -force_number(t1);
|
|
free_temp(t1);
|
|
return tmp_number(x);
|
|
|
|
case Node_cond_exp:
|
|
if (eval_condition(tree->lnode))
|
|
return tree_eval(tree->rnode->lnode);
|
|
return tree_eval(tree->rnode->rnode);
|
|
|
|
case Node_match:
|
|
case Node_nomatch:
|
|
case Node_regex:
|
|
return match_op(tree);
|
|
|
|
case Node_func:
|
|
fatal("function `%s' called with space between name and (,\n%s",
|
|
tree->lnode->param,
|
|
"or used in other expression context");
|
|
|
|
/* assignments */
|
|
case Node_assign:
|
|
{
|
|
Func_ptr after_assign = NULL;
|
|
|
|
if (iscond && do_lint)
|
|
warning("assignment used in conditional context");
|
|
r = tree_eval(tree->rnode);
|
|
lhs = get_lhs(tree->lnode, &after_assign);
|
|
if (r != *lhs) {
|
|
NODE *save;
|
|
|
|
save = *lhs;
|
|
*lhs = dupnode(r);
|
|
unref(save);
|
|
}
|
|
free_temp(r);
|
|
tree->lnode->flags |= SCALAR;
|
|
if (after_assign)
|
|
(*after_assign)();
|
|
return *lhs;
|
|
}
|
|
|
|
case Node_concat:
|
|
{
|
|
NODE **treelist;
|
|
NODE **strlist;
|
|
NODE *save_tree;
|
|
register NODE **treep;
|
|
register NODE **strp;
|
|
register size_t len;
|
|
char *str;
|
|
register char *dest;
|
|
int alloc_count, str_count;
|
|
int i;
|
|
|
|
/*
|
|
* This is an efficiency hack for multiple adjacent string
|
|
* concatenations, to avoid recursion and string copies.
|
|
*
|
|
* Node_concat trees grow downward to the left, so
|
|
* descend to lowest (first) node, accumulating nodes
|
|
* to evaluate to strings as we go.
|
|
*/
|
|
|
|
/*
|
|
* But first, no arbitrary limits. Count the number of
|
|
* nodes and malloc the treelist and strlist arrays.
|
|
* There will be alloc_count + 1 items to concatenate. We
|
|
* also leave room for an extra pointer at the end to
|
|
* use as a sentinel. Thus, start alloc_count at 2.
|
|
*/
|
|
save_tree = tree;
|
|
for (alloc_count = 2; tree && tree->type == Node_concat; tree = tree->lnode)
|
|
alloc_count++;
|
|
tree = save_tree;
|
|
emalloc(treelist, NODE **, sizeof(NODE *) * alloc_count, "tree_eval");
|
|
emalloc(strlist, NODE **, sizeof(NODE *) * alloc_count, "tree_eval");
|
|
|
|
/* Now, here we go. */
|
|
treep = treelist;
|
|
while (tree && tree->type == Node_concat) {
|
|
*treep++ = tree->rnode;
|
|
tree = tree->lnode;
|
|
}
|
|
*treep = tree;
|
|
/*
|
|
* Now, evaluate to strings in LIFO order, accumulating
|
|
* the string length, so we can do a single malloc at the
|
|
* end.
|
|
*
|
|
* Evaluate the expressions first, then get their
|
|
* lengthes, in case one of the expressions has a
|
|
* side effect that changes one of the others.
|
|
* See test/nasty.awk.
|
|
*/
|
|
strp = strlist;
|
|
len = 0;
|
|
while (treep >= treelist) {
|
|
*strp = force_string(tree_eval(*treep--));
|
|
strp++;
|
|
}
|
|
*strp = NULL;
|
|
|
|
str_count = strp - strlist;
|
|
strp = strlist;
|
|
for (i = 0; i < str_count; i++) {
|
|
len += (*strp)->stlen;
|
|
strp++;
|
|
}
|
|
emalloc(str, char *, len+2, "tree_eval");
|
|
str[len] = str[len+1] = '\0'; /* for good measure */
|
|
dest = str;
|
|
strp = strlist;
|
|
while (*strp) {
|
|
memcpy(dest, (*strp)->stptr, (*strp)->stlen);
|
|
dest += (*strp)->stlen;
|
|
free_temp(*strp);
|
|
strp++;
|
|
}
|
|
r = make_str_node(str, len, ALREADY_MALLOCED);
|
|
r->flags |= TEMP;
|
|
|
|
free(strlist);
|
|
free(treelist);
|
|
}
|
|
return r;
|
|
|
|
/* other assignment types are easier because they are numeric */
|
|
case Node_preincrement:
|
|
case Node_predecrement:
|
|
case Node_postincrement:
|
|
case Node_postdecrement:
|
|
case Node_assign_exp:
|
|
case Node_assign_times:
|
|
case Node_assign_quotient:
|
|
case Node_assign_mod:
|
|
case Node_assign_plus:
|
|
case Node_assign_minus:
|
|
return op_assign(tree);
|
|
default:
|
|
break; /* handled below */
|
|
}
|
|
|
|
/* evaluate subtrees in order to do binary operation, then keep going */
|
|
t1 = tree_eval(tree->lnode);
|
|
t2 = tree_eval(tree->rnode);
|
|
|
|
switch (tree->type) {
|
|
case Node_geq:
|
|
case Node_leq:
|
|
case Node_greater:
|
|
case Node_less:
|
|
case Node_notequal:
|
|
case Node_equal:
|
|
di = cmp_nodes(t1, t2);
|
|
free_temp(t1);
|
|
free_temp(t2);
|
|
switch (tree->type) {
|
|
case Node_equal:
|
|
return tmp_number((AWKNUM) (di == 0));
|
|
case Node_notequal:
|
|
return tmp_number((AWKNUM) (di != 0));
|
|
case Node_less:
|
|
return tmp_number((AWKNUM) (di < 0));
|
|
case Node_greater:
|
|
return tmp_number((AWKNUM) (di > 0));
|
|
case Node_leq:
|
|
return tmp_number((AWKNUM) (di <= 0));
|
|
case Node_geq:
|
|
return tmp_number((AWKNUM) (di >= 0));
|
|
default:
|
|
cant_happen();
|
|
}
|
|
break;
|
|
default:
|
|
break; /* handled below */
|
|
}
|
|
|
|
x1 = force_number(t1);
|
|
free_temp(t1);
|
|
x2 = force_number(t2);
|
|
free_temp(t2);
|
|
switch (tree->type) {
|
|
case Node_exp:
|
|
if ((lx = x2) == x2 && lx >= 0) { /* integer exponent */
|
|
if (lx == 0)
|
|
x = 1;
|
|
else if (lx == 1)
|
|
x = x1;
|
|
else {
|
|
/* doing it this way should be more precise */
|
|
for (x = x1; --lx; )
|
|
x *= x1;
|
|
}
|
|
} else
|
|
x = pow((double) x1, (double) x2);
|
|
return tmp_number(x);
|
|
|
|
case Node_times:
|
|
return tmp_number(x1 * x2);
|
|
|
|
case Node_quotient:
|
|
if (x2 == 0)
|
|
fatal("division by zero attempted");
|
|
#ifdef _CRAY
|
|
/* special case for integer division, put in for Cray */
|
|
lx2 = x2;
|
|
if (lx2 == 0)
|
|
return tmp_number(x1 / x2);
|
|
lx = (long) x1 / lx2;
|
|
if (lx * x2 == x1)
|
|
return tmp_number((AWKNUM) lx);
|
|
else
|
|
#endif
|
|
return tmp_number(x1 / x2);
|
|
|
|
case Node_mod:
|
|
if (x2 == 0)
|
|
fatal("division by zero attempted in mod");
|
|
#ifdef HAVE_FMOD
|
|
return tmp_number(fmod(x1, x2));
|
|
#else /* ! HAVE_FMOD */
|
|
(void) modf(x1 / x2, &x);
|
|
return tmp_number(x1 - x * x2);
|
|
#endif /* ! HAVE_FMOD */
|
|
|
|
case Node_plus:
|
|
return tmp_number(x1 + x2);
|
|
|
|
case Node_minus:
|
|
return tmp_number(x1 - x2);
|
|
|
|
case Node_var_array:
|
|
fatal("attempt to use array `%s' in a scalar context",
|
|
tree->vname);
|
|
|
|
default:
|
|
fatal("illegal type (%s) in tree_eval", nodetype2str(tree->type));
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
/* eval_condition --- is TREE true or false? Returns 0==false, non-zero==true */
|
|
|
|
static int
|
|
eval_condition(tree)
|
|
register NODE *tree;
|
|
{
|
|
register NODE *t1;
|
|
register int ret;
|
|
|
|
if (tree == NULL) /* Null trees are the easiest kinds */
|
|
return TRUE;
|
|
if (tree->type == Node_line_range) {
|
|
/*
|
|
* Node_line_range is kind of like Node_match, EXCEPT: the
|
|
* lnode field (more properly, the condpair field) is a node
|
|
* of a Node_cond_pair; whether we evaluate the lnode of that
|
|
* node or the rnode depends on the triggered word. More
|
|
* precisely: if we are not yet triggered, we tree_eval the
|
|
* lnode; if that returns true, we set the triggered word.
|
|
* If we are triggered (not ELSE IF, note), we tree_eval the
|
|
* rnode, clear triggered if it succeeds, and perform our
|
|
* action (regardless of success or failure). We want to be
|
|
* able to begin and end on a single input record, so this
|
|
* isn't an ELSE IF, as noted above.
|
|
*/
|
|
if (! tree->triggered) {
|
|
if (! eval_condition(tree->condpair->lnode))
|
|
return FALSE;
|
|
else
|
|
tree->triggered = TRUE;
|
|
}
|
|
/* Else we are triggered */
|
|
if (eval_condition(tree->condpair->rnode))
|
|
tree->triggered = FALSE;
|
|
return TRUE;
|
|
}
|
|
|
|
/*
|
|
* Could just be J.random expression. in which case, null and 0 are
|
|
* false, anything else is true
|
|
*/
|
|
|
|
t1 = m_tree_eval(tree, TRUE);
|
|
if (t1->flags & MAYBE_NUM)
|
|
(void) force_number(t1);
|
|
if (t1->flags & NUMBER)
|
|
ret = (t1->numbr != 0.0);
|
|
else
|
|
ret = (t1->stlen != 0);
|
|
free_temp(t1);
|
|
return ret;
|
|
}
|
|
|
|
/* cmp_nodes --- compare two nodes, returning negative, 0, positive */
|
|
|
|
int
|
|
cmp_nodes(t1, t2)
|
|
register NODE *t1, *t2;
|
|
{
|
|
register int ret;
|
|
register size_t len1, len2;
|
|
register int l;
|
|
int ldiff;
|
|
|
|
if (t1 == t2)
|
|
return 0;
|
|
if (t1->flags & MAYBE_NUM)
|
|
(void) force_number(t1);
|
|
if (t2->flags & MAYBE_NUM)
|
|
(void) force_number(t2);
|
|
if ((t1->flags & NUMBER) && (t2->flags & NUMBER)) {
|
|
if (t1->numbr == t2->numbr)
|
|
return 0;
|
|
/* don't subtract, in case one or both are infinite */
|
|
else if (t1->numbr < t2->numbr)
|
|
return -1;
|
|
else
|
|
return 1;
|
|
}
|
|
(void) force_string(t1);
|
|
(void) force_string(t2);
|
|
len1 = t1->stlen;
|
|
len2 = t2->stlen;
|
|
ldiff = len1 - len2;
|
|
if (len1 == 0 || len2 == 0)
|
|
return ldiff;
|
|
l = (ldiff <= 0 ? len1 : len2);
|
|
if (IGNORECASE) {
|
|
register unsigned char *cp1 = (unsigned char *) t1->stptr;
|
|
register unsigned char *cp2 = (unsigned char *) t2->stptr;
|
|
|
|
for (ret = 0; l-- > 0 && ret == 0; cp1++, cp2++)
|
|
ret = casetable[*cp1] - casetable[*cp2];
|
|
} else
|
|
ret = memcmp(t1->stptr, t2->stptr, l);
|
|
return (ret == 0 ? ldiff : ret);
|
|
}
|
|
|
|
/* op_assign --- do +=, -=, etc. */
|
|
|
|
static NODE *
|
|
op_assign(tree)
|
|
register NODE *tree;
|
|
{
|
|
AWKNUM rval, lval;
|
|
NODE **lhs;
|
|
AWKNUM t1, t2;
|
|
long ltemp;
|
|
NODE *tmp;
|
|
Func_ptr after_assign = NULL;
|
|
|
|
/*
|
|
* For ++ and --, get the lhs when doing the op and then
|
|
* return. For += etc, do the rhs first, since it can
|
|
* rearrange things, and *then* get the lhs.
|
|
*/
|
|
|
|
switch(tree->type) {
|
|
case Node_preincrement:
|
|
case Node_predecrement:
|
|
lhs = get_lhs(tree->lnode, &after_assign);
|
|
lval = force_number(*lhs);
|
|
unref(*lhs);
|
|
*lhs = make_number(lval +
|
|
(tree->type == Node_preincrement ? 1.0 : -1.0));
|
|
tree->lnode->flags |= SCALAR;
|
|
if (after_assign)
|
|
(*after_assign)();
|
|
return *lhs;
|
|
|
|
case Node_postincrement:
|
|
case Node_postdecrement:
|
|
lhs = get_lhs(tree->lnode, &after_assign);
|
|
lval = force_number(*lhs);
|
|
unref(*lhs);
|
|
*lhs = make_number(lval +
|
|
(tree->type == Node_postincrement ? 1.0 : -1.0));
|
|
tree->lnode->flags |= SCALAR;
|
|
if (after_assign)
|
|
(*after_assign)();
|
|
return tmp_number(lval);
|
|
default:
|
|
break; /* handled below */
|
|
}
|
|
|
|
/*
|
|
* It's a += kind of thing. Do the rhs, then the lhs.
|
|
*/
|
|
|
|
tmp = tree_eval(tree->rnode);
|
|
rval = force_number(tmp);
|
|
free_temp(tmp);
|
|
|
|
lhs = get_lhs(tree->lnode, &after_assign);
|
|
lval = force_number(*lhs);
|
|
|
|
unref(*lhs);
|
|
switch(tree->type) {
|
|
case Node_assign_exp:
|
|
if ((ltemp = rval) == rval) { /* integer exponent */
|
|
if (ltemp == 0)
|
|
*lhs = make_number((AWKNUM) 1);
|
|
else if (ltemp == 1)
|
|
*lhs = make_number(lval);
|
|
else {
|
|
/* doing it this way should be more precise */
|
|
for (t1 = t2 = lval; --ltemp; )
|
|
t1 *= t2;
|
|
*lhs = make_number(t1);
|
|
}
|
|
} else
|
|
*lhs = make_number((AWKNUM) pow((double) lval, (double) rval));
|
|
break;
|
|
|
|
case Node_assign_times:
|
|
*lhs = make_number(lval * rval);
|
|
break;
|
|
|
|
case Node_assign_quotient:
|
|
if (rval == (AWKNUM) 0)
|
|
fatal("division by zero attempted in /=");
|
|
#ifdef _CRAY
|
|
/* special case for integer division, put in for Cray */
|
|
ltemp = rval;
|
|
if (ltemp == 0) {
|
|
*lhs = make_number(lval / rval);
|
|
break;
|
|
}
|
|
ltemp = (long) lval / ltemp;
|
|
if (ltemp * lval == rval)
|
|
*lhs = make_number((AWKNUM) ltemp);
|
|
else
|
|
#endif /* _CRAY */
|
|
*lhs = make_number(lval / rval);
|
|
break;
|
|
|
|
case Node_assign_mod:
|
|
if (rval == (AWKNUM) 0)
|
|
fatal("division by zero attempted in %%=");
|
|
#ifdef HAVE_FMOD
|
|
*lhs = make_number(fmod(lval, rval));
|
|
#else /* ! HAVE_FMOD */
|
|
(void) modf(lval / rval, &t1);
|
|
t2 = lval - rval * t1;
|
|
*lhs = make_number(t2);
|
|
#endif /* ! HAVE_FMOD */
|
|
break;
|
|
|
|
case Node_assign_plus:
|
|
*lhs = make_number(lval + rval);
|
|
break;
|
|
|
|
case Node_assign_minus:
|
|
*lhs = make_number(lval - rval);
|
|
break;
|
|
default:
|
|
cant_happen();
|
|
}
|
|
tree->lnode->flags |= SCALAR;
|
|
if (after_assign)
|
|
(*after_assign)();
|
|
return *lhs;
|
|
}
|
|
|
|
static struct fcall {
|
|
char *fname;
|
|
unsigned long count;
|
|
NODE *arglist;
|
|
NODE **prevstack;
|
|
NODE **stack;
|
|
} *fcall_list = NULL;
|
|
|
|
static long fcall_list_size = 0;
|
|
static long curfcall = -1;
|
|
|
|
/* in_function --- return true/false if we need to unwind awk functions */
|
|
|
|
static int
|
|
in_function()
|
|
{
|
|
return (curfcall >= 0);
|
|
}
|
|
|
|
/* pop_fcall --- pop off a single function call */
|
|
|
|
static void
|
|
pop_fcall()
|
|
{
|
|
NODE *n, **sp, *arg, *argp;
|
|
int count;
|
|
struct fcall *f;
|
|
|
|
assert(curfcall >= 0);
|
|
f = & fcall_list[curfcall];
|
|
stack_ptr = f->prevstack;
|
|
|
|
/*
|
|
* here, we pop each parameter and check whether
|
|
* it was an array. If so, and if the arg. passed in was
|
|
* a simple variable, then the value should be copied back.
|
|
* This achieves "call-by-reference" for arrays.
|
|
*/
|
|
sp = f->stack;
|
|
count = f->count;
|
|
|
|
for (argp = f->arglist; count > 0 && argp != NULL; argp = argp->rnode) {
|
|
arg = argp->lnode;
|
|
if (arg->type == Node_param_list)
|
|
arg = stack_ptr[arg->param_cnt];
|
|
n = *sp++;
|
|
if ((arg->type == Node_var /* || arg->type == Node_var_array */)
|
|
&& n->type == Node_var_array) {
|
|
/* should we free arg->var_value ? */
|
|
arg->var_array = n->var_array;
|
|
arg->type = Node_var_array;
|
|
arg->array_size = n->array_size;
|
|
arg->table_size = n->table_size;
|
|
arg->flags = n->flags;
|
|
}
|
|
/* n->lnode overlays the array size, don't unref it if array */
|
|
if (n->type != Node_var_array && n->type != Node_array_ref)
|
|
unref(n->lnode);
|
|
freenode(n);
|
|
count--;
|
|
}
|
|
while (count-- > 0) {
|
|
n = *sp++;
|
|
/* if n is a local array, all the elements should be freed */
|
|
if (n->type == Node_var_array)
|
|
assoc_clear(n);
|
|
/* n->lnode overlays the array size, don't unref it if array */
|
|
if (n->type != Node_var_array && n->type != Node_array_ref)
|
|
unref(n->lnode);
|
|
freenode(n);
|
|
}
|
|
if (f->stack)
|
|
free((char *) f->stack);
|
|
memset(f, '\0', sizeof(struct fcall));
|
|
curfcall--;
|
|
}
|
|
|
|
/* pop_fcall_stack --- pop off all function args, don't leak memory */
|
|
|
|
static void
|
|
pop_fcall_stack()
|
|
{
|
|
while (curfcall >= 0)
|
|
pop_fcall();
|
|
}
|
|
|
|
/* push_args --- push function arguments onto the stack */
|
|
|
|
static void
|
|
push_args(count, arglist, oldstack, func_name)
|
|
int count;
|
|
NODE *arglist;
|
|
NODE **oldstack;
|
|
char *func_name;
|
|
{
|
|
struct fcall *f;
|
|
NODE *arg, *argp, *r, **sp, *n;
|
|
|
|
if (fcall_list_size == 0) { /* first time */
|
|
emalloc(fcall_list, struct fcall *, 10 * sizeof(struct fcall),
|
|
"push_args");
|
|
fcall_list_size = 10;
|
|
}
|
|
|
|
if (++curfcall >= fcall_list_size) {
|
|
fcall_list_size *= 2;
|
|
erealloc(fcall_list, struct fcall *,
|
|
fcall_list_size * sizeof(struct fcall), "push_args");
|
|
}
|
|
f = & fcall_list[curfcall];
|
|
memset(f, '\0', sizeof(struct fcall));
|
|
|
|
if (count > 0)
|
|
emalloc(f->stack, NODE **, count*sizeof(NODE *), "func_call");
|
|
f->count = count;
|
|
f->fname = func_name; /* not used, for debugging, just in case */
|
|
f->arglist = arglist;
|
|
f->prevstack = oldstack;
|
|
|
|
sp = f->stack;
|
|
|
|
/* for each calling arg. add NODE * on stack */
|
|
for (argp = arglist; count > 0 && argp != NULL; argp = argp->rnode) {
|
|
arg = argp->lnode;
|
|
getnode(r);
|
|
r->type = Node_var;
|
|
|
|
/* call by reference for arrays; see below also */
|
|
if (arg->type == Node_param_list) {
|
|
/* we must also reassign f here; see below */
|
|
f = & fcall_list[curfcall];
|
|
arg = f->prevstack[arg->param_cnt];
|
|
}
|
|
if (arg->type == Node_var_array) {
|
|
r->type = Node_array_ref;
|
|
r->flags &= ~SCALAR;
|
|
r->orig_array = arg;
|
|
r->vname = arg->vname;
|
|
} else if (arg->type == Node_array_ref) {
|
|
*r = *arg;
|
|
} else {
|
|
n = tree_eval(arg);
|
|
r->lnode = dupnode(n);
|
|
r->rnode = (NODE *) NULL;
|
|
if ((n->flags & SCALAR) != 0)
|
|
r->flags |= SCALAR;
|
|
free_temp(n);
|
|
}
|
|
*sp++ = r;
|
|
count--;
|
|
}
|
|
if (argp != NULL) /* left over calling args. */
|
|
warning(
|
|
"function `%s' called with more arguments than declared",
|
|
func_name);
|
|
|
|
/* add remaining params. on stack with null value */
|
|
while (count-- > 0) {
|
|
getnode(r);
|
|
r->type = Node_var;
|
|
r->lnode = Nnull_string;
|
|
r->flags &= ~SCALAR;
|
|
r->rnode = (NODE *) NULL;
|
|
*sp++ = r;
|
|
}
|
|
|
|
/*
|
|
* We have to reassign f. Why, you may ask? It is possible that
|
|
* other functions were called during the course of tree_eval()-ing
|
|
* the arguments to this function. As a result of that, fcall_list
|
|
* may have been realloc()'ed, with the result that f is now
|
|
* pointing into free()'d space. This was a nasty one to track down.
|
|
*/
|
|
f = & fcall_list[curfcall];
|
|
|
|
stack_ptr = f->stack;
|
|
}
|
|
|
|
/* func_call --- call a function, call by reference for arrays */
|
|
|
|
NODE **stack_ptr;
|
|
|
|
static NODE *
|
|
func_call(name, arg_list)
|
|
NODE *name; /* name is a Node_val giving function name */
|
|
NODE *arg_list; /* Node_expression_list of calling args. */
|
|
{
|
|
register NODE *r;
|
|
NODE *f;
|
|
jmp_buf volatile func_tag_stack;
|
|
jmp_buf volatile loop_tag_stack;
|
|
int volatile save_loop_tag_valid = FALSE;
|
|
NODE *save_ret_node;
|
|
extern NODE *ret_node;
|
|
|
|
/* retrieve function definition node */
|
|
f = lookup(name->stptr);
|
|
if (f == NULL || f->type != Node_func)
|
|
fatal("function `%s' not defined", name->stptr);
|
|
#ifdef FUNC_TRACE
|
|
fprintf(stderr, "function %s called\n", name->stptr);
|
|
#endif
|
|
push_args(f->lnode->param_cnt, arg_list, stack_ptr, name->stptr);
|
|
|
|
/*
|
|
* Execute function body, saving context, as a return statement
|
|
* will longjmp back here.
|
|
*
|
|
* Have to save and restore the loop_tag stuff so that a return
|
|
* inside a loop in a function body doesn't scrog any loops going
|
|
* on in the main program. We save the necessary info in variables
|
|
* local to this function so that function nesting works OK.
|
|
* We also only bother to save the loop stuff if we're in a loop
|
|
* when the function is called.
|
|
*/
|
|
if (loop_tag_valid) {
|
|
int junk = 0;
|
|
|
|
save_loop_tag_valid = (volatile int) loop_tag_valid;
|
|
PUSH_BINDING(loop_tag_stack, loop_tag, junk);
|
|
loop_tag_valid = FALSE;
|
|
}
|
|
PUSH_BINDING(func_tag_stack, func_tag, func_tag_valid);
|
|
save_ret_node = ret_node;
|
|
ret_node = Nnull_string; /* default return value */
|
|
if (setjmp(func_tag) == 0)
|
|
(void) interpret(f->rnode);
|
|
|
|
r = ret_node;
|
|
ret_node = (NODE *) save_ret_node;
|
|
RESTORE_BINDING(func_tag_stack, func_tag, func_tag_valid);
|
|
pop_fcall();
|
|
|
|
/* Restore the loop_tag stuff if necessary. */
|
|
if (save_loop_tag_valid) {
|
|
int junk = 0;
|
|
|
|
loop_tag_valid = (int) save_loop_tag_valid;
|
|
RESTORE_BINDING(loop_tag_stack, loop_tag, junk);
|
|
}
|
|
|
|
if ((r->flags & PERM) == 0)
|
|
r->flags |= TEMP;
|
|
return r;
|
|
}
|
|
|
|
/*
|
|
* r_get_lhs:
|
|
* This returns a POINTER to a node pointer. get_lhs(ptr) is the current
|
|
* value of the var, or where to store the var's new value
|
|
*
|
|
* For the special variables, don't unref their current value if it's
|
|
* the same as the internal copy; perhaps the current one is used in
|
|
* a concatenation or some other expression somewhere higher up in the
|
|
* call chain. Ouch.
|
|
*/
|
|
|
|
NODE **
|
|
r_get_lhs(ptr, assign)
|
|
register NODE *ptr;
|
|
Func_ptr *assign;
|
|
{
|
|
register NODE **aptr = NULL;
|
|
register NODE *n;
|
|
|
|
if (assign)
|
|
*assign = NULL; /* for safety */
|
|
if (ptr->type == Node_param_list) {
|
|
if ((ptr->flags & FUNC) != 0)
|
|
fatal("can't use function name `%s' as variable or array", ptr->vname);
|
|
ptr = stack_ptr[ptr->param_cnt];
|
|
}
|
|
|
|
switch (ptr->type) {
|
|
case Node_array_ref:
|
|
case Node_var_array:
|
|
fatal("attempt to use array `%s' in a scalar context",
|
|
ptr->vname);
|
|
|
|
case Node_var:
|
|
aptr = &(ptr->var_value);
|
|
#ifdef DEBUG
|
|
if (ptr->var_value->stref <= 0)
|
|
cant_happen();
|
|
#endif
|
|
break;
|
|
|
|
case Node_FIELDWIDTHS:
|
|
aptr = &(FIELDWIDTHS_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_FIELDWIDTHS;
|
|
break;
|
|
|
|
case Node_RS:
|
|
aptr = &(RS_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_RS;
|
|
break;
|
|
|
|
case Node_FS:
|
|
aptr = &(FS_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_FS;
|
|
break;
|
|
|
|
case Node_FNR:
|
|
if (FNR_node->var_value->numbr != FNR) {
|
|
unref(FNR_node->var_value);
|
|
FNR_node->var_value = make_number((AWKNUM) FNR);
|
|
}
|
|
aptr = &(FNR_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_FNR;
|
|
break;
|
|
|
|
case Node_NR:
|
|
if (NR_node->var_value->numbr != NR) {
|
|
unref(NR_node->var_value);
|
|
NR_node->var_value = make_number((AWKNUM) NR);
|
|
}
|
|
aptr = &(NR_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_NR;
|
|
break;
|
|
|
|
case Node_NF:
|
|
if (NF == -1 || NF_node->var_value->numbr != NF) {
|
|
if (NF == -1)
|
|
(void) get_field(HUGE-1, assign); /* parse record */
|
|
unref(NF_node->var_value);
|
|
NF_node->var_value = make_number((AWKNUM) NF);
|
|
}
|
|
aptr = &(NF_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_NF;
|
|
break;
|
|
|
|
case Node_IGNORECASE:
|
|
aptr = &(IGNORECASE_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_IGNORECASE;
|
|
break;
|
|
|
|
case Node_OFMT:
|
|
aptr = &(OFMT_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_OFMT;
|
|
break;
|
|
|
|
case Node_CONVFMT:
|
|
aptr = &(CONVFMT_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_CONVFMT;
|
|
break;
|
|
|
|
case Node_ORS:
|
|
aptr = &(ORS_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_ORS;
|
|
break;
|
|
|
|
case Node_OFS:
|
|
aptr = &(OFS_node->var_value);
|
|
if (assign != NULL)
|
|
*assign = set_OFS;
|
|
break;
|
|
|
|
case Node_param_list:
|
|
aptr = &(stack_ptr[ptr->param_cnt]->var_value);
|
|
break;
|
|
|
|
case Node_field_spec:
|
|
{
|
|
int field_num;
|
|
|
|
n = tree_eval(ptr->lnode);
|
|
field_num = (int) force_number(n);
|
|
free_temp(n);
|
|
if (field_num < 0)
|
|
fatal("attempt to access field %d", field_num);
|
|
if (field_num == 0 && field0_valid) { /* short circuit */
|
|
aptr = &fields_arr[0];
|
|
if (assign != NULL)
|
|
*assign = reset_record;
|
|
break;
|
|
}
|
|
aptr = get_field(field_num, assign);
|
|
break;
|
|
}
|
|
case Node_subscript:
|
|
n = ptr->lnode;
|
|
if (n->type == Node_param_list) {
|
|
int i = n->param_cnt + 1;
|
|
|
|
n = stack_ptr[n->param_cnt];
|
|
if ((n->flags & SCALAR) != 0)
|
|
fatal("attempt to use scalar parameter %d as an array", i);
|
|
}
|
|
if (n->type == Node_array_ref) {
|
|
n = n->orig_array;
|
|
assert(n->type == Node_var_array || n->type == Node_var);
|
|
}
|
|
if (n->type == Node_func) {
|
|
fatal("attempt to use function `%s' as array",
|
|
n->lnode->param);
|
|
}
|
|
aptr = assoc_lookup(n, concat_exp(ptr->rnode));
|
|
break;
|
|
|
|
case Node_func:
|
|
fatal("`%s' is a function, assignment is not allowed",
|
|
ptr->lnode->param);
|
|
|
|
case Node_builtin:
|
|
fatal("assignment is not allowed to result of builtin function");
|
|
default:
|
|
fprintf(stderr, "type = %s\n", nodetype2str(ptr->type));
|
|
fflush(stderr);
|
|
cant_happen();
|
|
}
|
|
return aptr;
|
|
}
|
|
|
|
/* match_op --- do ~ and !~ */
|
|
|
|
static NODE *
|
|
match_op(tree)
|
|
register NODE *tree;
|
|
{
|
|
register NODE *t1;
|
|
register Regexp *rp;
|
|
int i;
|
|
int match = TRUE;
|
|
int kludge_need_start = FALSE; /* FIXME: --- see below */
|
|
|
|
if (tree->type == Node_nomatch)
|
|
match = FALSE;
|
|
if (tree->type == Node_regex)
|
|
t1 = *get_field(0, (Func_ptr *) 0);
|
|
else {
|
|
t1 = force_string(tree_eval(tree->lnode));
|
|
tree = tree->rnode;
|
|
}
|
|
rp = re_update(tree);
|
|
/*
|
|
* FIXME:
|
|
*
|
|
* Any place where research() is called with a last parameter of
|
|
* FALSE, we need to use the avoid_dfa test. This is the only place
|
|
* at the moment.
|
|
*
|
|
* A new or improved dfa that distinguishes beginning/end of
|
|
* string from beginning/end of line will allow us to get rid of
|
|
* this temporary hack.
|
|
*
|
|
* The avoid_dfa() function is in re.c; it is not very smart.
|
|
*/
|
|
if (avoid_dfa(tree, t1->stptr, t1->stlen))
|
|
kludge_need_start = TRUE;
|
|
i = research(rp, t1->stptr, 0, t1->stlen, kludge_need_start);
|
|
i = (i == -1) ^ (match == TRUE);
|
|
free_temp(t1);
|
|
return tmp_number((AWKNUM) i);
|
|
}
|
|
|
|
/* set_IGNORECASE --- update IGNORECASE as appropriate */
|
|
|
|
void
|
|
set_IGNORECASE()
|
|
{
|
|
static int warned = FALSE;
|
|
|
|
if ((do_lint || do_traditional) && ! warned) {
|
|
warned = TRUE;
|
|
warning("IGNORECASE not supported in compatibility mode");
|
|
}
|
|
if (do_traditional)
|
|
IGNORECASE = FALSE;
|
|
else if ((IGNORECASE_node->var_value->flags & (STRING|STR)) != 0) {
|
|
if ((IGNORECASE_node->var_value->flags & MAYBE_NUM) == 0)
|
|
IGNORECASE = (force_string(IGNORECASE_node->var_value)->stlen > 0);
|
|
else
|
|
IGNORECASE = (force_number(IGNORECASE_node->var_value) != 0.0);
|
|
} else if ((IGNORECASE_node->var_value->flags & (NUM|NUMBER)) != 0)
|
|
IGNORECASE = (force_number(IGNORECASE_node->var_value) != 0.0);
|
|
else
|
|
IGNORECASE = FALSE; /* shouldn't happen */
|
|
set_FS_if_not_FIELDWIDTHS();
|
|
}
|
|
|
|
/* set_OFS --- update OFS related variables when OFS assigned to */
|
|
|
|
void
|
|
set_OFS()
|
|
{
|
|
OFS = force_string(OFS_node->var_value)->stptr;
|
|
OFSlen = OFS_node->var_value->stlen;
|
|
OFS[OFSlen] = '\0';
|
|
}
|
|
|
|
/* set_ORS --- update ORS related variables when ORS assigned to */
|
|
|
|
void
|
|
set_ORS()
|
|
{
|
|
ORS = force_string(ORS_node->var_value)->stptr;
|
|
ORSlen = ORS_node->var_value->stlen;
|
|
ORS[ORSlen] = '\0';
|
|
}
|
|
|
|
/* fmt_ok --- is the conversion format a valid one? */
|
|
|
|
NODE **fmt_list = NULL;
|
|
static int fmt_ok P((NODE *n));
|
|
static int fmt_index P((NODE *n));
|
|
|
|
static int
|
|
fmt_ok(n)
|
|
NODE *n;
|
|
{
|
|
NODE *tmp = force_string(n);
|
|
char *p = tmp->stptr;
|
|
|
|
if (*p++ != '%')
|
|
return 0;
|
|
while (*p && strchr(" +-#", *p) != NULL) /* flags */
|
|
p++;
|
|
while (*p && isdigit(*p)) /* width - %*.*g is NOT allowed */
|
|
p++;
|
|
if (*p == '\0' || (*p != '.' && ! isdigit(*p)))
|
|
return 0;
|
|
if (*p == '.')
|
|
p++;
|
|
while (*p && isdigit(*p)) /* precision */
|
|
p++;
|
|
if (*p == '\0' || strchr("efgEG", *p) == NULL)
|
|
return 0;
|
|
if (*++p != '\0')
|
|
return 0;
|
|
return 1;
|
|
}
|
|
|
|
/* fmt_index --- track values of OFMT and CONVFMT to keep semantics correct */
|
|
|
|
static int
|
|
fmt_index(n)
|
|
NODE *n;
|
|
{
|
|
register int ix = 0;
|
|
static int fmt_num = 4;
|
|
static int fmt_hiwater = 0;
|
|
|
|
if (fmt_list == NULL)
|
|
emalloc(fmt_list, NODE **, fmt_num*sizeof(*fmt_list), "fmt_index");
|
|
(void) force_string(n);
|
|
while (ix < fmt_hiwater) {
|
|
if (cmp_nodes(fmt_list[ix], n) == 0)
|
|
return ix;
|
|
ix++;
|
|
}
|
|
/* not found */
|
|
n->stptr[n->stlen] = '\0';
|
|
if (do_lint && ! fmt_ok(n))
|
|
warning("bad %sFMT specification",
|
|
n == CONVFMT_node->var_value ? "CONV"
|
|
: n == OFMT_node->var_value ? "O"
|
|
: "");
|
|
|
|
if (fmt_hiwater >= fmt_num) {
|
|
fmt_num *= 2;
|
|
emalloc(fmt_list, NODE **, fmt_num, "fmt_index");
|
|
}
|
|
fmt_list[fmt_hiwater] = dupnode(n);
|
|
return fmt_hiwater++;
|
|
}
|
|
|
|
/* set_OFMT --- track OFMT correctly */
|
|
|
|
void
|
|
set_OFMT()
|
|
{
|
|
OFMTidx = fmt_index(OFMT_node->var_value);
|
|
OFMT = fmt_list[OFMTidx]->stptr;
|
|
}
|
|
|
|
/* set_CONVFMT --- track CONVFMT correctly */
|
|
|
|
void
|
|
set_CONVFMT()
|
|
{
|
|
CONVFMTidx = fmt_index(CONVFMT_node->var_value);
|
|
CONVFMT = fmt_list[CONVFMTidx]->stptr;
|
|
}
|