expr.y - utils-std - Collection of commonly available Unix tools

expr.y (12573B)

%{
// SPDX-License-Identifier: 0BSD
// Copyright Pace Willisson (pace@blitz.com), J.T. Conklin (jtc@wimsey.com)
/*-
 * Written by Pace Willisson (pace@blitz.com)
 * and placed in the public domain.
 *
 * Largely rewritten by J.T. Conklin (jtc@wimsey.com)
 */
/*
 * Warning: OpenBSD yacc prints the following at the very beginning:
 * #include <string.h>
 * #include <stdlib.h>
 */
#include <assert.h>
#include <sys/types.h>
#include <ctype.h>
#include "../libutils/err.h"
#include "../libutils/getopt_nolong.h"
#include <errno.h>
#include <inttypes.h>
#include <limits.h>
#include <locale.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <regex.h>
#include <unistd.h>
/*
 * POSIX specifies a specific error code for syntax errors.  We exit
 * with this code for all errors.
 */
#define	ERR_EXIT	2
enum valtype {
	integer, numeric_string, string
} ;
struct val {
	enum valtype type;
	union {
		char *s;
		intmax_t i;
	} u;
} ;
char		**av;
int		nonposix;
struct val	*result;
static void		assert_to_integer(struct val *);
static void		assert_div(intmax_t, intmax_t);
static void		assert_minus(intmax_t, intmax_t, intmax_t);
static void		assert_plus(intmax_t, intmax_t, intmax_t);
static void		assert_times(intmax_t, intmax_t, intmax_t);
static int		compare_vals(struct val *, struct val *);
static void		free_value(struct val *);
static int		is_integer(const char *);
static int		is_string(struct val *);
static int		is_zero_or_null(struct val *);
static struct val	*make_integer(intmax_t);
static struct val	*make_str(const char *);
static struct val	*op_and(struct val *, struct val *);
static struct val	*op_colon(struct val *, struct val *);
static struct val	*op_div(struct val *, struct val *);
static struct val	*op_eq(struct val *, struct val *);
static struct val	*op_ge(struct val *, struct val *);
static struct val	*op_gt(struct val *, struct val *);
static struct val	*op_le(struct val *, struct val *);
static struct val	*op_lt(struct val *, struct val *);
static struct val	*op_minus(struct val *, struct val *);
static struct val	*op_ne(struct val *, struct val *);
static struct val	*op_or(struct val *, struct val *);
static struct val	*op_plus(struct val *, struct val *);
static struct val	*op_rem(struct val *, struct val *);
static struct val	*op_times(struct val *, struct val *);
static int		to_integer(struct val *);
static void		to_string(struct val *);
#define YYERROR_IS_DECLARED
static int		yyerror(const char *);
static int		yylex(void);
const char *argv0 = "expr";
%}
%union
{
	struct val *val;
}
%left <val> '|'
%left <val> '&'
%left <val> '=' '>' '<' GE LE NE
%left <val> '+' '-'
%left <val> '*' '/' '%'
%left <val> ':'
%token <val> TOKEN
%type <val> start expr
%%
start: expr { result = $$; }
expr:	TOKEN
	| '(' expr ')' { $$ = $2; }
	| expr '|' expr { $$ = op_or($1, $3); }
	| expr '&' expr { $$ = op_and($1, $3); }
	| expr '=' expr { $$ = op_eq($1, $3); }
	| expr '>' expr { $$ = op_gt($1, $3); }
	| expr '<' expr { $$ = op_lt($1, $3); }
	| expr GE expr  { $$ = op_ge($1, $3); }
	| expr LE expr  { $$ = op_le($1, $3); }
	| expr NE expr  { $$ = op_ne($1, $3); }
	| expr '+' expr { $$ = op_plus($1, $3); }
	| expr '-' expr { $$ = op_minus($1, $3); }
	| expr '*' expr { $$ = op_times($1, $3); }
	| expr '/' expr { $$ = op_div($1, $3); }
	| expr '%' expr { $$ = op_rem($1, $3); }
	| expr ':' expr { $$ = op_colon($1, $3); }
	;
%%
static struct val *
make_integer(intmax_t i)
{
	struct val *vp;
	vp = (struct val *)malloc(sizeof(*vp));
	if (vp == NULL)
		utils_errx(ERR_EXIT, "malloc(vp) failed");
	vp->type = integer;
	vp->u.i  = i;
	return (vp);
}
static struct val *
make_str(const char *s)
{
	struct val *vp;
	vp = (struct val *)malloc(sizeof(*vp));
	if (vp == NULL)
		utils_errx(ERR_EXIT, "malloc(vp) failed");
	if ((vp->u.s = strdup(s)) == NULL)
		utils_errx(ERR_EXIT, "strdup(s) failed");
	if (is_integer(s))
		vp->type = numeric_string;
	else
		vp->type = string;
	return (vp);
}
static void
free_value(struct val *vp)
{
	if (vp->type == string || vp->type == numeric_string)
		free(vp->u.s);
	if (vp->type == string || vp->type == numeric_string || vp->type == integer)
		free(vp);
}
static int
to_integer(struct val *vp)
{
	intmax_t i;
	/* we can only convert numeric_string to integer, here */
	if (vp->type == numeric_string) {
		errno = 0;
		i  = strtoimax(vp->u.s, (char **)NULL, 10);
		/* just keep as numeric_string, if the conversion fails */
		if (errno != ERANGE) {
			free(vp->u.s);
			vp->u.i = i;
			vp->type = integer;
		}
	}
	return (vp->type == integer);
}
static void
assert_to_integer(struct val *vp)
{
	if (vp->type == string)
		utils_errx(ERR_EXIT, "not a decimal number: '%s'", vp->u.s);
	if (!to_integer(vp))
		utils_errx(ERR_EXIT, "operand too large: '%s'", vp->u.s);
}
static void
to_string(struct val *vp)
{
	if (vp->type == string || vp->type == numeric_string)
		return;
	int ndigits = snprintf(NULL, 0, "%jd", vp->u.i);
	if(ndigits <= 0)
		utils_errx(ERR_EXIT, "failed to pre-format integer %jd as a string", vp->u.i);
	ndigits++; // NULL terminator
	if(ndigits <= 0)
		utils_errx(ERR_EXIT, "pre-format length overflow", ndigits);
	char *tmp = malloc(ndigits);
	if (tmp == NULL)
		utils_errx(ERR_EXIT, "malloc(%zd) for to_string() failed", ndigits);
	int ret = snprintf(tmp, ndigits, "%jd", vp->u.i);
	if(ret < 0)
		utils_errx(ERR_EXIT, "failed to format integer %jd as a string", vp->u.i);
	vp->type = string;
	vp->u.s  = tmp;
}
static int
is_integer(const char *s)
{
	if (nonposix) {
		if (*s == '\0')
			return (1);
		while (isspace((unsigned char)*s))
			s++;
	}
	if (*s == '-' || (nonposix && *s == '+'))
		s++;
	if (*s == '\0')
		return (0);
	while (isdigit((unsigned char)*s))
		s++;
	return (*s == '\0');
}
static int
is_string(struct val *vp)
{
	/* only TRUE if this string is not a valid integer */
	return (vp->type == string);
}
static int
yylex(void)
{
	char *p;
	if (*av == NULL)
		return (0);
	p = *av++;
	if (strlen(p) == 1) {
		if (strchr("|&=<>+-*/%:()", *p))
			return (*p);
	} else if (strlen(p) == 2 && p[1] == '=') {
		switch (*p) {
		case '>': return (GE);
		case '<': return (LE);
		case '!': return (NE);
		}
	}
	yylval.val = make_str(p);
	return (TOKEN);
}
static int
is_zero_or_null(struct val *vp)
{
	if (vp->type == integer)
		return (vp->u.i == 0);
	return (*vp->u.s == 0 || (to_integer(vp) && vp->u.i == 0));
}
int
main(int argc, char *argv[])
{
	int c;
	char *lc_all = setlocale(LC_ALL, "");
	if(lc_all == NULL)
	{
		fprintf(stderr, "%s: warning: Failed loading locales. setlocale(LC_ALL, \"\"): %s\n", argv0, strerror(errno));
	}
	errno = 0;
	if (getenv("EXPR_COMPAT") != NULL
	    || getenv("POSIXLY_CORRECT") != NULL) {
		av = argv + 1;
		nonposix = 1;
	} else {
		while ((c = getopt_nolong(argc, argv, ":e")) != -1) {
			switch (c) {
			case 'e':
				nonposix = 1;
				break;
			case ':':
				utils_errx(1, "Missing operand for option: '-%c'", optopt);
				break;
			case '?':
				utils_errx(1, "Unrecognised option: '-%c'", optopt);
				break;
			default:
				abort();
			}
		}
		av = argv + optind;
	}
	yyparse();
	assert(result);
	if (result->type == integer)
		printf("%jd\n", result->u.i);
	else
		printf("%s\n", result->u.s);
	int err = is_zero_or_null(result);
	free_value(result);
	return err;
}
static int
yyerror(const char *s)
{
	utils_errx(ERR_EXIT, "syntax error: %s", s);
}
static struct val *
op_or(struct val *a, struct val *b)
{
	if (!is_zero_or_null(a)) {
		free_value(b);
		return (a);
	}
	free_value(a);
	if (!is_zero_or_null(b))
		return (b);
	free_value(b);
	return (make_integer((intmax_t)0));
}
static struct val *
op_and(struct val *a, struct val *b)
{
	if (is_zero_or_null(a) || is_zero_or_null(b)) {
		free_value(a);
		free_value(b);
		return (make_integer((intmax_t)0));
	} else {
		free_value(b);
		return (a);
	}
}
static int
compare_vals(struct val *a, struct val *b)
{
	int r;
	if (is_string(a) || is_string(b)) {
		to_string(a);
		to_string(b);
		r = strcoll(a->u.s, b->u.s);
	} else {
		assert_to_integer(a);
		assert_to_integer(b);
		if (a->u.i > b->u.i)
			r = 1;
		else if (a->u.i < b->u.i)
			r = -1;
		else
			r = 0;
	}
	free_value(a);
	free_value(b);
	return (r);
}
static struct val *
op_eq(struct val *a, struct val *b)
{
	return (make_integer((intmax_t)(compare_vals(a, b) == 0)));
}
static struct val *
op_gt(struct val *a, struct val *b)
{
	return (make_integer((intmax_t)(compare_vals(a, b) > 0)));
}
static struct val *
op_lt(struct val *a, struct val *b)
{
	return (make_integer((intmax_t)(compare_vals(a, b) < 0)));
}
static struct val *
op_ge(struct val *a, struct val *b)
{
	return (make_integer((intmax_t)(compare_vals(a, b) >= 0)));
}
static struct val *
op_le(struct val *a, struct val *b)
{
	return (make_integer((intmax_t)(compare_vals(a, b) <= 0)));
}
static struct val *
op_ne(struct val *a, struct val *b)
{
	return (make_integer((intmax_t)(compare_vals(a, b) != 0)));
}
static void
assert_plus(intmax_t a, intmax_t b, intmax_t r)
{
	/*
	 * sum of two positive numbers must be positive,
	 * sum of two negative numbers must be negative
	 */
	if ((a > 0 && b > 0 && r <= 0) ||
	    (a < 0 && b < 0 && r >= 0))
		utils_errx(ERR_EXIT, "overflow");
}
static struct val *
op_plus(struct val *a, struct val *b)
{
	struct val *r;
	assert_to_integer(a);
	assert_to_integer(b);
	r = make_integer(a->u.i + b->u.i);
	assert_plus(a->u.i, b->u.i, r->u.i);
	free_value(a);
	free_value(b);
	return (r);
}
static void
assert_minus(intmax_t a, intmax_t b, intmax_t r)
{
	if ((a >= 0 && b < 0 && r <= 0) ||
	    (a < 0 && b > 0 && r >= 0))
		utils_errx(ERR_EXIT, "overflow");
}
static struct val *
op_minus(struct val *a, struct val *b)
{
	struct val *r;
	assert_to_integer(a);
	assert_to_integer(b);
	r = make_integer(a->u.i - b->u.i);
	assert_minus(a->u.i, b->u.i, r->u.i);
	free_value(a);
	free_value(b);
	return (r);
}
/*
 * We depend on undefined behaviour giving a result (in r).
 * To test this result, pass it as volatile.  This prevents
 * optimizing away of the test based on the undefined behaviour.
 */
static void
assert_times(intmax_t a, intmax_t b, volatile intmax_t r)
{
	/*
	 * If the first operand is 0, no overflow is possible, 
	 * else the result of the division test must match the
	 * second operand.
	 *
	 * Be careful to avoid overflow in the overflow test, as
	 * in assert_div().  Overflow in division would kill us
	 * with a SIGFPE before getting the test wrong.  In old
	 * buggy versions, optimization used to give a null test
	 * instead of a SIGFPE.
	 */
	if ((a == -1 && b == INTMAX_MIN) || (a != 0 && r / a != b))
		utils_errx(ERR_EXIT, "overflow");
}
static struct val *
op_times(struct val *a, struct val *b)
{
	struct val *r;
	assert_to_integer(a);
	assert_to_integer(b);
	r = make_integer(a->u.i * b->u.i);
	assert_times(a->u.i, b->u.i, r->u.i);
	free_value(a);
	free_value(b);
	return (r);
}
static void
assert_div(intmax_t a, intmax_t b)
{
	if (b == 0)
		utils_errx(ERR_EXIT, "division by zero");
	/* only INTMAX_MIN / -1 causes overflow */
	if (a == INTMAX_MIN && b == -1)
		utils_errx(ERR_EXIT, "overflow");
}
static struct val *
op_div(struct val *a, struct val *b)
{
	struct val *r;
	assert_to_integer(a);
	assert_to_integer(b);
	/* assert based on operands only, not on result */
	assert_div(a->u.i, b->u.i);
	r = make_integer(a->u.i / b->u.i);
	free_value(a);
	free_value(b);
	return (r);
}
static struct val *
op_rem(struct val *a, struct val *b)
{
	struct val *r;
	assert_to_integer(a);
	assert_to_integer(b);
	/* pass a=1 to only check for div by zero */
	assert_div(1, b->u.i);
	r = make_integer(a->u.i % b->u.i);
	free_value(a);
	free_value(b);
	return (r);
}
static struct val *
op_colon(struct val *a, struct val *b)
{
	regex_t rp;
	regmatch_t rm[2];
	char errbuf[256];
	int eval;
	struct val *v;
	/* coerce both arguments to strings */
	to_string(a);
	to_string(b);
	/* compile regular expression */
	if ((eval = regcomp(&rp, b->u.s, 0)) != 0) {
		regerror(eval, &rp, errbuf, sizeof(errbuf));
		utils_errx(ERR_EXIT, "%s", errbuf);
	}
	/* compare string against pattern */
	/* remember that patterns are anchored to the beginning of the line */
	if (regexec(&rp, a->u.s, (size_t)2, rm, 0) == 0 && rm[0].rm_so == 0)
		if (rm[1].rm_so >= 0) {
			*(a->u.s + rm[1].rm_eo) = '\0';
			v = make_str(a->u.s + rm[1].rm_so);
		} else
			v = make_integer((intmax_t)(rm[0].rm_eo));
	else
		if (rp.re_nsub == 0)
			v = make_integer((intmax_t)0);
		else
			v = make_str("");
	/* free arguments and pattern buffer */
	free_value(a);
	free_value(b);
	regfree(&rp);
	return (v);
}