expr.y (12256B)
- %{
- // SPDX-License-Identifier: 0BSD
- // Copyright Pace Willisson (pace@blitz.com), J.T. Conklin (jtc@wimsey.com)
- /*-
- * Written by Pace Willisson (pace@blitz.com)
- * and placed in the public domain.
- *
- * Largely rewritten by J.T. Conklin (jtc@wimsey.com)
- */
- /*
- * Warning: OpenBSD yacc prints the following at the very beginning:
- * #include <string.h>
- * #include <stdlib.h>
- */
- #include <assert.h>
- #include <sys/types.h>
- #include <ctype.h>
- #include <err.h>
- #include <errno.h>
- #include <inttypes.h>
- #include <limits.h>
- #include <locale.h>
- #include <stdio.h>
- #include <stdlib.h>
- #include <string.h>
- #include <regex.h>
- #include <unistd.h>
- /*
- * POSIX specifies a specific error code for syntax errors. We exit
- * with this code for all errors.
- */
- #define ERR_EXIT 2
- enum valtype {
- integer, numeric_string, string
- } ;
- struct val {
- enum valtype type;
- union {
- char *s;
- intmax_t i;
- } u;
- } ;
- char **av;
- int nonposix;
- struct val *result;
- static void assert_to_integer(struct val *);
- static void assert_div(intmax_t, intmax_t);
- static void assert_minus(intmax_t, intmax_t, intmax_t);
- static void assert_plus(intmax_t, intmax_t, intmax_t);
- static void assert_times(intmax_t, intmax_t, intmax_t);
- static int compare_vals(struct val *, struct val *);
- static void free_value(struct val *);
- static int is_integer(const char *);
- static int is_string(struct val *);
- static int is_zero_or_null(struct val *);
- static struct val *make_integer(intmax_t);
- static struct val *make_str(const char *);
- static struct val *op_and(struct val *, struct val *);
- static struct val *op_colon(struct val *, struct val *);
- static struct val *op_div(struct val *, struct val *);
- static struct val *op_eq(struct val *, struct val *);
- static struct val *op_ge(struct val *, struct val *);
- static struct val *op_gt(struct val *, struct val *);
- static struct val *op_le(struct val *, struct val *);
- static struct val *op_lt(struct val *, struct val *);
- static struct val *op_minus(struct val *, struct val *);
- static struct val *op_ne(struct val *, struct val *);
- static struct val *op_or(struct val *, struct val *);
- static struct val *op_plus(struct val *, struct val *);
- static struct val *op_rem(struct val *, struct val *);
- static struct val *op_times(struct val *, struct val *);
- static int to_integer(struct val *);
- static void to_string(struct val *);
- #define YYERROR_IS_DECLARED
- static int yyerror(const char *);
- static int yylex(void);
- %}
- %union
- {
- struct val *val;
- }
- %left <val> '|'
- %left <val> '&'
- %left <val> '=' '>' '<' GE LE NE
- %left <val> '+' '-'
- %left <val> '*' '/' '%'
- %left <val> ':'
- %token <val> TOKEN
- %type <val> start expr
- %%
- start: expr { result = $$; }
- expr: TOKEN
- | '(' expr ')' { $$ = $2; }
- | expr '|' expr { $$ = op_or($1, $3); }
- | expr '&' expr { $$ = op_and($1, $3); }
- | expr '=' expr { $$ = op_eq($1, $3); }
- | expr '>' expr { $$ = op_gt($1, $3); }
- | expr '<' expr { $$ = op_lt($1, $3); }
- | expr GE expr { $$ = op_ge($1, $3); }
- | expr LE expr { $$ = op_le($1, $3); }
- | expr NE expr { $$ = op_ne($1, $3); }
- | expr '+' expr { $$ = op_plus($1, $3); }
- | expr '-' expr { $$ = op_minus($1, $3); }
- | expr '*' expr { $$ = op_times($1, $3); }
- | expr '/' expr { $$ = op_div($1, $3); }
- | expr '%' expr { $$ = op_rem($1, $3); }
- | expr ':' expr { $$ = op_colon($1, $3); }
- ;
- %%
- static struct val *
- make_integer(intmax_t i)
- {
- struct val *vp;
- vp = (struct val *)malloc(sizeof(*vp));
- if (vp == NULL)
- errx(ERR_EXIT, "error: malloc(vp) failed");
- vp->type = integer;
- vp->u.i = i;
- return (vp);
- }
- static struct val *
- make_str(const char *s)
- {
- struct val *vp;
- vp = (struct val *)malloc(sizeof(*vp));
- if (vp == NULL)
- errx(ERR_EXIT, "error: malloc(vp) failed");
- if ((vp->u.s = strdup(s)) == NULL)
- errx(ERR_EXIT, "error: strdup(s) failed");
- if (is_integer(s))
- vp->type = numeric_string;
- else
- vp->type = string;
- return (vp);
- }
- static void
- free_value(struct val *vp)
- {
- if (vp->type == string || vp->type == numeric_string)
- free(vp->u.s);
- if (vp->type == string || vp->type == numeric_string || vp->type == integer)
- free(vp);
- }
- static int
- to_integer(struct val *vp)
- {
- intmax_t i;
- /* we can only convert numeric_string to integer, here */
- if (vp->type == numeric_string) {
- errno = 0;
- i = strtoimax(vp->u.s, (char **)NULL, 10);
- /* just keep as numeric_string, if the conversion fails */
- if (errno != ERANGE) {
- free(vp->u.s);
- vp->u.i = i;
- vp->type = integer;
- }
- }
- return (vp->type == integer);
- }
- static void
- assert_to_integer(struct val *vp)
- {
- if (vp->type == string)
- errx(ERR_EXIT, "error: not a decimal number: '%s'", vp->u.s);
- if (!to_integer(vp))
- errx(ERR_EXIT, "error: operand too large: '%s'", vp->u.s);
- }
- static void
- to_string(struct val *vp)
- {
- char *tmp;
- if (vp->type == string || vp->type == numeric_string)
- return;
- /*
- * log_10(x) ~= 0.3 * log_2(x). Rounding up gives the number
- * of digits; add one each for the sign and terminating null
- * character, respectively.
- */
- #define NDIGITS(x) (3 * (sizeof(x) * CHAR_BIT) / 10 + 1 + 1 + 1)
- tmp = malloc(NDIGITS(vp->u.i));
- if (tmp == NULL)
- errx(ERR_EXIT, "error: malloc() failed");
- sprintf(tmp, "%jd", vp->u.i);
- vp->type = string;
- vp->u.s = tmp;
- }
- static int
- is_integer(const char *s)
- {
- if (nonposix) {
- if (*s == '\0')
- return (1);
- while (isspace((unsigned char)*s))
- s++;
- }
- if (*s == '-' || (nonposix && *s == '+'))
- s++;
- if (*s == '\0')
- return (0);
- while (isdigit((unsigned char)*s))
- s++;
- return (*s == '\0');
- }
- static int
- is_string(struct val *vp)
- {
- /* only TRUE if this string is not a valid integer */
- return (vp->type == string);
- }
- static int
- yylex(void)
- {
- char *p;
- if (*av == NULL)
- return (0);
- p = *av++;
- if (strlen(p) == 1) {
- if (strchr("|&=<>+-*/%:()", *p))
- return (*p);
- } else if (strlen(p) == 2 && p[1] == '=') {
- switch (*p) {
- case '>': return (GE);
- case '<': return (LE);
- case '!': return (NE);
- }
- }
- yylval.val = make_str(p);
- return (TOKEN);
- }
- static int
- is_zero_or_null(struct val *vp)
- {
- if (vp->type == integer)
- return (vp->u.i == 0);
- return (*vp->u.s == 0 || (to_integer(vp) && vp->u.i == 0));
- }
- int
- main(int argc, char *argv[])
- {
- int c;
- setlocale(LC_ALL, "");
- if (getenv("EXPR_COMPAT") != NULL
- || getenv("POSIXLY_CORRECT") != NULL) {
- av = argv + 1;
- nonposix = 1;
- } else {
- while ((c = getopt(argc, argv, ":e")) != -1) {
- switch (c) {
- case 'e':
- nonposix = 1;
- break;
- case ':':
- fprintf(stderr, "expr: error: Missing operand for option: '-%c'\n", optopt);
- break;
- case '?':
- fprintf(stderr, "expr: error: Unrecognised option: '-%c'\n", optopt);
- break;
- default:
- errx(ERR_EXIT,
- "usage: expr [-e] expression\n");
- }
- }
- av = argv + optind;
- }
- yyparse();
- assert(result);
- if (result->type == integer)
- printf("%jd\n", result->u.i);
- else
- printf("%s\n", result->u.s);
- int err = is_zero_or_null(result);
- free_value(result);
- return err;
- }
- static int
- yyerror(const char *s)
- {
- errx(ERR_EXIT, "error: syntax error: %s", s);
- }
- static struct val *
- op_or(struct val *a, struct val *b)
- {
- if (!is_zero_or_null(a)) {
- free_value(b);
- return (a);
- }
- free_value(a);
- if (!is_zero_or_null(b))
- return (b);
- free_value(b);
- return (make_integer((intmax_t)0));
- }
- static struct val *
- op_and(struct val *a, struct val *b)
- {
- if (is_zero_or_null(a) || is_zero_or_null(b)) {
- free_value(a);
- free_value(b);
- return (make_integer((intmax_t)0));
- } else {
- free_value(b);
- return (a);
- }
- }
- static int
- compare_vals(struct val *a, struct val *b)
- {
- int r;
- if (is_string(a) || is_string(b)) {
- to_string(a);
- to_string(b);
- r = strcoll(a->u.s, b->u.s);
- } else {
- assert_to_integer(a);
- assert_to_integer(b);
- if (a->u.i > b->u.i)
- r = 1;
- else if (a->u.i < b->u.i)
- r = -1;
- else
- r = 0;
- }
- free_value(a);
- free_value(b);
- return (r);
- }
- static struct val *
- op_eq(struct val *a, struct val *b)
- {
- return (make_integer((intmax_t)(compare_vals(a, b) == 0)));
- }
- static struct val *
- op_gt(struct val *a, struct val *b)
- {
- return (make_integer((intmax_t)(compare_vals(a, b) > 0)));
- }
- static struct val *
- op_lt(struct val *a, struct val *b)
- {
- return (make_integer((intmax_t)(compare_vals(a, b) < 0)));
- }
- static struct val *
- op_ge(struct val *a, struct val *b)
- {
- return (make_integer((intmax_t)(compare_vals(a, b) >= 0)));
- }
- static struct val *
- op_le(struct val *a, struct val *b)
- {
- return (make_integer((intmax_t)(compare_vals(a, b) <= 0)));
- }
- static struct val *
- op_ne(struct val *a, struct val *b)
- {
- return (make_integer((intmax_t)(compare_vals(a, b) != 0)));
- }
- static void
- assert_plus(intmax_t a, intmax_t b, intmax_t r)
- {
- /*
- * sum of two positive numbers must be positive,
- * sum of two negative numbers must be negative
- */
- if ((a > 0 && b > 0 && r <= 0) ||
- (a < 0 && b < 0 && r >= 0))
- errx(ERR_EXIT, "error: overflow");
- }
- static struct val *
- op_plus(struct val *a, struct val *b)
- {
- struct val *r;
- assert_to_integer(a);
- assert_to_integer(b);
- r = make_integer(a->u.i + b->u.i);
- assert_plus(a->u.i, b->u.i, r->u.i);
- free_value(a);
- free_value(b);
- return (r);
- }
- static void
- assert_minus(intmax_t a, intmax_t b, intmax_t r)
- {
- if ((a >= 0 && b < 0 && r <= 0) ||
- (a < 0 && b > 0 && r >= 0))
- errx(ERR_EXIT, "error: overflow");
- }
- static struct val *
- op_minus(struct val *a, struct val *b)
- {
- struct val *r;
- assert_to_integer(a);
- assert_to_integer(b);
- r = make_integer(a->u.i - b->u.i);
- assert_minus(a->u.i, b->u.i, r->u.i);
- free_value(a);
- free_value(b);
- return (r);
- }
- /*
- * We depend on undefined behaviour giving a result (in r).
- * To test this result, pass it as volatile. This prevents
- * optimizing away of the test based on the undefined behaviour.
- */
- static void
- assert_times(intmax_t a, intmax_t b, volatile intmax_t r)
- {
- /*
- * If the first operand is 0, no overflow is possible,
- * else the result of the division test must match the
- * second operand.
- *
- * Be careful to avoid overflow in the overflow test, as
- * in assert_div(). Overflow in division would kill us
- * with a SIGFPE before getting the test wrong. In old
- * buggy versions, optimization used to give a null test
- * instead of a SIGFPE.
- */
- if ((a == -1 && b == INTMAX_MIN) || (a != 0 && r / a != b))
- errx(ERR_EXIT, "error: overflow");
- }
- static struct val *
- op_times(struct val *a, struct val *b)
- {
- struct val *r;
- assert_to_integer(a);
- assert_to_integer(b);
- r = make_integer(a->u.i * b->u.i);
- assert_times(a->u.i, b->u.i, r->u.i);
- free_value(a);
- free_value(b);
- return (r);
- }
- static void
- assert_div(intmax_t a, intmax_t b)
- {
- if (b == 0)
- errx(ERR_EXIT, "error: division by zero");
- /* only INTMAX_MIN / -1 causes overflow */
- if (a == INTMAX_MIN && b == -1)
- errx(ERR_EXIT, "error: overflow");
- }
- static struct val *
- op_div(struct val *a, struct val *b)
- {
- struct val *r;
- assert_to_integer(a);
- assert_to_integer(b);
- /* assert based on operands only, not on result */
- assert_div(a->u.i, b->u.i);
- r = make_integer(a->u.i / b->u.i);
- free_value(a);
- free_value(b);
- return (r);
- }
- static struct val *
- op_rem(struct val *a, struct val *b)
- {
- struct val *r;
- assert_to_integer(a);
- assert_to_integer(b);
- /* pass a=1 to only check for div by zero */
- assert_div(1, b->u.i);
- r = make_integer(a->u.i % b->u.i);
- free_value(a);
- free_value(b);
- return (r);
- }
- static struct val *
- op_colon(struct val *a, struct val *b)
- {
- regex_t rp;
- regmatch_t rm[2];
- char errbuf[256];
- int eval;
- struct val *v;
- /* coerce both arguments to strings */
- to_string(a);
- to_string(b);
- /* compile regular expression */
- if ((eval = regcomp(&rp, b->u.s, 0)) != 0) {
- regerror(eval, &rp, errbuf, sizeof(errbuf));
- errx(ERR_EXIT, "error: %s", errbuf);
- }
- /* compare string against pattern */
- /* remember that patterns are anchored to the beginning of the line */
- if (regexec(&rp, a->u.s, (size_t)2, rm, 0) == 0 && rm[0].rm_so == 0)
- if (rm[1].rm_so >= 0) {
- *(a->u.s + rm[1].rm_eo) = '\0';
- v = make_str(a->u.s + rm[1].rm_so);
- } else
- v = make_integer((intmax_t)(rm[0].rm_eo));
- else
- if (rp.re_nsub == 0)
- v = make_integer((intmax_t)0);
- else
- v = make_str("");
- /* free arguments and pattern buffer */
- free_value(a);
- free_value(b);
- regfree(&rp);
- return (v);
- }