diff options
author | Andrew J. Schorr <aschorr@telemetry-investments.com> | 2016-08-09 11:33:27 -0400 |
---|---|---|
committer | Andrew J. Schorr <aschorr@telemetry-investments.com> | 2016-08-09 11:33:27 -0400 |
commit | 3cf67f58ce8e42f9ce8d7be45936eedf79751b46 (patch) | |
tree | 449f8c9cc41797a23eb9502b4ed521525a43c183 /int_array.c | |
parent | 560cf6d52f978e360e9b2a10f7ddd9a0197e0b31 (diff) | |
download | egawk-3cf67f58ce8e42f9ce8d7be45936eedf79751b46.tar.gz egawk-3cf67f58ce8e42f9ce8d7be45936eedf79751b46.tar.bz2 egawk-3cf67f58ce8e42f9ce8d7be45936eedf79751b46.zip |
If a strnum integer has a non-standard string representation, do not accept it as an integer array subscript.
Diffstat (limited to 'int_array.c')
-rw-r--r-- | int_array.c | 70 |
1 files changed, 65 insertions, 5 deletions
diff --git a/int_array.c b/int_array.c index a8de3d55..1fa32bd7 100644 --- a/int_array.c +++ b/int_array.c @@ -78,27 +78,86 @@ int_array_init(NODE *symbol, NODE *subs ATTRIBUTE_UNUSED) return & success_node; } +/* + * standard_integer_string -- check whether the string matches what + * sprintf("%ld", <value>) would produce. This is accomplished by accepting + * only strings that look like /^0$/ or /^-?[1-9][0-9]*$/. This should be + * faster than comparing vs. the results of actually calling sprintf. + */ + +static bool +standard_integer_string(const char *s, size_t len) +{ + const char *end; + + if (len == 0) + return false; + if (*s == '0' && len == 1) + return true; + end = s + len; + /* ignore leading minus sign */ + if (*s == '-' && ++s == end) + return false; + /* check first char is [1-9] */ + if (*s < '1' || *s > '9') + return false; + while (++s < end) { + if (*s < '0' || *s > '9') + return false; + } + return true; +} + /* is_integer --- check if subscript is an integer */ NODE ** is_integer(NODE *symbol, NODE *subs) { +#ifndef CHECK_INTEGER_USING_FORCE_NUMBER long l; +#endif AWKNUM d; + if ((subs->flags & NUMINT) != 0) + /* quick exit */ + return & success_node; + if (subs == Nnull_string || do_mpfr) return NULL; - if ((subs->flags & NUMINT) != 0) - return & success_node; +#ifdef CHECK_INTEGER_USING_FORCE_NUMBER + /* + * This approach is much simpler, because we remove all of the strtol + * logic below. But this may be slower in some usage cases. + */ + if ((subs->flags & NUMCUR) == 0) { + str2number(subs); - if ((subs->flags & NUMBER) != 0) { + /* check again in case force_number set NUMINT */ + if ((subs->flags & NUMINT) != 0) + return & success_node; + } +#else /* CHECK_INTEGER_USING_FORCE_NUMBER */ + if ((subs->flags & NUMCUR) != 0) { +#endif /* CHECK_INTEGER_USING_FORCE_NUMBER */ d = subs->numbr; if (d <= INT32_MAX && d >= INT32_MIN && d == (int32_t) d) { - subs->flags |= NUMINT; - return & success_node; + /* + * the numeric value is an integer, but we must + * protect against strings that cannot be generated + * from sprintf("%ld", <subscript>). This can happen + * with strnum or string values. We could skip this + * check for pure NUMBER values, but unfortunately the + * code does not currently distinguish between NUMBER + * and strnum values. + */ + if ((subs->flags & STRCUR) == 0 || standard_integer_string(subs->stptr, subs->stlen)) { + subs->flags |= NUMINT; + return & success_node; + } } return NULL; +#ifndef CHECK_INTEGER_USING_FORCE_NUMBER } /* a[3]=1; print "3" in a -- true @@ -151,6 +210,7 @@ is_integer(NODE *symbol, NODE *subs) } } return NULL; +#endif /* CHECK_INTEGER_USING_FORCE_NUMBER */ } |