305 lines
8.4 KiB
C
305 lines
8.4 KiB
C
|
/**
|
||
|
* @file parse_number.h
|
||
|
* @author Ambroz Bizjak <ambrop7@gmail.com>
|
||
|
*
|
||
|
* @section LICENSE
|
||
|
*
|
||
|
* Redistribution and use in source and binary forms, with or without
|
||
|
* modification, are permitted provided that the following conditions are met:
|
||
|
* 1. Redistributions of source code must retain the above copyright
|
||
|
* notice, this list of conditions and the following disclaimer.
|
||
|
* 2. Redistributions in binary form must reproduce the above copyright
|
||
|
* notice, this list of conditions and the following disclaimer in the
|
||
|
* documentation and/or other materials provided with the distribution.
|
||
|
* 3. Neither the name of the author nor the
|
||
|
* names of its contributors may be used to endorse or promote products
|
||
|
* derived from this software without specific prior written permission.
|
||
|
*
|
||
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
||
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
||
|
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||
|
* DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
|
||
|
* DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
||
|
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
||
|
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
|
||
|
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
||
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||
|
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||
|
*
|
||
|
* @section DESCRIPTION
|
||
|
*
|
||
|
* Numeric string parsing.
|
||
|
*/
|
||
|
|
||
|
#ifndef BADVPN_MISC_PARSE_NUMBER_H
|
||
|
#define BADVPN_MISC_PARSE_NUMBER_H
|
||
|
|
||
|
#include <stdint.h>
|
||
|
#include <string.h>
|
||
|
#include <stddef.h>
|
||
|
#include <limits.h>
|
||
|
|
||
|
#include <misc/debug.h>
|
||
|
#include <misc/cstring.h>
|
||
|
|
||
|
// public parsing functions
|
||
|
static int decode_decimal_digit (char c);
|
||
|
static int decode_hex_digit (char c);
|
||
|
static int parse_unsigned_integer_bin (const char *str, size_t str_len, uintmax_t *out) WARN_UNUSED;
|
||
|
static int parse_unsigned_integer (const char *str, uintmax_t *out) WARN_UNUSED;
|
||
|
static int parse_unsigned_integer_cstr (b_cstring cstr, size_t offset, size_t length, uintmax_t *out) WARN_UNUSED;
|
||
|
static int parse_unsigned_hex_integer_bin (const char *str, size_t str_len, uintmax_t *out) WARN_UNUSED;
|
||
|
static int parse_unsigned_hex_integer (const char *str, uintmax_t *out) WARN_UNUSED;
|
||
|
static int parse_signmag_integer_bin (const char *str, size_t str_len, int *out_sign, uintmax_t *out_mag) WARN_UNUSED;
|
||
|
static int parse_signmag_integer (const char *str, int *out_sign, uintmax_t *out_mag) WARN_UNUSED;
|
||
|
static int parse_signmag_integer_cstr (b_cstring cstr, size_t offset, size_t length, int *out_sign, uintmax_t *out_mag) WARN_UNUSED;
|
||
|
|
||
|
// public generation functions
|
||
|
static int compute_decimal_repr_size (uintmax_t x);
|
||
|
static void generate_decimal_repr (uintmax_t x, char *out, int repr_size);
|
||
|
static int generate_decimal_repr_string (uintmax_t x, char *out);
|
||
|
|
||
|
// implementation follows
|
||
|
|
||
|
// decimal representation of UINTMAX_MAX
|
||
|
static const char parse_number__uintmax_max_str[] = "18446744073709551615";
|
||
|
|
||
|
// make sure UINTMAX_MAX is what we think it is
|
||
|
static const char parse_number__uintmax_max_str_assert[(UINTMAX_MAX == UINTMAX_C(18446744073709551615)) ? 1 : -1];
|
||
|
|
||
|
static int decode_decimal_digit (char c)
|
||
|
{
|
||
|
switch (c) {
|
||
|
case '0': return 0;
|
||
|
case '1': return 1;
|
||
|
case '2': return 2;
|
||
|
case '3': return 3;
|
||
|
case '4': return 4;
|
||
|
case '5': return 5;
|
||
|
case '6': return 6;
|
||
|
case '7': return 7;
|
||
|
case '8': return 8;
|
||
|
case '9': return 9;
|
||
|
}
|
||
|
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
static int decode_hex_digit (char c)
|
||
|
{
|
||
|
switch (c) {
|
||
|
case '0': return 0;
|
||
|
case '1': return 1;
|
||
|
case '2': return 2;
|
||
|
case '3': return 3;
|
||
|
case '4': return 4;
|
||
|
case '5': return 5;
|
||
|
case '6': return 6;
|
||
|
case '7': return 7;
|
||
|
case '8': return 8;
|
||
|
case '9': return 9;
|
||
|
case 'A': case 'a': return 10;
|
||
|
case 'B': case 'b': return 11;
|
||
|
case 'C': case 'c': return 12;
|
||
|
case 'D': case 'd': return 13;
|
||
|
case 'E': case 'e': return 14;
|
||
|
case 'F': case 'f': return 15;
|
||
|
}
|
||
|
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
static int parse__no_overflow (const char *str, size_t str_len, uintmax_t *out)
|
||
|
{
|
||
|
uintmax_t n = 0;
|
||
|
|
||
|
while (str_len > 0) {
|
||
|
if (*str < '0' || *str > '9') {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
n = 10 * n + (*str - '0');
|
||
|
|
||
|
str++;
|
||
|
str_len--;
|
||
|
}
|
||
|
|
||
|
*out = n;
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
int parse_unsigned_integer_bin (const char *str, size_t str_len, uintmax_t *out)
|
||
|
{
|
||
|
// we do not allow empty strings
|
||
|
if (str_len == 0) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
// remove leading zeros
|
||
|
while (str_len > 0 && *str == '0') {
|
||
|
str++;
|
||
|
str_len--;
|
||
|
}
|
||
|
|
||
|
// detect overflow
|
||
|
if (str_len > sizeof(parse_number__uintmax_max_str) - 1 ||
|
||
|
(str_len == sizeof(parse_number__uintmax_max_str) - 1 && memcmp(str, parse_number__uintmax_max_str, sizeof(parse_number__uintmax_max_str) - 1) > 0)) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
// will not overflow (but can still have invalid characters)
|
||
|
return parse__no_overflow(str, str_len, out);
|
||
|
}
|
||
|
|
||
|
int parse_unsigned_integer (const char *str, uintmax_t *out)
|
||
|
{
|
||
|
return parse_unsigned_integer_bin(str, strlen(str), out);
|
||
|
}
|
||
|
|
||
|
int parse_unsigned_integer_cstr (b_cstring cstr, size_t offset, size_t length, uintmax_t *out)
|
||
|
{
|
||
|
b_cstring_assert_range(cstr, offset, length);
|
||
|
|
||
|
if (length == 0) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
uintmax_t n = 0;
|
||
|
|
||
|
B_CSTRING_LOOP_RANGE(cstr, offset, length, pos, chunk_data, chunk_length, {
|
||
|
for (size_t i = 0; i < chunk_length; i++) {
|
||
|
int digit = decode_decimal_digit(chunk_data[i]);
|
||
|
if (digit < 0) {
|
||
|
return 0;
|
||
|
}
|
||
|
if (n > UINTMAX_MAX / 10) {
|
||
|
return 0;
|
||
|
}
|
||
|
n *= 10;
|
||
|
if (digit > UINTMAX_MAX - n) {
|
||
|
return 0;
|
||
|
}
|
||
|
n += digit;
|
||
|
}
|
||
|
})
|
||
|
|
||
|
*out = n;
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
int parse_unsigned_hex_integer_bin (const char *str, size_t str_len, uintmax_t *out)
|
||
|
{
|
||
|
uintmax_t n = 0;
|
||
|
|
||
|
if (str_len == 0) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
while (str_len > 0) {
|
||
|
int digit = decode_hex_digit(*str);
|
||
|
if (digit < 0) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
if (n > UINTMAX_MAX / 16) {
|
||
|
return 0;
|
||
|
}
|
||
|
n *= 16;
|
||
|
|
||
|
if (digit > UINTMAX_MAX - n) {
|
||
|
return 0;
|
||
|
}
|
||
|
n += digit;
|
||
|
|
||
|
str++;
|
||
|
str_len--;
|
||
|
}
|
||
|
|
||
|
*out = n;
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
int parse_unsigned_hex_integer (const char *str, uintmax_t *out)
|
||
|
{
|
||
|
return parse_unsigned_hex_integer_bin(str, strlen(str), out);
|
||
|
}
|
||
|
|
||
|
int parse_signmag_integer_bin (const char *str, size_t str_len, int *out_sign, uintmax_t *out_mag)
|
||
|
{
|
||
|
int sign = 1;
|
||
|
if (str_len > 0 && (str[0] == '+' || str[0] == '-')) {
|
||
|
sign = 1 - 2 * (str[0] == '-');
|
||
|
str++;
|
||
|
str_len--;
|
||
|
}
|
||
|
|
||
|
if (!parse_unsigned_integer_bin(str, str_len, out_mag)) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
*out_sign = sign;
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
int parse_signmag_integer (const char *str, int *out_sign, uintmax_t *out_mag)
|
||
|
{
|
||
|
return parse_signmag_integer_bin(str, strlen(str), out_sign, out_mag);
|
||
|
}
|
||
|
|
||
|
int parse_signmag_integer_cstr (b_cstring cstr, size_t offset, size_t length, int *out_sign, uintmax_t *out_mag)
|
||
|
{
|
||
|
b_cstring_assert_range(cstr, offset, length);
|
||
|
|
||
|
int sign = 1;
|
||
|
if (length > 0 && (b_cstring_at(cstr, offset) == '+' || b_cstring_at(cstr, offset) == '-')) {
|
||
|
sign = 1 - 2 * (b_cstring_at(cstr, offset) == '-');
|
||
|
offset++;
|
||
|
length--;
|
||
|
}
|
||
|
|
||
|
if (!parse_unsigned_integer_cstr(cstr, offset, length, out_mag)) {
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
*out_sign = sign;
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
int compute_decimal_repr_size (uintmax_t x)
|
||
|
{
|
||
|
int size = 0;
|
||
|
|
||
|
do {
|
||
|
size++;
|
||
|
x /= 10;
|
||
|
} while (x > 0);
|
||
|
|
||
|
return size;
|
||
|
}
|
||
|
|
||
|
void generate_decimal_repr (uintmax_t x, char *out, int repr_size)
|
||
|
{
|
||
|
ASSERT(out)
|
||
|
ASSERT(repr_size == compute_decimal_repr_size(x))
|
||
|
|
||
|
out += repr_size;
|
||
|
|
||
|
do {
|
||
|
*(--out) = '0' + (x % 10);
|
||
|
x /= 10;
|
||
|
} while (x > 0);
|
||
|
}
|
||
|
|
||
|
int generate_decimal_repr_string (uintmax_t x, char *out)
|
||
|
{
|
||
|
ASSERT(out)
|
||
|
|
||
|
int repr_size = compute_decimal_repr_size(x);
|
||
|
generate_decimal_repr(x, out, repr_size);
|
||
|
out[repr_size] = '\0';
|
||
|
|
||
|
return repr_size;
|
||
|
}
|
||
|
|
||
|
#endif
|