banan-os/userspace/libraries/LibC/printf_impl.cpp

632 lines
14 KiB
C++

#include <BAN/Traits.h>
#include <BAN/Math.h>
#include <bits/printf.h>
#include <ctype.h>
#include <errno.h>
#include <math.h>
#include <stdio.h>
#include <string.h>
#define BAN_PRINTF_PUTC(c) \
do \
{ \
if (putc_fun((c), data) == EOF) \
return -1; \
written++; \
} while (false)
enum class length_t
{
none,
hh,
h,
l,
ll,
j,
z,
t,
L,
};
struct format_options_t
{
bool alternate_form { false };
bool zero_padded { false };
bool left_justified { false };
bool show_plus_sign_as_space { false };
bool show_plus_sign { false };
int width { -1 };
int percision { -1 };
length_t length { length_t::none };
};
template<BAN::integral T>
static void integer_to_string(char* buffer, T value, int base, bool upper, format_options_t options)
{
int digits = 1;
if (options.percision != -1)
{
digits = options.percision;
options.zero_padded = false;
}
if (value == 0 && options.alternate_form)
{
if (digits == 0 && base == 8)
digits = 1;
for (int i = 0; i < digits; i++)
buffer[i] = '0';
buffer[digits] = '\0';
return;
}
auto digit_char = [](int digit, bool upper)
{
if (digit < 10)
return '0' + digit;
return (upper ? 'A' : 'a') + (digit - 10);
};
int offset = 0;
int prefix_length = 0;
char prefix[2] {};
if constexpr(BAN::is_signed_v<T>)
{
prefix_length = 1;
if (value < 0)
{
prefix[0] = '-';
buffer[offset++] = digit_char(-(value % base), upper);
value = -(value / base);
}
else if (options.show_plus_sign)
prefix[0] = '+';
else if (options.show_plus_sign_as_space)
prefix[0] = ' ';
else
prefix_length = 0;
}
else
{
if (options.alternate_form && base == 8)
{
prefix_length = 1;
prefix[0] = '0';
digits--;
}
else if (options.alternate_form && base == 16)
{
prefix_length = 2;
prefix[0] = '0';
prefix[1] = 'x';
}
}
while (value || offset < digits)
{
buffer[offset++] = digit_char(value % base, upper);
value /= base;
}
if (options.zero_padded)
{
int zeroes = options.width - prefix_length;
for (int i = offset; i < zeroes; i++)
buffer[offset++] = '0';
}
if (prefix[1]) buffer[offset++] = prefix[1];
if (prefix[0]) buffer[offset++] = prefix[0];
for (int i = 0; i < offset / 2; i++)
{
char temp = buffer[i];
buffer[i] = buffer[offset - i - 1];
buffer[offset - i - 1] = temp;
}
buffer[offset++] = '\0';
}
template<BAN::floating_point T>
static void floating_point_to_string(char* buffer, T value, bool upper, const format_options_t options)
{
int percision = 6;
if (options.percision != -1)
percision = options.percision;
int offset = 0;
// Add sign if needed
if (value < (T)0.0)
{
buffer[offset++] = '-';
value = -value;
}
else if (options.show_plus_sign)
buffer[offset++] = '+';
else if (options.show_plus_sign_as_space)
buffer[offset++] = ' ';
if (isnan(value))
{
strcpy(buffer + offset, upper ? "NAN" : "nan");
return;
}
if (isinf(value))
{
strcpy(buffer + offset, upper ? "INF" : "inf");
return;
}
// Round last digit
value += (T)0.5 * BAN::Math::pow<T>(10.0, -percision);
// Add integer part of the decimal
if (value < (T)1.0)
{
buffer[offset++] = '0';
value *= (T)10.0;
}
else
{
int exponent = (int)BAN::Math::log10<T>(value);
T magnitude = BAN::Math::pow<T>(10, exponent);
value /= magnitude;
for (int i = 0; i <= exponent; i++)
{
int digit = 0;
for (; digit < 10; digit++)
if (value < digit + 1)
break;
buffer[offset++] = '0' + digit;
value -= (T)digit;
value *= (T)10.0;
}
}
// We are done if the decimal part is not written
if (percision == 0 && !options.alternate_form)
{
buffer[offset++] = '\0';
return;
}
buffer[offset++] = '.';
// Add the 'percision' digits after decimal point
for (int i = 0; i < percision; i++)
{
int digit = 0;
for (; digit < 10; digit++)
if (value < digit + 1)
break;
buffer[offset++] = '0' + digit;
value -= (T)digit;
value *= (T)10.0;
}
buffer[offset++] = '\0';
}
template<BAN::floating_point T>
static void floating_point_to_exponent_string(char* buffer, T value, bool upper, const format_options_t options)
{
int offset = 0;
// Add sign if needed
if (value < (T)0.0)
{
buffer[offset++] = '-';
value = -value;
}
else if (options.show_plus_sign)
buffer[offset++] = '+';
else if (options.show_plus_sign_as_space)
buffer[offset++] = ' ';
if (isnan(value))
{
strcpy(buffer + offset, upper ? "NAN" : "nan");
return;
}
if (isinf(value))
{
strcpy(buffer + offset, upper ? "INF" : "inf");
return;
}
// Calculate which number to put as exponent
int exponent = 0;
if (value != (T)0.0)
{
exponent = (int)BAN::Math::log10<T>(value);
value /= BAN::Math::pow<T>(10.0, exponent);
}
// Add first numbers before 'e'
floating_point_to_string<T>(buffer + offset, value, upper, options);
offset = strlen(buffer);
// Add the exponent part
buffer[offset++] = (upper ? 'E' : 'e');
format_options_t exponent_options;
exponent_options.show_plus_sign = true;
exponent_options.zero_padded = true;
exponent_options.width = 3;
integer_to_string<int>(buffer + offset, exponent, 10, upper, exponent_options);
}
extern "C" int printf_impl(const char* format, va_list arguments, int (*putc_fun)(int, void*), void* data)
{
int written = 0;
while (*format)
{
if (*format == '%')
{
format_options_t options;
// PARSE FLAGS
bool flags_done = false;
while (!flags_done)
{
format++;
switch (*format)
{
case '#': options.alternate_form = true; break;
case '0': options.zero_padded = true; break;
case '-': options.left_justified = true; break;
case ' ': options.show_plus_sign_as_space = true; break;
case '+': options.show_plus_sign = true; break;
default:
flags_done = true;
break;
}
}
if (options.zero_padded && options.left_justified)
options.zero_padded = false;
// PARSE FIELD WIDTH
if (*format == '*')
{
options.width = va_arg(arguments, int);
format++;
}
else if (isdigit(*format) && *format != '0')
{
int width = 0;
while (isdigit(*format))
{
width *= 10;
width += *format - '0';
format++;
}
options.width = width;
}
// PARSE PERCISION
if (*format == '.')
{
format++;
int percision = 0;
if (isdigit(*format))
{
while (isdigit(*format))
{
percision *= 10;
percision += *format - '0';
format++;
}
}
else if (*format == '-')
{
percision = -1;
format++;
while (isdigit(*format))
format++;
}
else if (*format == '*')
{
percision = va_arg(arguments, int);
format++;
}
if (percision < 0)
percision = -1;
options.percision = percision;
}
// PARSE LENGTH
if (*format == 'h')
{
if (*(format + 1) == 'h')
{
format++;
options.length = length_t::hh;
}
else
options.length = length_t::h;
}
else if (*format == 'l')
{
if (*(format + 1) == 'l')
{
format++;
options.length = length_t::ll;
}
else
options.length = length_t::l;
}
else if (*format == 'j')
options.length = length_t::j;
else if (*format == 'z')
options.length = length_t::z;
else if (*format == 't')
options.length = length_t::t;
else if (*format == 'L')
options.length = length_t::L;
else
format--;
format++;
// FIXME: this should be thread-local to keep
// satisfy multithreaded requirement
static char conversion[4096];
const char* string = nullptr;
int length = -1;
#define PARSE_INT_CASE(length, type) \
case length_t::length: integer_to_string<type>(conversion, va_arg(arguments, type), BASE_, UPPER_, options); break
#define PARSE_INT_CASE_CAST(length, cast, type) \
case length_t::length: integer_to_string<cast>(conversion, va_arg(arguments, type), BASE_, UPPER_, options); break
#define PARSE_INT_DEFAULT(type) \
default: integer_to_string<type>(conversion, va_arg(arguments, type), BASE_, UPPER_, options); break
switch (*format)
{
case 'd':
case 'i':
{
switch (options.length)
{
#define BASE_ 10
#define UPPER_ false
PARSE_INT_CASE_CAST(hh, signed char, int);
PARSE_INT_CASE_CAST(h, short, int);
PARSE_INT_CASE(l, long);
PARSE_INT_CASE(ll, long long);
PARSE_INT_CASE(j, intmax_t);
PARSE_INT_CASE(z, ssize_t);
PARSE_INT_CASE(t, ptrdiff_t);
PARSE_INT_DEFAULT(int);
#undef BASE_
#undef UPPER_
}
string = conversion;
format++;
break;
}
case 'o':
{
switch (options.length)
{
#define BASE_ 8
#define UPPER_ false
PARSE_INT_CASE_CAST(hh, unsigned char, unsigned int);
PARSE_INT_CASE_CAST(h, unsigned short, unsigned int);
PARSE_INT_CASE(l, unsigned long);
PARSE_INT_CASE(ll, unsigned long long);
PARSE_INT_CASE(j, uintmax_t);
PARSE_INT_CASE(z, size_t);
PARSE_INT_CASE(t, uintptr_t);
PARSE_INT_DEFAULT(unsigned int);
#undef BASE_
#undef UPPER_
}
string = conversion;
format++;
break;
}
case 'u':
{
switch (options.length)
{
#define BASE_ 10
#define UPPER_ false
PARSE_INT_CASE_CAST(hh, unsigned char, unsigned int);
PARSE_INT_CASE_CAST(h, unsigned short, unsigned int);
PARSE_INT_CASE(l, unsigned long);
PARSE_INT_CASE(ll, unsigned long long);
PARSE_INT_CASE(j, uintmax_t);
PARSE_INT_CASE(z, size_t);
PARSE_INT_CASE(t, uintptr_t);
PARSE_INT_DEFAULT(unsigned int);
#undef BASE_
#undef UPPER_
}
string = conversion;
format++;
break;
}
case 'x':
{
switch (options.length)
{
#define BASE_ 16
#define UPPER_ false
PARSE_INT_CASE_CAST(hh, unsigned char, unsigned int);
PARSE_INT_CASE_CAST(h, unsigned short, unsigned int);
PARSE_INT_CASE(l, unsigned long);
PARSE_INT_CASE(ll, unsigned long long);
PARSE_INT_CASE(j, uintmax_t);
PARSE_INT_CASE(z, size_t);
PARSE_INT_CASE(t, uintptr_t);
PARSE_INT_DEFAULT(unsigned int);
#undef BASE_
#undef UPPER_
}
string = conversion;
format++;
break;
}
case 'X':
{
switch (options.length)
{
#define BASE_ 16
#define UPPER_ true
PARSE_INT_CASE_CAST(hh, unsigned char, unsigned int);
PARSE_INT_CASE_CAST(h, unsigned short, unsigned int);
PARSE_INT_CASE(l, unsigned long);
PARSE_INT_CASE(ll, unsigned long long);
PARSE_INT_CASE(j, uintmax_t);
PARSE_INT_CASE(z, size_t);
PARSE_INT_CASE(t, uintptr_t);
PARSE_INT_DEFAULT(unsigned int);
#undef BASE_
#undef UPPER_
}
string = conversion;
format++;
break;
}
case 'e':
case 'E':
{
switch (options.length)
{
case length_t::L: floating_point_to_exponent_string<long double> (conversion, va_arg(arguments, long double), *format == 'E', options); break;
default: floating_point_to_exponent_string<double> (conversion, va_arg(arguments, double), *format == 'E', options); break;
}
string = conversion;
format++;
break;
}
case 'f':
case 'F':
{
switch (options.length)
{
case length_t::L: floating_point_to_string<long double> (conversion, va_arg(arguments, long double), *format == 'F', options); break;
default: floating_point_to_string<double> (conversion, va_arg(arguments, double), *format == 'F', options); break;
}
string = conversion;
format++;
break;
}
case 'g':
case 'G':
// TODO
break;
case 'a':
case 'A':
// TODO
break;
case 'c':
{
conversion[0] = va_arg(arguments, int);
conversion[1] = '\0';
string = conversion;
format++;
break;
}
case 's':
{
string = va_arg(arguments, const char*);
if (options.percision != -1)
{
length = 0;
while (string[length] && length < options.percision)
length++;
}
format++;
break;
}
case 'C':
// TODO (depricated)
break;
case 'S':
// TODO (depricated)
break;
case 'p':
{
void* ptr = va_arg(arguments, void*);
options.alternate_form = true;
integer_to_string<uintptr_t>(conversion, (uintptr_t)ptr, 16, false, options);
string = conversion;
format++;
break;
}
case 'n':
{
switch (options.length)
{
case length_t::hh: *va_arg(arguments, signed char*) = written; break;
case length_t::h: *va_arg(arguments, short*) = written; break;
case length_t::l: *va_arg(arguments, long*) = written; break;
case length_t::ll: *va_arg(arguments, long long*) = written; break;
case length_t::j: *va_arg(arguments, intmax_t*) = written; break;
case length_t::z: *va_arg(arguments, ssize_t*) = written; break;
case length_t::t: *va_arg(arguments, ptrdiff_t*) = written; break;
default: *va_arg(arguments, int*) = written; break;
}
format++;
break;
}
case 'm':
{
// NOTE: this is a glibc extension
// NOTE: syslog() requires %m to be handled
if (options.alternate_form)
string = strerrorname_np(errno);
else
string = strerror(errno);
format++;
break;
}
case '%':
{
conversion[0] = '%';
conversion[1] = '\0';
string = conversion;
format++;
break;
}
default:
break;
}
if (string)
{
if (length == -1)
length = strlen(string);
if (options.width == -1)
options.width = 0;
if (!options.left_justified)
for (int i = length; i < options.width; i++)
BAN_PRINTF_PUTC(' ');
for (int i = 0; i < length && string[i]; i++)
BAN_PRINTF_PUTC(string[i]);
if (options.left_justified)
for (int i = length; i < options.width; i++)
BAN_PRINTF_PUTC(' ');
}
}
else
{
BAN_PRINTF_PUTC(*format);
format++;
}
}
return written;
}