diff --git a/src/runtime/d3d12compute.cpp b/src/runtime/d3d12compute.cpp index adae690800cc..f4f85180a56e 100644 --- a/src/runtime/d3d12compute.cpp +++ b/src/runtime/d3d12compute.cpp @@ -98,11 +98,11 @@ static constexpr uint64_t trace_buf_size = 4096; WEAK char trace_buf[trace_buf_size] = {}; WEAK int trace_indent = 0; -struct trace : public BasicPrinter { +struct trace : public PrinterBase { ScopedMutexLock lock; explicit trace(void *user_context = nullptr) - : BasicPrinter(user_context, trace_buf), + : PrinterBase(user_context, trace_buf, trace_buf_size), lock(&trace_lock) { for (int i = 0; i < trace_indent; i++) { *this << " "; diff --git a/src/runtime/posix_error_handler.cpp b/src/runtime/posix_error_handler.cpp index d40790fad15d..27bcc1f5b28f 100644 --- a/src/runtime/posix_error_handler.cpp +++ b/src/runtime/posix_error_handler.cpp @@ -7,18 +7,16 @@ extern "C" { extern void abort(); WEAK void halide_default_error(void *user_context, const char *msg) { - char buf[4096]; - char *dst = halide_string_to_string(buf, buf + 4094, "Error: "); - dst = halide_string_to_string(dst, dst + 4094, msg); - // We still have one character free. Add a newline if there - // isn't one already. 
- if (dst[-1] != '\n') { - dst[0] = '\n'; - dst[1] = 0; - dst += 1; + // Can't use StackBasicPrinter here because it limits size to 256 + constexpr int buf_size = 4096; + char buf[buf_size]; + PrinterBase dst(user_context, buf, buf_size); + dst << "Error: " << msg; + const char *d = dst.str(); + if (d && *d && d[strlen(d) - 1] != '\n') { + dst << "\n"; } - (void)halide_msan_annotate_memory_is_initialized(user_context, buf, dst - buf + 1); - halide_print(user_context, buf); + halide_print(user_context, dst.str()); abort(); } } diff --git a/src/runtime/printer.h b/src/runtime/printer.h index be3620020824..6a379561dbe5 100644 --- a/src/runtime/printer.h +++ b/src/runtime/printer.h @@ -41,179 +41,174 @@ constexpr uint64_t default_printer_buffer_length = 1024; // Then remember the print only happens when the debug object leaves // scope, which may print at a confusing time. -namespace { -template -class Printer { - char *buf, *dst, *end; - void *user_context; - bool own_mem; +class PrinterBase { +protected: + char *dst; + char *const end; + char *const start; + void *const user_context; + + NEVER_INLINE void allocation_error() const { + halide_error(user_context, "Printer buffer allocation failed.\n"); + } public: - explicit Printer(void *ctx, char *mem = nullptr) - : user_context(ctx), own_mem(mem == nullptr) { - if (mem != nullptr) { - buf = mem; - } else { - buf = (char *)malloc(buffer_length); + // This class will stream text into the range [start, start + size - 1]. + // It does *not* assume any ownership of the memory; it assumes + // the memory will remain valid for its lifespan, and doesn't + // attempt to free any allocations. It also doesn't do any sanity + // checking of the pointers, so if you pass in a null or bogus value, + // it will attempt to use it. + NEVER_INLINE PrinterBase(void *user_context_, char *start_, uint64_t size_) + : dst(start_), + // (If start is null, set end = start to ensure no writes are done) + end(start_ ? 
start_ + size_ - 1 : start_), + start(start_), + user_context(user_context_) { + if (end > start) { + // null-terminate the final byte to ensure string isn't $ENDLESS + *end = 0; } + } + + NEVER_INLINE const char *str() { + (void)halide_msan_annotate_memory_is_initialized(user_context, start, dst - start + 1); + return start; + } + + uint64_t size() const { + halide_debug_assert(user_context, dst >= start); + return (uint64_t)(dst - start); + } + + uint64_t capacity() const { + halide_debug_assert(user_context, end >= start); + return (uint64_t)(end - start); + } - dst = buf; + NEVER_INLINE void clear() { + dst = start; if (dst) { - end = buf + (buffer_length - 1); - *end = 0; - } else { - // Pointers equal ensures no writes to buffer via formatting code - end = dst; + dst[0] = 0; } + } -#if HALIDE_RUNTIME_PRINTER_LOG_THREADID - uint64_t tid; - pthread_threadid_np(0, &tid); - *this << "(TID:" << tid << ")"; -#endif + NEVER_INLINE void erase(int n) { + if (dst) { + dst -= n; + if (dst < start) { + dst = start; + } + dst[0] = 0; + } } - // Not movable, not copyable - Printer(const Printer &copy) = delete; - Printer &operator=(const Printer &) = delete; - Printer(Printer &&) = delete; - Printer &operator=(Printer &&) = delete; + struct Float16Bits { + uint16_t bits; + }; - Printer &operator<<(const char *arg) { + // These are NEVER_INLINE because Clang will aggressively inline + // all of them, but the code size of calling out-of-line here is slightly + // smaller, and we ~always prefer smaller code size when using Printer + // in the runtime (it's a modest but nonzero difference). 
+ NEVER_INLINE PrinterBase &operator<<(const char *arg) { dst = halide_string_to_string(dst, end, arg); return *this; } - Printer &operator<<(int64_t arg) { + NEVER_INLINE PrinterBase &operator<<(int64_t arg) { dst = halide_int64_to_string(dst, end, arg, 1); return *this; } - Printer &operator<<(int32_t arg) { + NEVER_INLINE PrinterBase &operator<<(int32_t arg) { dst = halide_int64_to_string(dst, end, arg, 1); return *this; } - Printer &operator<<(uint64_t arg) { + NEVER_INLINE PrinterBase &operator<<(uint64_t arg) { dst = halide_uint64_to_string(dst, end, arg, 1); return *this; } - Printer &operator<<(uint32_t arg) { + NEVER_INLINE PrinterBase &operator<<(uint32_t arg) { dst = halide_uint64_to_string(dst, end, arg, 1); return *this; } - Printer &operator<<(double arg) { + NEVER_INLINE PrinterBase &operator<<(double arg) { dst = halide_double_to_string(dst, end, arg, 1); return *this; } - Printer &operator<<(float arg) { + NEVER_INLINE PrinterBase &operator<<(float arg) { dst = halide_double_to_string(dst, end, arg, 0); return *this; } - Printer &operator<<(const void *arg) { - dst = halide_pointer_to_string(dst, end, arg); + NEVER_INLINE PrinterBase &operator<<(Float16Bits arg) { + double value = halide_float16_bits_to_double(arg.bits); + dst = halide_double_to_string(dst, end, value, 1); return *this; } - Printer &write_float16_from_bits(const uint16_t arg) { - double value = halide_float16_bits_to_double(arg); - dst = halide_double_to_string(dst, end, value, 1); + NEVER_INLINE PrinterBase &operator<<(const void *arg) { + dst = halide_pointer_to_string(dst, end, arg); return *this; } - Printer &operator<<(const halide_type_t &t) { + NEVER_INLINE PrinterBase &operator<<(const halide_type_t &t) { dst = halide_type_to_string(dst, end, &t); return *this; } - Printer &operator<<(const halide_buffer_t &buf) { + NEVER_INLINE PrinterBase &operator<<(const halide_buffer_t &buf) { dst = halide_buffer_to_string(dst, end, &buf); return *this; } - template - void append(const 
T &value) { - *this << value; - } - - template - void append(const First &first, const Second &second, const Rest &...rest) { - append(first); - append(second, rest...); - } - - // Use it like a stringstream. - const char *str() { - if (buf) { - if (printer_type == StringStreamPrinterType) { - msan_annotate_is_initialized(); - } - return buf; - } else { - return allocation_error(); - } - } - - // Clear it. Useful for reusing a stringstream. - void clear() { - dst = buf; - if (dst) { - dst[0] = 0; - } + template + void append(const Args &...args) { + ((*this << args), ...); } - // Returns the number of characters in the buffer - uint64_t size() const { - return (uint64_t)(dst - buf); - } + // Not movable, not copyable + PrinterBase(const PrinterBase &copy) = delete; + PrinterBase &operator=(const PrinterBase &) = delete; + PrinterBase(PrinterBase &&) = delete; + PrinterBase &operator=(PrinterBase &&) = delete; +}; - uint64_t capacity() const { - return buffer_length; - } +namespace { - // Delete the last N characters - void erase(int n) { - if (dst) { - dst -= n; - if (dst < buf) { - dst = buf; - } - dst[0] = 0; +template +class HeapPrinter : public PrinterBase { +public: + NEVER_INLINE explicit HeapPrinter(void *user_context) + : PrinterBase(user_context, (char *)malloc(buffer_length), buffer_length) { + if (!start) { + allocation_error(); } - } - const char *allocation_error() { - return "Printer buffer allocation failed.\n"; - } - - void msan_annotate_is_initialized() { - (void)halide_msan_annotate_memory_is_initialized(user_context, buf, dst - buf + 1); +#if HALIDE_RUNTIME_PRINTER_LOG_THREADID + uint64_t tid; + pthread_threadid_np(0, &tid); + *this << "(TID:" << tid << ")"; +#endif } - ~Printer() { - if (!buf) { - halide_error(user_context, allocation_error()); + NEVER_INLINE ~HeapPrinter() { + if (printer_type == ErrorPrinterType) { + halide_error(user_context, str()); + } else if (printer_type == BasicPrinterType) { + halide_print(user_context, str()); } else { - 
msan_annotate_is_initialized(); - if (printer_type == ErrorPrinterType) { - halide_error(user_context, buf); - } else if (printer_type == BasicPrinterType) { - halide_print(user_context, buf); - } else { - // It's a stringstream. Do nothing. - } + // It's a stringstream. Do nothing. } - if (own_mem) { - free(buf); - } + free(start); } }; - // A class that supports << with all the same types as Printer, but // does nothing and should compile to a no-op. class SinkPrinter { @@ -227,13 +222,13 @@ ALWAYS_INLINE SinkPrinter operator<<(const SinkPrinter &s, T) { } template -using BasicPrinter = Printer; +using BasicPrinter = HeapPrinter; template -using ErrorPrinter = Printer; +using ErrorPrinter = HeapPrinter; template -using StringStreamPrinter = Printer; +using StringStreamPrinter = HeapPrinter; using print = BasicPrinter<>; using error = ErrorPrinter<>; @@ -244,17 +239,16 @@ using debug = BasicPrinter<>; #else using debug = SinkPrinter; #endif -} // namespace // A Printer that automatically reserves stack space for the printer buffer, rather than malloc. // Note that this requires an explicit buffer_length, and it (generally) should be <= 256. 
template -class StackPrinter : public Printer { +class StackPrinter : public PrinterBase { char scratch[buffer_length]; public: - explicit StackPrinter(void *ctx) - : Printer(ctx, scratch) { + explicit StackPrinter(void *user_context) + : PrinterBase(user_context, scratch, buffer_length) { static_assert(buffer_length <= 256, "StackPrinter is meant only for small buffer sizes; you are probably making a mistake."); } }; @@ -268,6 +262,8 @@ using StackErrorPrinter = StackPrinter; template using StackStringStreamPrinter = StackPrinter; +} // namespace + } // namespace Internal } // namespace Runtime } // namespace Halide diff --git a/src/runtime/runtime_internal.h b/src/runtime/runtime_internal.h index 57dfe0b1087a..027ae5c4f500 100644 --- a/src/runtime/runtime_internal.h +++ b/src/runtime/runtime_internal.h @@ -51,6 +51,8 @@ typedef ptrdiff_t ssize_t; #define WEAK __attribute__((weak)) +#define NEVER_INLINE __attribute__((noinline)) + // Note that ALWAYS_INLINE should *always* also be `inline`. #define ALWAYS_INLINE inline __attribute__((always_inline)) diff --git a/src/runtime/to_string.cpp b/src/runtime/to_string.cpp index 71d537609e83..1200ca5c07d9 100644 --- a/src/runtime/to_string.cpp +++ b/src/runtime/to_string.cpp @@ -1,8 +1,11 @@ #include "HalideRuntime.h" +#include "runtime_internal.h" extern "C" { WEAK char *halide_string_to_string(char *dst, char *end, const char *arg) { + halide_debug_assert(nullptr, dst <= end); + if (dst >= end) { return dst; } @@ -25,6 +28,8 @@ WEAK char *halide_string_to_string(char *dst, char *end, const char *arg) { } WEAK char *halide_uint64_to_string(char *dst, char *end, uint64_t arg, int min_digits) { + halide_debug_assert(nullptr, dst <= end); + // 32 is more than enough chars to contain any 64-bit int. 
char buf[32]; buf[31] = 0; @@ -43,6 +48,8 @@ WEAK char *halide_uint64_to_string(char *dst, char *end, uint64_t arg, int min_d } WEAK char *halide_int64_to_string(char *dst, char *end, int64_t arg, int min_digits) { + halide_debug_assert(nullptr, dst <= end); + if (arg < 0 && dst < end) { *dst++ = '-'; arg = -arg; @@ -51,6 +58,8 @@ WEAK char *halide_int64_to_string(char *dst, char *end, int64_t arg, int min_dig } WEAK char *halide_double_to_string(char *dst, char *end, double arg, int scientific) { + halide_debug_assert(nullptr, dst <= end); + uint64_t bits = 0; memcpy(&bits, &arg, sizeof(double)); @@ -234,6 +243,8 @@ WEAK char *halide_double_to_string(char *dst, char *end, double arg, int scienti } WEAK char *halide_pointer_to_string(char *dst, char *end, const void *arg) { + halide_debug_assert(nullptr, dst <= end); + const char *hex_digits = "0123456789abcdef"; char buf[20] = {0}; char *buf_ptr = buf + 18; @@ -251,6 +262,8 @@ WEAK char *halide_pointer_to_string(char *dst, char *end, const void *arg) { } WEAK char *halide_type_to_string(char *dst, char *end, const halide_type_t *t) { + halide_debug_assert(nullptr, dst <= end); + const char *code_name = nullptr; switch (t->code) { case halide_type_int: @@ -282,6 +295,8 @@ WEAK char *halide_type_to_string(char *dst, char *end, const halide_type_t *t) { } WEAK char *halide_buffer_to_string(char *dst, char *end, const halide_buffer_t *buf) { + halide_debug_assert(nullptr, dst <= end); + if (buf == nullptr) { return halide_string_to_string(dst, end, "nullptr"); } diff --git a/src/runtime/tracing.cpp b/src/runtime/tracing.cpp index 8e8769e2ad12..93a12c7d90a4 100644 --- a/src/runtime/tracing.cpp +++ b/src/runtime/tracing.cpp @@ -308,7 +308,7 @@ WEAK int32_t halide_default_trace(void *user_context, const halide_trace_event_t if (print_bits == 32) { ss << ((float *)(e->value))[i]; } else if (print_bits == 16) { - ss.write_float16_from_bits(((uint16_t *)(e->value))[i]); + ss << PrinterBase::Float16Bits{((uint16_t 
*)(e->value))[i]}; } else { ss << ((double *)(e->value))[i]; }