/*
String formatting library for C++
Copyright (c) 2012, Victor Zverovich
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
1. Redistributions of source code must retain the above copyright notice, this
list of conditions and the following disclaimer.
2. Redistributions in binary form must reproduce the above copyright notice,
this list of conditions and the following disclaimer in the documentation
and/or other materials provided with the distribution.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef FORMAT_H_
#define FORMAT_H_
#include <algorithm>
#include <cstddef>
#include <cstdio>
#include <cstring>
#include <sstream>
#include <stdexcept>
#include <string>
#include <vector>
namespace format {
2012-12-12 17:14:00 +00:00
namespace internal {
2012-12-11 20:23:52 +00:00
// A simple array for POD types with the first SIZE elements stored in
// the object itself. It supports a subset of std::vector's operations.
// Storage starts in the inline buffer data_ and is moved to a heap
// allocation by Grow() once more room is required.
template <typename T, std::size_t SIZE>
class Array {
 private:
  std::size_t size_;      // Number of elements currently in use.
  std::size_t capacity_;  // Number of elements ptr_ has room for.
  T *ptr_;                // Points either at data_ or at a heap block.
  T data_[SIZE];          // Inline storage used until the first Grow().

  // Reallocates the storage so that it can hold at least `size` elements.
  // The first size_ elements are preserved.
  void Grow(std::size_t size);

  // Do not implement!
  Array(const Array &);
  void operator=(const Array &);

 public:
  Array() : size_(0), capacity_(SIZE), ptr_(data_) {}
  ~Array() {
    // Only a heap block obtained in Grow() has to be released.
    if (ptr_ != data_) delete [] ptr_;
  }

  // Returns the size of this array.
  std::size_t size() const { return size_; }

  // Returns the capacity of this array.
  std::size_t capacity() const { return capacity_; }

  // Resizes the array. If T is a POD type new elements are not initialized.
  void resize(std::size_t new_size) {
    if (new_size > capacity_)
      Grow(new_size);
    size_ = new_size;
  }

  // Makes sure the array can hold at least `capacity` elements without
  // further reallocation. The size is not changed.
  void reserve(std::size_t capacity) {
    if (capacity > capacity_)
      Grow(capacity);
  }

  // Drops all elements. The storage is kept.
  void clear() { size_ = 0; }

  // Appends a single element, growing the storage when it is full.
  void push_back(const T &value) {
    if (size_ == capacity_)
      Grow(size_ + 1);
    ptr_[size_++] = value;
  }

  // Appends data to the end of the array.
  void append(const T *begin, const T *end);

  // Unchecked element access.
  T &operator[](std::size_t index) { return ptr_[index]; }
  const T &operator[](std::size_t index) const { return ptr_[index]; }
};

template <typename T, std::size_t SIZE>
void Array<T, SIZE>::Grow(std::size_t size) {
  // Grow by at least 50% so that repeated push_back calls do not
  // reallocate every time.
  std::size_t new_capacity = std::max(size, capacity_ + capacity_ / 2);
  // Allocate before touching any member: if new[] throws, the array is
  // left exactly as it was.
  T *p = new T[new_capacity];
  std::copy(ptr_, ptr_ + size_, p);
  if (ptr_ != data_)
    delete [] ptr_;
  ptr_ = p;
  capacity_ = new_capacity;
}

// Copies the range [begin, end) to the end of the array.
// `end` must not precede `begin`.
template <typename T, std::size_t SIZE>
void Array<T, SIZE>::append(const T *begin, const T *end) {
  std::size_t num_elements = static_cast<std::size_t>(end - begin);
  std::size_t new_size = size_ + num_elements;
  // The storage has to fit the existing elements plus the new ones, so the
  // requested capacity is the resulting size, not just the appended count.
  if (new_size > capacity_)
    Grow(new_size);
  std::copy(begin, end, ptr_ + size_);
  size_ = new_size;
}
2012-12-12 17:14:00 +00:00
class ArgInserter;
}
2013-01-04 15:04:35 +00:00
/**
\rst
A string reference. It can be constructed from a C string, ``std::string``
or as a result of a formatting operation. It is most useful as a parameter
type to allow passing different types of strings in a function, for example::
TempFormatter<> Format(StringRef format);
\endrst
*/
2012-12-25 21:25:14 +00:00
class StringRef {
 private:
  const char *data_;          // Referenced characters; not owned.
  mutable std::size_t size_;  // Cached length; 0 means "not measured yet".

 public:
  // Refers to the C string s. If size is left at 0 the length is measured
  // with std::strlen on the first call to size().
  StringRef(const char *s, std::size_t size = 0) : data_(s), size_(size) {}

  // Refers to the characters of an std::string.
  StringRef(const std::string &s) : data_(s.c_str()), size_(s.size()) {}

  // Copies the referenced characters into a new std::string.
  operator std::string() const { return std::string(data_, size()); }

  // Returns the pointer this reference was constructed with.
  const char *c_str() const { return data_; }

  // Returns the length, computing and caching it when it is still 0.
  std::size_t size() const {
    if (size_ != 0) return size_;
    size_ = std::strlen(data_);
    return size_;
  }
};
2012-12-11 18:27:13 +00:00
// Exception type of the formatting library. It adds nothing to
// std::runtime_error; the message passed to the constructor is available
// through what().
class FormatError : public std::runtime_error {
 public:
  explicit FormatError(const std::string &message)
  : std::runtime_error(message) {}
};
2012-12-22 22:05:56 +00:00
// Alignment choices stored in FormatSpec::align. The enumerators take
// consecutive values starting at 0 for ALIGN_DEFAULT.
enum Alignment {
  ALIGN_DEFAULT,
  ALIGN_LEFT,
  ALIGN_RIGHT,
  ALIGN_CENTER,
  ALIGN_NUMERIC
};
2012-12-21 04:10:55 +00:00
struct FormatSpec {
2012-12-22 22:05:56 +00:00
Alignment align;
2012-12-21 04:10:55 +00:00
unsigned flags;
unsigned width;
char type;
char fill;
2012-12-21 17:12:04 +00:00
2012-12-22 22:05:56 +00:00
FormatSpec() : align(ALIGN_DEFAULT), flags(0), width(0), type(0), fill(' ') {}
2012-12-21 04:10:55 +00:00
};
// Base class that owns the output buffer used by Formatter.
class BasicFormatter {
 protected:
  enum { INLINE_BUFFER_SIZE = 500 };

  // Output buffer; the first INLINE_BUFFER_SIZE characters live inside
  // the object itself.
  internal::Array<char, INLINE_BUFFER_SIZE> buffer_;

  // Extends the buffer by n characters and returns a pointer to the first
  // character of the newly added area.
  char *GrowBuffer(std::size_t n) {
    const std::size_t old_size = buffer_.size();
    buffer_.resize(old_size + n);
    return &buffer_[old_size];
  }

 public:
  // Declared here; the definition is not part of this header.
  void operator<<(int value);
};
/**
\rst
2013-01-03 16:57:34 +00:00
The :cpp:class:`format::Formatter` class provides string formatting
functionality similar to Python's `str.format
<http://docs.python.org/3/library/stdtypes.html#str.format>`__.
The output is stored in a memory buffer that grows dynamically.
2013-01-03 16:57:34 +00:00
**Example**::
Formatter out;
out("Current point:\n");
out("(-{:+f}, {:+f})") << 3.14 << -3.14;
This will populate the buffer of the ``out`` object with the following
output:
.. code-block:: none
Current point:
(-3.140000, +3.140000)
The buffer can be accessed using :meth:`data` or :meth:`c_str`.
\endrst
*/
class Formatter : public BasicFormatter {
private:
2012-12-07 16:31:09 +00:00
enum Type {
// Numeric types should go first.
2012-12-09 22:13:23 +00:00
INT, UINT, LONG, ULONG, DOUBLE, LONG_DOUBLE,
LAST_NUMERIC_TYPE = LONG_DOUBLE,
CHAR, STRING, WSTRING, POINTER, CUSTOM
2012-12-07 16:31:09 +00:00
};
2012-12-21 04:10:55 +00:00
typedef void (Formatter::*FormatFunc)(
const void *arg, const FormatSpec &spec);
// A format argument.
2012-12-11 18:27:13 +00:00
class Arg {
private:
// This method is private to disallow formatting of arbitrary pointers.
// If you want to output a pointer cast it to const void*. Do not implement!
template <typename T>
Arg(const T *value);
// This method is private to disallow formatting of arbitrary pointers.
// If you want to output a pointer cast it to void*. Do not implement!
template <typename T>
Arg(T *value);
// This method is private to disallow formatting of wide characters.
// If you want to output a wide character cast it to integer type.
// Do not implement!
Arg(wchar_t value);
public:
2012-12-07 16:31:09 +00:00
Type type;
union {
int int_value;
unsigned uint_value;
double double_value;
long long_value;
unsigned long ulong_value;
long double long_double_value;
const void *pointer_value;
struct {
2012-12-12 05:47:05 +00:00
const char *value;
2012-12-09 17:03:47 +00:00
std::size_t size;
2012-12-12 05:47:05 +00:00
} string;
2012-12-09 17:03:47 +00:00
struct {
2012-12-12 05:47:05 +00:00
const void *value;
FormatFunc format;
2012-12-12 05:47:05 +00:00
} custom;
2012-12-07 16:31:09 +00:00
};
2012-12-11 20:23:52 +00:00
mutable Formatter *formatter;
2012-12-11 18:27:13 +00:00
2012-12-12 05:47:05 +00:00
Arg(int value) : type(INT), int_value(value), formatter(0) {}
Arg(unsigned value) : type(UINT), uint_value(value), formatter(0) {}
Arg(long value) : type(LONG), long_value(value), formatter(0) {}
Arg(unsigned long value) : type(ULONG), ulong_value(value), formatter(0) {}
Arg(double value) : type(DOUBLE), double_value(value), formatter(0) {}
Arg(long double value)
: type(LONG_DOUBLE), long_double_value(value), formatter(0) {}
Arg(char value) : type(CHAR), int_value(value), formatter(0) {}
Arg(const char *value) : type(STRING), formatter(0) {
string.value = value;
string.size = 0;
}
Arg(char *value) : type(STRING), formatter(0) {
string.value = value;
string.size = 0;
}
Arg(const void *value)
: type(POINTER), pointer_value(value), formatter(0) {}
Arg(void *value) : type(POINTER), pointer_value(value), formatter(0) {}
Arg(const std::string &value) : type(STRING), formatter(0) {
string.value = value.c_str();
string.size = value.size();
}
2012-12-11 18:27:13 +00:00
template <typename T>
2012-12-12 05:47:05 +00:00
Arg(const T &value) : type(CUSTOM), formatter(0) {
custom.value = &value;
custom.format = &Formatter::FormatCustomArg<T>;
}
2012-12-11 18:27:13 +00:00
~Arg() {
// Format is called here to make sure that a referred object is
// still alive, for example:
2012-12-11 18:27:13 +00:00
//
// Print("{0}") << std::string("test");
//
// Here an Arg object refers to a temporary std::string which is
// destroyed at the end of the statement. Since the string object is
// constructed before the Arg object, it will be destroyed after,
// so it will be alive in the Arg's destructor where Format is called.
2012-12-11 18:27:13 +00:00
// Note that the string object will not necessarily be alive when
// the destructor of ArgInserter is called.
formatter->CompleteFormatting();
2012-12-11 18:27:13 +00:00
}
2012-12-07 16:31:09 +00:00
};
2012-12-11 04:37:35 +00:00
enum { NUM_INLINE_ARGS = 10 };
2012-12-12 17:14:00 +00:00
internal::Array<const Arg*, NUM_INLINE_ARGS> args_; // Format arguments.
2012-12-07 16:31:09 +00:00
const char *format_; // Format string.
2012-12-12 23:21:11 +00:00
int num_open_braces_;
2012-12-27 14:56:55 +00:00
int next_arg_index_;
2012-12-07 16:31:09 +00:00
2012-12-12 17:14:00 +00:00
friend class internal::ArgInserter;
friend class ArgFormatter;
2012-12-07 16:31:09 +00:00
void Add(const Arg &arg) {
2012-12-11 18:27:13 +00:00
args_.push_back(&arg);
2012-12-07 16:31:09 +00:00
}
2012-12-25 21:25:14 +00:00
void ReportError(const char *s, StringRef message) const;
2012-12-12 23:21:11 +00:00
char *PrepareFilledBuffer(unsigned size, const FormatSpec &spec, char sign);
2012-12-22 22:05:56 +00:00
2012-12-10 19:08:16 +00:00
// Formats an integer.
2012-12-07 16:31:09 +00:00
template <typename T>
void FormatInt(T value, const FormatSpec &spec);
2012-12-10 19:08:16 +00:00
2012-12-10 23:04:55 +00:00
// Formats a floating point number (double or long double).
2012-12-10 19:08:16 +00:00
template <typename T>
2012-12-21 04:10:55 +00:00
void FormatDouble(T value, const FormatSpec &spec, int precision);
2012-12-07 16:31:09 +00:00
2012-12-28 16:27:54 +00:00
char *FormatString(const char *s, std::size_t size, const FormatSpec &spec);
2012-12-23 01:53:13 +00:00
2012-12-09 17:03:47 +00:00
// Formats an argument of a custom type, such as a user-defined class.
template <typename T>
2012-12-21 04:10:55 +00:00
void FormatCustomArg(const void *arg, const FormatSpec &spec);
2012-12-12 23:21:11 +00:00
unsigned ParseUInt(const char *&s) const;
// Parses argument index and returns an argument with this index.
2012-12-27 14:56:55 +00:00
const Arg &ParseArgIndex(const char *&s);
2012-12-12 23:21:11 +00:00
2012-12-25 21:45:12 +00:00
void CheckSign(const char *&s, const Arg &arg);
2012-12-11 20:23:52 +00:00
void DoFormat();
void CompleteFormatting() {
2012-12-11 20:23:52 +00:00
if (!format_) return;
DoFormat();
}
2012-12-07 16:31:09 +00:00
public:
2013-01-04 15:04:35 +00:00
/**
\rst
Constructs a formatter with an empty output buffer.
\endrst
*/
Formatter() : format_(0) { buffer_[0] = 0; }
2012-12-07 16:31:09 +00:00
2013-01-04 15:04:35 +00:00
/**
\rst
Formats a string appending the output to the internal buffer.
Arguments are accepted through the returned ``ArgInserter`` object
using inserter operator ``<<``.
\endrst
*/
internal::ArgInserter operator()(StringRef format);
2012-12-07 16:31:09 +00:00
2013-01-04 15:04:35 +00:00
/**
\rst
Returns the number of characters written to the output buffer.
\endrst
*/
2012-12-09 17:03:47 +00:00
std::size_t size() const { return buffer_.size(); }
2013-01-04 15:04:35 +00:00
/**
\rst
Returns a pointer to the output buffer content. No terminating null
character is appended.
\endrst
*/
const char *data() const { return &buffer_[0]; }
2013-01-04 15:04:35 +00:00
/**
\rst
Returns a pointer to the output buffer content with terminating null
character appended.
\endrst
*/
const char *c_str() const { return &buffer_[0]; }
2013-01-04 15:04:35 +00:00
/**
\rst
Returns the content of the output buffer as an ``std::string``.
\endrst
*/
std::string str() const { return std::string(&buffer_[0], buffer_.size()); }
2012-12-07 16:31:09 +00:00
};
2012-12-12 17:14:00 +00:00
namespace internal {
// This is a transient object that normally exists only as a temporary
// returned by one of the formatting functions. It stores a reference
// to a formatter and provides operator<< that feeds arguments to the
// formatter.
class ArgInserter {
private:
mutable Formatter *formatter_;
friend class format::Formatter;
2012-12-18 23:39:42 +00:00
friend class format::StringRef;
2012-12-12 17:14:00 +00:00
// Do not implement.
void operator=(const ArgInserter& other);
2012-12-12 17:14:00 +00:00
protected:
explicit ArgInserter(Formatter *f = 0) : formatter_(f) {}
void Init(Formatter &f, const char *format) {
const ArgInserter &other = f(format);
formatter_ = other.formatter_;
2012-12-12 17:14:00 +00:00
other.formatter_ = 0;
}
ArgInserter(const ArgInserter& other)
: formatter_(other.formatter_) {
2012-12-12 17:14:00 +00:00
other.formatter_ = 0;
}
const Formatter *Format() const {
Formatter *f = formatter_;
if (f) {
formatter_ = 0;
f->CompleteFormatting();
2012-12-12 17:14:00 +00:00
}
return f;
}
Formatter *formatter() const { return formatter_; }
const char *format() const { return formatter_->format_; }
void ResetFormatter() const { formatter_ = 0; }
2012-12-12 17:14:00 +00:00
struct Proxy {
Formatter *formatter;
explicit Proxy(Formatter *f) : formatter(f) {}
2012-12-18 23:39:42 +00:00
Formatter *Format() {
formatter->CompleteFormatting();
return formatter;
}
};
2012-12-12 17:14:00 +00:00
public:
~ArgInserter() {
if (formatter_)
formatter_->CompleteFormatting();
2012-12-12 17:14:00 +00:00
}
// Feeds an argument to a formatter.
ArgInserter &operator<<(const Formatter::Arg &arg) {
arg.formatter = formatter_;
formatter_->Add(arg);
return *this;
}
operator Proxy() {
Formatter *f = formatter_;
formatter_ = 0;
return Proxy(f);
}
2012-12-19 18:47:00 +00:00
operator StringRef() {
const Formatter *f = Format();
return StringRef(f->c_str(), f->size());
}
// Performs formatting and returns a std::string with the output.
friend std::string str(Proxy p) {
2012-12-18 23:39:42 +00:00
return p.Format()->str();
}
2012-12-18 05:13:54 +00:00
2012-12-12 17:14:00 +00:00
// Performs formatting and returns a C string with the output.
friend const char *c_str(Proxy p) {
2012-12-18 23:39:42 +00:00
return p.Format()->c_str();
2012-12-12 17:14:00 +00:00
}
};
std::string str(ArgInserter::Proxy p);
2012-12-18 23:39:42 +00:00
const char *c_str(ArgInserter::Proxy p);
2012-12-12 17:14:00 +00:00
}
// Make the str and c_str helpers declared in namespace internal available
// directly in namespace format.
using format::internal::str;
using format::internal::c_str;
// ArgFormatter provides access to the format buffer within custom
// Format functions. It is not desirable to pass Formatter to these
// functions because Formatter::operator() is not reentrant and
// therefore can't be used for argument formatting.
class ArgFormatter {
private:
Formatter &formatter_;
public:
explicit ArgFormatter(Formatter &f) : formatter_(f) {}
2012-12-21 04:10:55 +00:00
void Write(const std::string &s, const FormatSpec &spec) {
2012-12-23 01:53:13 +00:00
formatter_.FormatString(s.data(), s.size(), spec);
}
};
// The default formatting function.
2012-12-09 17:03:47 +00:00
template <typename T>
2012-12-21 04:10:55 +00:00
void Format(ArgFormatter &af, const FormatSpec &spec, const T &value) {
2012-12-09 17:03:47 +00:00
std::ostringstream os;
os << value;
2012-12-21 04:10:55 +00:00
af.Write(os.str(), spec);
}
template <typename T>
2012-12-21 04:10:55 +00:00
void Formatter::FormatCustomArg(const void *arg, const FormatSpec &spec) {
ArgFormatter af(*this);
2012-12-21 04:10:55 +00:00
Format(af, spec, *static_cast<const T*>(arg));
2012-12-09 17:03:47 +00:00
}
// Starts a new formatting operation: remembers the format string, discards
// arguments left from a previous call and returns an inserter attached to
// this formatter. Only the pointer is stored, so the characters that
// `format` refers to must stay valid until formatting is completed.
inline internal::ArgInserter Formatter::operator()(StringRef format) {
  internal::ArgInserter formatter(this);
  format_ = format.c_str();
  args_.clear();
  return formatter;
}
2013-01-03 16:57:34 +00:00
// The do-nothing formatting action; it is the default Action of
// TempFormatter.
struct NoAction {
  // Accepts the completed formatter and ignores it.
  void operator()(const Formatter &) const {
  }
};
// A formatter with an action performed when formatting is complete.
// Objects of this class normally exist only as temporaries returned
// by one of the formatting functions, thus the name.
2013-01-03 16:57:34 +00:00
template <typename Action = NoAction>
class TempFormatter : public internal::ArgInserter {
2012-12-07 16:31:09 +00:00
private:
Formatter formatter_;
Action action_;
2012-12-07 16:31:09 +00:00
// Forbid copying other than from a temporary. Do not implement.
TempFormatter(TempFormatter &);
2012-12-07 16:31:09 +00:00
// Do not implement.
TempFormatter& operator=(const TempFormatter &);
struct Proxy {
const char *format;
Action action;
Proxy(const char *fmt, Action a) : format(fmt), action(a) {}
};
2012-12-07 16:31:09 +00:00
public:
// Creates an active formatter with a format string and an action.
// Action should be an unary function object that takes a const
// reference to Formatter as an argument. See Ignore and Write
// for examples of action classes.
2013-01-03 16:57:34 +00:00
explicit TempFormatter(StringRef format, Action a = Action())
: action_(a) {
2013-01-03 16:57:34 +00:00
Init(formatter_, format.c_str());
2012-12-07 16:31:09 +00:00
}
TempFormatter(const Proxy &p)
: ArgInserter(0), action_(p.action) {
Init(formatter_, p.format);
2012-12-12 04:49:01 +00:00
}
~TempFormatter() {
2012-12-12 04:49:01 +00:00
if (formatter())
action_(*Format());
2012-12-07 16:31:09 +00:00
}
operator Proxy() {
const char *fmt = format();
ResetFormatter();
return Proxy(fmt, action_);
}
2012-12-07 16:31:09 +00:00
};
2013-01-03 16:57:34 +00:00
/**
\rst
Formats a string. Returns a temporary formatter object that accepts
arguments via operator ``<<``. *format* is a format string that contains
literal text and replacement fields surrounded by braces ``{}``.
The formatter object replaces the fields with formatted arguments
and stores the output in a memory buffer. The content of the buffer can
be converted to ``std::string`` with :meth:`str` or accessed as a C string
with :meth:`c_str`.

**Example**::

   std::string message = str(Format("Elapsed time: {0:.2f} seconds") << 1.23);

See also `Format String Syntax`_.
\endrst
*/
inline TempFormatter<> Format(StringRef format) {
// The result has to be returned as a temporary: TempFormatter forbids
// copying from an lvalue (TempFormatter(TempFormatter &) is private).
return TempFormatter<>(format);
}
2012-12-07 16:31:09 +00:00
// A formatting action that writes formatted output to stdout.
struct Write {
  // Writes f.size() bytes starting at f.data() to stdout. The return
  // value of std::fwrite is not checked.
  void operator()(const Formatter &f) const {
    std::fwrite(f.data(), 1, f.size(), stdout);
  }
};
// Formats a string and prints it to stdout.
// Example:
// Print("Elapsed time: {0:.2f} seconds") << 1.23;
2013-01-03 16:57:34 +00:00
inline TempFormatter<Write> Print(StringRef format) {
return TempFormatter<Write>(format);
}
2012-12-07 16:31:09 +00:00
}
namespace fmt = format;
#endif // FORMAT_H_