X-Git-Url: http://plrg.eecs.uci.edu/git/?p=folly.git;a=blobdiff_plain;f=folly%2FString.h;h=c9982f356d8cd26ee30ede7534db150d1397008e;hp=563f5313ecc04a63c4fb739763a819a93026c1c6;hb=43d3a315bbd54cb187021897b566ffb53290a44b;hpb=db66e2f4b93dee8c8834dede216e068a3a3e40af diff --git a/folly/String.h b/folly/String.h index 563f5313..c9982f35 100644 --- a/folly/String.h +++ b/folly/String.h @@ -1,5 +1,5 @@ /* - * Copyright 2014 Facebook, Inc. + * Copyright 2016 Facebook, Inc. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. @@ -14,12 +14,15 @@ * limitations under the License. */ -#ifndef FOLLY_BASE_STRING_H_ -#define FOLLY_BASE_STRING_H_ +#pragma once +#define FOLLY_STRING_H_ #include +#include #include +#include #include +#include #ifdef FOLLY_HAVE_DEPRECATED_ASSOC #ifdef _GLIBCXX_SYMVER @@ -32,7 +35,7 @@ #include #include -#include +#include #include #include #include @@ -186,6 +189,16 @@ std::string& stringAppendf(std::string* output, FOLLY_PRINTF_FORMAT const char* format, ...) FOLLY_PRINTF_FORMAT_ATTR(2, 3); +/** + * Similar to stringPrintf, but accepts a va_list argument. + * + * As with vsnprintf() itself, the value of ap is undefined after the call. + * These functions do not call va_end() on ap. + */ +std::string stringVPrintf(const char* format, va_list ap); +void stringVPrintf(std::string* out, const char* format, va_list ap); +std::string& stringVAppendf(std::string* out, const char* format, va_list ap); + /** * Backslashify a string, that is, replace non-printable characters * with C-style (but NOT C compliant) "\xHH" encoding. If hex_style @@ -247,6 +260,21 @@ template bool hexlify(const InputString& input, OutputString& output, bool append=false); +template +OutputString hexlify(ByteRange input) { + OutputString output; + if (!hexlify(input, output)) { + // hexlify() currently always returns true, so this can't really happen + throw std::runtime_error("hexlify failed"); + } + return output; +} + +template +OutputString hexlify(StringPiece input) { + return hexlify(ByteRange{input}); +} + /** * Same functionality as Python's binascii.unhexlify. Returns true * on successful conversion. @@ -254,6 +282,17 @@ bool hexlify(const InputString& input, OutputString& output, template bool unhexlify(const InputString& input, OutputString& output); +template +OutputString unhexlify(StringPiece input) { + OutputString output; + if (!unhexlify(input, output)) { + // unhexlify() fails if the input has non-hexidecimal characters, + // or if it doesn't consist of a whole number of bytes + throw std::domain_error("unhexlify() called with non-hex input"); + } + return output; +} + /* * A pretty-printer for numbers that appends suffixes of units of the * given type. It prints 4 sig-figs of value with the most @@ -348,23 +387,6 @@ std::string hexDump(const void* ptr, size_t size); */ fbstring errnoStr(int err); -/** - * Debug string for an exception: include type and what(). - */ -inline fbstring exceptionStr(const std::exception& e) { - return folly::to(demangle(typeid(e)), ": ", e.what()); -} - -inline fbstring exceptionStr(std::exception_ptr ep) { - try { - std::rethrow_exception(ep); - } catch (const std::exception& e) { - return exceptionStr(e); - } catch (...) { - return ""; - } -} - /* * Split a string into a list of tokens by delimiter. * @@ -398,26 +420,28 @@ template void split(const Delim& delimiter, const String& input, std::vector& out, - bool ignoreEmpty = false); + const bool ignoreEmpty = false); template void split(const Delim& delimiter, const String& input, folly::fbvector& out, - bool ignoreEmpty = false); + const bool ignoreEmpty = false); template void splitTo(const Delim& delimiter, const String& input, OutputIterator out, - bool ignoreEmpty = false); + const bool ignoreEmpty = false); /* * Split a string into a fixed number of string pieces and/or numeric types - * by delimiter. Any numeric type that folly::to<> can convert to from a - * string piece is supported as a target. Returns 'true' if the fields were - * all successfully populated. + * by delimiter. Conversions are supported for any type which folly:to<> can + * target, including all overloads of parseTo(). Returns 'true' if the fields + * were all successfully populated. Returns 'false' if there were too few + * fields in the input, or too many fields if exact=true. Casting exceptions + * will not be caught. * * Examples: * @@ -445,20 +469,58 @@ void splitTo(const Delim& delimiter, * Note that this will likely not work if the last field's target is of numeric * type, in which case folly::to<> will throw an exception. */ +template +struct IsSomeVector { + enum { value = false }; +}; + +template +struct IsSomeVector, void> { + enum { value = true }; +}; + +template +struct IsSomeVector, void> { + enum { value = true }; +}; + +template +struct IsConvertible { + enum { value = false }; +}; + template -using IsSplitTargetType = std::integral_constant::value || - std::is_same::value>; - -template -typename std::enable_if::value, bool>::type -split(const Delim& delimiter, - StringPiece input, - OutputType& outHead, - OutputTypes&... outTail); +struct IsConvertible< + T, + decltype(static_cast( + parseTo(std::declval(), std::declval())))> { + enum { value = true }; +}; + +template +struct AllConvertible; + +template +struct AllConvertible { + enum { value = IsConvertible::value && AllConvertible::value }; +}; + +template <> +struct AllConvertible<> { + enum { value = true }; +}; + +static_assert(AllConvertible::value, ""); +static_assert(AllConvertible::value, ""); +static_assert(AllConvertible::value, ""); +static_assert(AllConvertible::value, ""); +static_assert(!AllConvertible>::value, ""); + +template +typename std::enable_if< + AllConvertible::value && sizeof...(OutputTypes) >= 1, + bool>::type +split(const Delim& delimiter, StringPiece input, OutputTypes&... outputs); /* * Join list of tokens. @@ -503,11 +565,56 @@ std::string join(const Delim& delimiter, return output; } +template ::iterator_category, + std::random_access_iterator_tag>::value>::type* = nullptr> +std::string join(const Delim& delimiter, Iterator begin, Iterator end) { + std::string output; + join(delimiter, begin, end, output); + return output; +} + +/** + * Returns a subpiece with all whitespace removed from the front of @sp. + * Whitespace means any of [' ', '\n', '\r', '\t']. + */ +StringPiece ltrimWhitespace(StringPiece sp); + +/** + * Returns a subpiece with all whitespace removed from the back of @sp. + * Whitespace means any of [' ', '\n', '\r', '\t']. + */ +StringPiece rtrimWhitespace(StringPiece sp); + +/** + * Returns a subpiece with all whitespace removed from the back and front of @sp. + * Whitespace means any of [' ', '\n', '\r', '\t']. + */ +inline StringPiece trimWhitespace(StringPiece sp) { + return ltrimWhitespace(rtrimWhitespace(sp)); +} + /** * Returns a subpiece with all whitespace removed from the front of @sp. * Whitespace means any of [' ', '\n', '\r', '\t']. + * DEPRECATED: @see ltrimWhitespace @see rtrimWhitespace */ -StringPiece skipWhitespace(StringPiece sp); +inline StringPiece skipWhitespace(StringPiece sp) { + return ltrimWhitespace(sp); +} + +/** + * Strips the leading and the trailing whitespace-only lines. Then looks for + * the least indented non-whitespace-only line and removes its amount of + * leading whitespace from every line. Assumes leading whitespace is either all + * spaces or all tabs. + * + * Purpose: including a multiline string literal in source code, indented to + * the level expected from context. + */ +std::string stripLeftMargin(std::string s); /** * Fast, in-place lowercasing of ASCII alphabetic characters in strings. @@ -522,37 +629,22 @@ inline void toLowerAscii(MutableStringPiece str) { toLowerAscii(str.begin(), str.size()); } -} // namespace folly - -// Hash functions to make std::string usable with e.g. hash_map -// -// Handle interaction with different C++ standard libraries, which -// expect these types to be in different namespaces. -namespace std { - -template -struct hash > : private hash { - size_t operator()(const std::basic_string & s) const { - return hash::operator()(s.c_str()); - } +template >> +class UTF8Range : public Base { + public: + /* implicit */ UTF8Range(const folly::Range baseRange) + : Base(boost::u8_to_u32_iterator( + baseRange.begin(), baseRange.begin(), baseRange.end()), + boost::u8_to_u32_iterator( + baseRange.end(), baseRange.begin(), baseRange.end())) {} + /* implicit */ UTF8Range(const std::string& baseString) + : Base(folly::Range(baseString)) {} }; -} - -#if FOLLY_HAVE_DEPRECATED_ASSOC -#if defined(_GLIBCXX_SYMVER) && !defined(__BIONIC__) -namespace __gnu_cxx { +using UTF8StringPiece = UTF8Range; -template -struct hash > : private hash { - size_t operator()(const std::basic_string & s) const { - return hash::operator()(s.c_str()); - } -}; - -} -#endif -#endif +} // namespace folly // Hook into boost's type traits namespace boost { @@ -563,5 +655,3 @@ struct has_nothrow_constructor > : true_type { } // namespace boost #include - -#endif