cast.cpp 27 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844
  1. #include <util/system/defaults.h>
  2. #if defined(_freebsd_) && !defined(__LONG_LONG_SUPPORTED)
  3. #define __LONG_LONG_SUPPORTED
  4. #endif
  5. #include <cstdio>
  6. #include <string>
  7. #include <cmath>
  8. #include <util/string/type.h>
  9. #include <util/string/cast.h>
  10. #include <util/string/escape.h>
  11. #include <contrib/libs/double-conversion/double-conversion.h>
  12. #include <util/generic/string.h>
  13. #include <util/system/yassert.h>
  14. #include <util/generic/yexception.h>
  15. #include <util/generic/typetraits.h>
  16. #include <util/generic/ylimits.h>
  17. #include <util/generic/singleton.h>
  18. #include <util/generic/utility.h>
  19. using double_conversion::DoubleToStringConverter;
  20. using double_conversion::StringBuilder;
  21. using double_conversion::StringToDoubleConverter;
  22. /*
  23. * ------------------------------ formatters ------------------------------
  24. */
  25. namespace {
  26. constexpr char IntToChar[] = {'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'A', 'B', 'C', 'D', 'E', 'F'};
  27. static_assert(Y_ARRAY_SIZE(IntToChar) == 16, "expect Y_ARRAY_SIZE(IntToChar) == 16");
  28. // clang-format off
  29. constexpr int LetterToIntMap[] = {
  30. 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
  31. 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
  32. 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
  33. 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
  34. 20, 20, 20, 20, 20, 20, 20, 20, 0, 1,
  35. 2, 3, 4, 5, 6, 7, 8, 9, 20, 20,
  36. 20, 20, 20, 20, 20, 10, 11, 12, 13, 14,
  37. 15, 20, 20, 20, 20, 20, 20, 20, 20, 20,
  38. 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
  39. 20, 20, 20, 20, 20, 20, 20, 10, 11, 12,
  40. 13, 14, 15,
  41. };
  42. // clang-format on
  43. template <class T>
  44. std::enable_if_t<std::is_signed<T>::value, std::make_unsigned_t<T>> NegateNegativeSigned(T value) noexcept {
  45. return std::make_unsigned_t<T>(-(value + 1)) + std::make_unsigned_t<T>(1);
  46. }
  47. template <class T>
  48. std::enable_if_t<std::is_unsigned<T>::value, std::make_unsigned_t<T>> NegateNegativeSigned(T) noexcept {
  49. Y_UNREACHABLE();
  50. }
  51. template <class T>
  52. std::make_signed_t<T> NegatePositiveSigned(T value) noexcept {
  53. return value > 0 ? (-std::make_signed_t<T>(value - 1) - 1) : 0;
  54. }
  55. template <class T, unsigned base, class TChar>
  56. struct TBasicIntFormatter {
  57. static_assert(1 < base && base < 17, "expect 1 < base && base < 17");
  58. static_assert(std::is_unsigned<T>::value, "TBasicIntFormatter can only handle unsigned integers.");
  59. static inline size_t Format(T value, TChar* buf, size_t len) {
  60. Y_ENSURE(len, TStringBuf("zero length"));
  61. TChar* tmp = buf;
  62. do {
  63. // divide only once, do not use mod
  64. const T nextVal = static_cast<T>(value / base);
  65. *tmp++ = IntToChar[base == 2 || base == 4 || base == 8 || base == 16 ? value & (base - 1) : value - base * nextVal];
  66. value = nextVal;
  67. } while (value && --len);
  68. Y_ENSURE(!value, TStringBuf("not enough room in buffer"));
  69. const size_t result = tmp - buf;
  70. --tmp;
  71. while (buf < tmp) {
  72. TChar c = *buf;
  73. *buf = *tmp;
  74. *tmp = c;
  75. ++buf;
  76. --tmp;
  77. }
  78. return result;
  79. }
  80. };
  81. template <class T, unsigned base, class TChar>
  82. struct TIntFormatter {
  83. static_assert(1 < base && base < 17, "expect 1 < base && base < 17");
  84. static_assert(std::is_integral<T>::value, "T must be an integral type.");
  85. static inline size_t Format(T value, TChar* buf, size_t len) {
  86. using TUFmt = TBasicIntFormatter<std::make_unsigned_t<T>, base, TChar>;
  87. if (std::is_signed<T>::value && value < 0) {
  88. Y_ENSURE(len >= 2, TStringBuf("not enough room in buffer"));
  89. *buf = '-';
  90. return 1 + TUFmt::Format(NegateNegativeSigned(value), buf + 1, len - 1);
  91. }
  92. return TUFmt::Format(value, buf, len);
  93. }
  94. };
  95. template <class T>
  96. struct TFltModifiers;
  97. template <class T, int base, class TChar>
  98. Y_NO_INLINE size_t FormatInt(T value, TChar* buf, size_t len) {
  99. return TIntFormatter<T, base, TChar>::Format(value, buf, len);
  100. }
  101. template <class T>
  102. inline size_t FormatFlt(T t, char* buf, size_t len) {
  103. const int ret = snprintf(buf, len, TFltModifiers<T>::ModifierWrite, t);
  104. Y_ENSURE(ret >= 0 && (size_t)ret <= len, TStringBuf("cannot format float"));
  105. return (size_t)ret;
  106. }
  107. enum EParseStatus {
  108. PS_OK = 0,
  109. PS_EMPTY_STRING,
  110. PS_PLUS_STRING,
  111. PS_MINUS_STRING,
  112. PS_BAD_SYMBOL,
  113. PS_OVERFLOW,
  114. };
  115. constexpr ui8 SAFE_LENS[4][17] = {
  116. {0, 0, 7, 5, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1},
  117. {0, 0, 15, 10, 7, 6, 6, 5, 5, 5, 4, 4, 4, 4, 4, 4, 3},
  118. {0, 0, 31, 20, 15, 13, 12, 11, 10, 10, 9, 9, 8, 8, 8, 8, 7},
  119. {0, 0, 63, 40, 31, 27, 24, 22, 21, 20, 19, 18, 17, 17, 16, 16, 15},
  120. };
  121. inline constexpr ui8 ConstLog2(ui8 x) noexcept {
  122. return x == 1 ? 0 : 1 + ConstLog2(x / 2);
  123. }
  124. template <unsigned BASE, class TChar, class T>
  125. inline std::enable_if_t<(BASE > 10), bool> CharToDigit(TChar c, T* digit) noexcept {
  126. unsigned uc = c;
  127. if (uc >= Y_ARRAY_SIZE(LetterToIntMap)) {
  128. return false;
  129. }
  130. *digit = LetterToIntMap[uc];
  131. return *digit < BASE;
  132. }
  133. template <unsigned BASE, class TChar, class T>
  134. inline std::enable_if_t<(BASE <= 10), bool> CharToDigit(TChar c, T* digit) noexcept {
  135. return (c >= '0') && ((*digit = (c - '0')) < BASE);
  136. }
  137. template <class T, unsigned base, class TChar>
  138. struct TBasicIntParser {
  139. static_assert(1 < base && base < 17, "Expect 1 < base && base < 17.");
  140. static_assert(std::is_unsigned<T>::value, "TBasicIntParser can only handle unsigned integers.");
  141. enum : unsigned {
  142. BASE_POW_2 = base * base,
  143. };
  144. static inline EParseStatus Parse(const TChar** ppos, const TChar* end, T max, T* target) noexcept {
  145. Y_ASSERT(*ppos != end); /* This check should be somewhere up the stack. */
  146. const size_t maxSafeLen = SAFE_LENS[ConstLog2(sizeof(T))][base];
  147. // can parse without overflow
  148. if (size_t(end - *ppos) <= maxSafeLen) {
  149. T result;
  150. if (ParseFast(*ppos, end, &result) && result <= max) {
  151. *target = result;
  152. return PS_OK;
  153. }
  154. }
  155. return ParseSlow(ppos, end, max, target);
  156. }
  157. static inline bool ParseFast(const TChar* pos, const TChar* end, T* target) noexcept {
  158. T result = T();
  159. T d1;
  160. T d2;
  161. // we have end > pos
  162. auto beforeEnd = end - 1;
  163. while (pos < beforeEnd && CharToDigit<base>(*pos, &d1) && CharToDigit<base>(*(pos + 1), &d2)) {
  164. result = result * BASE_POW_2 + d1 * base + d2;
  165. pos += 2;
  166. }
  167. while (pos != end && CharToDigit<base>(*pos, &d1)) {
  168. result = result * base + d1;
  169. ++pos;
  170. }
  171. *target = result;
  172. return pos == end;
  173. }
  174. static inline EParseStatus ParseSlow(const TChar** ppos, const TChar* end, T max, T* target) noexcept {
  175. T result = T();
  176. T preMulMax = max / base;
  177. const TChar* pos = *ppos;
  178. while (pos != end) {
  179. T digit;
  180. if (!CharToDigit<base>(*pos, &digit)) {
  181. *ppos = pos;
  182. return PS_BAD_SYMBOL;
  183. }
  184. if (result > preMulMax) {
  185. return PS_OVERFLOW;
  186. }
  187. result *= base;
  188. if (result > max - digit) {
  189. return PS_OVERFLOW;
  190. }
  191. result += digit;
  192. pos++;
  193. }
  194. *target = result;
  195. return PS_OK;
  196. }
  197. };
  198. template <class T>
  199. struct TBounds {
  200. T PositiveMax;
  201. T NegativeMax;
  202. };
  203. template <class T, unsigned base, class TChar>
  204. struct TIntParser {
  205. static_assert(1 < base && base < 17, "Expect 1 < base && base < 17.");
  206. static_assert(std::is_integral<T>::value, "T must be an integral type.");
  207. enum {
  208. IsSigned = std::is_signed<T>::value
  209. };
  210. using TUnsigned = std::make_unsigned_t<T>;
  211. static inline EParseStatus Parse(const TChar** ppos, const TChar* end, const TBounds<TUnsigned>& bounds, T* target) {
  212. const TChar* pos = *ppos;
  213. if (pos == end) {
  214. return PS_EMPTY_STRING;
  215. }
  216. bool negative = false;
  217. TUnsigned max;
  218. if (*pos == '+') {
  219. pos++;
  220. max = bounds.PositiveMax;
  221. if (pos == end) {
  222. return PS_PLUS_STRING;
  223. }
  224. } else if (IsSigned && *pos == '-') {
  225. pos++;
  226. max = bounds.NegativeMax;
  227. negative = true;
  228. if (pos == end) {
  229. return PS_MINUS_STRING;
  230. }
  231. } else {
  232. max = bounds.PositiveMax;
  233. }
  234. TUnsigned result;
  235. EParseStatus error = TBasicIntParser<TUnsigned, base, TChar>::Parse(&pos, end, max, &result);
  236. if (error != PS_OK) {
  237. *ppos = pos;
  238. return error;
  239. }
  240. if (IsSigned) {
  241. *target = negative ? NegatePositiveSigned(result) : static_cast<T>(result);
  242. } else {
  243. *target = result;
  244. }
  245. return PS_OK;
  246. }
  247. };
  248. template <class TChar>
  249. [[noreturn]] static Y_NO_INLINE void ThrowParseError(EParseStatus status, const TChar* data, size_t len, const TChar* pos) {
  250. Y_ASSERT(status != PS_OK);
  251. typedef TBasicString<TChar> TStringType;
  252. switch (status) {
  253. case PS_EMPTY_STRING:
  254. ythrow TFromStringException() << TStringBuf("Cannot parse empty string as number. ");
  255. case PS_PLUS_STRING:
  256. ythrow TFromStringException() << TStringBuf("Cannot parse string \"+\" as number. ");
  257. case PS_MINUS_STRING:
  258. ythrow TFromStringException() << TStringBuf("Cannot parse string \"-\" as number. ");
  259. case PS_BAD_SYMBOL:
  260. ythrow TFromStringException() << TStringBuf("Unexpected symbol \"") << EscapeC(*pos) << TStringBuf("\" at pos ") << (pos - data) << TStringBuf(" in string ") << TStringType(data, len).Quote() << TStringBuf(". ");
  261. case PS_OVERFLOW:
  262. ythrow TFromStringException() << TStringBuf("Integer overflow in string ") << TStringType(data, len).Quote() << TStringBuf(". ");
  263. default:
  264. ythrow yexception() << TStringBuf("Unknown error code in string converter. ");
  265. }
  266. }
  267. template <typename T, typename TUnsigned, int base, typename TChar>
  268. Y_NO_INLINE T ParseInt(const TChar* data, size_t len, const TBounds<TUnsigned>& bounds) {
  269. T result;
  270. const TChar* pos = data;
  271. EParseStatus status = TIntParser<T, base, TChar>::Parse(&pos, pos + len, bounds, &result);
  272. if (status == PS_OK) {
  273. return result;
  274. } else {
  275. ThrowParseError(status, data, len, pos);
  276. }
  277. }
  278. template <typename T, typename TUnsigned, int base, typename TChar>
  279. Y_NO_INLINE bool TryParseInt(const TChar* data, size_t len, const TBounds<TUnsigned>& bounds, T* result) {
  280. return TIntParser<T, base, TChar>::Parse(&data, data + len, bounds, result) == PS_OK;
  281. }
  282. template <class T>
  283. inline T ParseFlt(const char* data, size_t len) {
  284. /*
  285. * TODO
  286. */
  287. if (len > 256) {
  288. len = 256;
  289. }
  290. char* c = (char*)alloca(len + 1);
  291. memcpy(c, data, len);
  292. c[len] = 0;
  293. T ret;
  294. char ec;
  295. // try to read a value and an extra character in order to catch cases when
  296. // the string start with a valid float but is followed by unexpected characters
  297. if (sscanf(c, TFltModifiers<T>::ModifierReadAndChar, &ret, &ec) == 1) {
  298. return ret;
  299. }
  300. ythrow TFromStringException() << TStringBuf("cannot parse float(") << TStringBuf(data, len) << TStringBuf(")");
  301. }
  302. #define DEF_FLT_MOD(type, modifierWrite, modifierRead) \
  303. template <> \
  304. struct TFltModifiers<type> { \
  305. static const char* const ModifierWrite; \
  306. static const char* const ModifierReadAndChar; \
  307. }; \
  308. \
  309. const char* const TFltModifiers<type>::ModifierWrite = modifierWrite; \
  310. const char* const TFltModifiers<type>::ModifierReadAndChar = modifierRead "%c";
  311. DEF_FLT_MOD(long double, "%.10Lg", "%Lg")
  312. #undef DEF_FLT_MOD
  313. /* The following constants are initialized in terms of <climits> constants to make
  314. * sure they go into binary as actual values and there is no associated
  315. * initialization code.
  316. * */
  317. constexpr TBounds<ui64> bSBounds = {static_cast<ui64>(SCHAR_MAX), static_cast<ui64>(UCHAR_MAX - SCHAR_MAX)};
  318. constexpr TBounds<ui64> bUBounds = {static_cast<ui64>(UCHAR_MAX), 0};
  319. constexpr TBounds<ui64> sSBounds = {static_cast<ui64>(SHRT_MAX), static_cast<ui64>(USHRT_MAX - SHRT_MAX)};
  320. constexpr TBounds<ui64> sUBounds = {static_cast<ui64>(USHRT_MAX), 0};
  321. constexpr TBounds<ui64> iSBounds = {static_cast<ui64>(INT_MAX), static_cast<ui64>(UINT_MAX - INT_MAX)};
  322. constexpr TBounds<ui64> iUBounds = {static_cast<ui64>(UINT_MAX), 0};
  323. constexpr TBounds<ui64> lSBounds = {static_cast<ui64>(LONG_MAX), static_cast<ui64>(ULONG_MAX - LONG_MAX)};
  324. constexpr TBounds<ui64> lUBounds = {static_cast<ui64>(ULONG_MAX), 0};
  325. constexpr TBounds<ui64> llSBounds = {static_cast<ui64>(LLONG_MAX), static_cast<ui64>(ULLONG_MAX - LLONG_MAX)};
  326. constexpr TBounds<ui64> llUBounds = {static_cast<ui64>(ULLONG_MAX), 0};
  327. }
  328. #define DEF_INT_SPEC_II(TYPE, ITYPE, BASE) \
  329. template <> \
  330. size_t IntToString<BASE, TYPE>(TYPE value, char* buf, size_t len) { \
  331. return FormatInt<ITYPE, BASE, char>(value, buf, len); \
  332. }
  333. #define DEF_INT_SPEC_I(TYPE, ITYPE) \
  334. template <> \
  335. size_t ToStringImpl<TYPE>(TYPE value, char* buf, size_t len) { \
  336. return FormatInt<ITYPE, 10, char>(value, buf, len); \
  337. } \
  338. DEF_INT_SPEC_II(TYPE, ITYPE, 2) \
  339. DEF_INT_SPEC_II(TYPE, ITYPE, 8) \
  340. DEF_INT_SPEC_II(TYPE, ITYPE, 10) \
  341. DEF_INT_SPEC_II(TYPE, ITYPE, 16)
  342. #define DEF_INT_SPEC(TYPE) \
  343. DEF_INT_SPEC_I(signed TYPE, i64) \
  344. DEF_INT_SPEC_I(unsigned TYPE, ui64)
  345. DEF_INT_SPEC(char)
  346. DEF_INT_SPEC(short)
  347. DEF_INT_SPEC(int)
  348. DEF_INT_SPEC(long)
  349. DEF_INT_SPEC(long long)
  350. #ifdef __cpp_char8_t
  351. template <>
  352. size_t ToStringImpl<char8_t>(char8_t value, char* buf, size_t len) {
  353. return FormatInt<ui64, 10, char>(value, buf, len);
  354. }
  355. #endif
  356. using TCharIType = std::conditional_t<std::is_signed<char>::value, i64, ui64>;
  357. using TWCharIType = std::conditional_t<std::is_signed<wchar_t>::value, i64, ui64>;
  358. DEF_INT_SPEC_I(char, TCharIType)
  359. DEF_INT_SPEC_I(wchar_t, TWCharIType)
  360. DEF_INT_SPEC_I(wchar16, ui64) // wchar16 is always unsigned
  361. DEF_INT_SPEC_I(wchar32, ui64) // wchar32 is always unsigned
  362. #undef DEF_INT_SPEC
  363. #undef DEF_INT_SPEC_I
  364. #undef DEF_INT_SPEC_II
  365. #define DEF_FLT_SPEC(type) \
  366. template <> \
  367. size_t ToStringImpl<type>(type t, char* buf, size_t len) { \
  368. return FormatFlt<type>(t, buf, len); \
  369. }
  370. DEF_FLT_SPEC(long double)
  371. #undef DEF_FLT_SPEC
  372. template <>
  373. size_t ToStringImpl<bool>(bool t, char* buf, size_t len) {
  374. Y_ENSURE(len, TStringBuf("zero length"));
  375. *buf = t ? '1' : '0';
  376. return 1;
  377. }
  378. /*
  379. * ------------------------------ parsers ------------------------------
  380. */
  381. template <>
  382. bool TryFromStringImpl<bool>(const char* data, size_t len, bool& result) {
  383. if (len == 1) {
  384. if (data[0] == '0') {
  385. result = false;
  386. return true;
  387. } else if (data[0] == '1') {
  388. result = true;
  389. return true;
  390. }
  391. }
  392. TStringBuf buf(data, len);
  393. if (IsTrue(buf)) {
  394. result = true;
  395. return true;
  396. } else if (IsFalse(buf)) {
  397. result = false;
  398. return true;
  399. }
  400. return false;
  401. }
  402. template <>
  403. bool FromStringImpl<bool>(const char* data, size_t len) {
  404. bool result;
  405. if (!TryFromStringImpl<bool>(data, len, result)) {
  406. ythrow TFromStringException() << TStringBuf("Cannot parse bool(") << TStringBuf(data, len) << TStringBuf("). ");
  407. }
  408. return result;
  409. }
  410. template <>
  411. TString FromStringImpl<TString>(const char* data, size_t len) {
  412. return TString(data, len);
  413. }
  414. template <>
  415. TStringBuf FromStringImpl<TStringBuf>(const char* data, size_t len) {
  416. return TStringBuf(data, len);
  417. }
  418. template <>
  419. std::string FromStringImpl<std::string>(const char* data, size_t len) {
  420. return std::string(data, len);
  421. }
  422. template <>
  423. TUtf16String FromStringImpl<TUtf16String>(const wchar16* data, size_t len) {
  424. return TUtf16String(data, len);
  425. }
  426. template <>
  427. TWtringBuf FromStringImpl<TWtringBuf>(const wchar16* data, size_t len) {
  428. return TWtringBuf(data, len);
  429. }
  430. // Try-versions
  431. template <>
  432. bool TryFromStringImpl<TStringBuf>(const char* data, size_t len, TStringBuf& result) {
  433. result = {data, len};
  434. return true;
  435. }
  436. template <>
  437. bool TryFromStringImpl<TString>(const char* data, size_t len, TString& result) {
  438. result = TString(data, len);
  439. return true;
  440. }
  441. template <>
  442. bool TryFromStringImpl<std::string>(const char* data, size_t len, std::string& result) {
  443. result.assign(data, len);
  444. return true;
  445. }
  446. template <>
  447. bool TryFromStringImpl<TWtringBuf>(const wchar16* data, size_t len, TWtringBuf& result) {
  448. result = {data, len};
  449. return true;
  450. }
  451. template <>
  452. bool TryFromStringImpl<TUtf16String>(const wchar16* data, size_t len, TUtf16String& result) {
  453. result = TUtf16String(data, len);
  454. return true;
  455. }
  456. #define DEF_INT_SPEC_III(CHAR, TYPE, ITYPE, BOUNDS, BASE) \
  457. template <> \
  458. TYPE IntFromString<TYPE, BASE>(const CHAR* data, size_t len) { \
  459. return ParseInt<ITYPE, ui64, BASE>(data, len, BOUNDS); \
  460. } \
  461. template <> \
  462. bool TryIntFromString<BASE>(const CHAR* data, size_t len, TYPE& result) { \
  463. ITYPE tmp; \
  464. bool status = TryParseInt<ITYPE, ui64, BASE>(data, len, BOUNDS, &tmp); \
  465. if (status) { \
  466. result = tmp; \
  467. } \
  468. return status; \
  469. }
  470. #define DEF_INT_SPEC_II(CHAR, TYPE, ITYPE, BOUNDS) \
  471. template <> \
  472. TYPE FromStringImpl<TYPE>(const CHAR* data, size_t len) { \
  473. return ParseInt<ITYPE, ui64, 10>(data, len, BOUNDS); \
  474. } \
  475. template <> \
  476. bool TryFromStringImpl<TYPE>(const CHAR* data, size_t len, TYPE& result) { \
  477. ITYPE tmp; \
  478. bool status = TryParseInt<ITYPE, ui64, 10>(data, len, BOUNDS, &tmp); \
  479. if (status) { \
  480. result = tmp; \
  481. } \
  482. return status; \
  483. } \
  484. DEF_INT_SPEC_III(CHAR, TYPE, ITYPE, BOUNDS, 2) \
  485. DEF_INT_SPEC_III(CHAR, TYPE, ITYPE, BOUNDS, 8) \
  486. DEF_INT_SPEC_III(CHAR, TYPE, ITYPE, BOUNDS, 10) \
  487. DEF_INT_SPEC_III(CHAR, TYPE, ITYPE, BOUNDS, 16)
  488. #define DEF_INT_SPEC_I(TYPE, ITYPE, BOUNDS) \
  489. DEF_INT_SPEC_II(char, TYPE, ITYPE, BOUNDS) \
  490. DEF_INT_SPEC_II(wchar16, TYPE, ITYPE, BOUNDS)
  491. #define DEF_INT_SPEC(TYPE, ID) \
  492. DEF_INT_SPEC_I(signed TYPE, i64, ID##SBounds) \
  493. DEF_INT_SPEC_I(unsigned TYPE, ui64, ID##UBounds)
  494. #define DEF_INT_SPEC_FIXED_WIDTH(TYPE, ID) \
  495. DEF_INT_SPEC_I(TYPE, i64, ID##SBounds) \
  496. DEF_INT_SPEC_I(u##TYPE, ui64, ID##UBounds)
  497. DEF_INT_SPEC_FIXED_WIDTH(i8, b)
  498. DEF_INT_SPEC(short, s)
  499. DEF_INT_SPEC(int, i)
  500. DEF_INT_SPEC(long, l)
  501. DEF_INT_SPEC(long long, ll)
  502. #undef DEF_INT_SPEC_FIXED_WIDTH
  503. #undef DEF_INT_SPEC
  504. #undef DEF_INT_SPEC_I
  505. #undef DEF_INT_SPEC_II
  506. #undef DEF_INT_SPEC_III
  507. #define DEF_FLT_SPEC(type) \
  508. template <> \
  509. type FromStringImpl<type>(const char* data, size_t len) { \
  510. return ParseFlt<type>(data, len); \
  511. }
  512. DEF_FLT_SPEC(long double)
  513. #undef DEF_FLT_SPEC
  514. // Using StrToD for float and double because it is faster than sscanf.
  515. // Exception-free, specialized for float types
  516. template <>
  517. bool TryFromStringImpl<double>(const char* data, size_t len, double& result) {
  518. if (!len) {
  519. return false;
  520. }
  521. char* se = nullptr;
  522. double d = StrToD(data, data + len, &se);
  523. if (se != data + len) {
  524. return false;
  525. }
  526. result = d;
  527. return true;
  528. }
  529. template <>
  530. bool TryFromStringImpl<float>(const char* data, size_t len, float& result) {
  531. double d;
  532. if (TryFromStringImpl<double>(data, len, d)) {
  533. result = static_cast<float>(d);
  534. return true;
  535. }
  536. return false;
  537. }
  538. template <>
  539. bool TryFromStringImpl<long double>(const char* data, size_t len, long double& result) {
  540. double d;
  541. if (TryFromStringImpl<double>(data, len, d)) {
  542. result = static_cast<long double>(d);
  543. return true;
  544. }
  545. return false;
  546. }
  547. // Exception-throwing, specialized for float types
  548. template <>
  549. double FromStringImpl<double>(const char* data, size_t len) {
  550. double d = 0.0;
  551. if (!TryFromStringImpl(data, len, d)) {
  552. ythrow TFromStringException() << TStringBuf("cannot parse float(") << TStringBuf(data, len) << TStringBuf(")");
  553. }
  554. return d;
  555. }
  556. template <>
  557. float FromStringImpl<float>(const char* data, size_t len) {
  558. return static_cast<float>(FromStringImpl<double>(data, len));
  559. }
  560. double StrToD(const char* b, const char* e, char** se) {
  561. struct TCvt: public StringToDoubleConverter {
  562. inline TCvt()
  563. : StringToDoubleConverter(ALLOW_TRAILING_JUNK | ALLOW_HEX | ALLOW_LEADING_SPACES, 0.0, NAN, nullptr, nullptr)
  564. {
  565. }
  566. };
  567. int out = 0;
  568. const auto res = SingletonWithPriority<TCvt, 0>()->StringToDouble(b, e - b, &out);
  569. if (se) {
  570. *se = (char*)(b + out);
  571. }
  572. return res;
  573. }
  574. double StrToD(const char* b, char** se) {
  575. return StrToD(b, b + strlen(b), se);
  576. }
  577. namespace {
  578. static inline DoubleToStringConverter& ToStringConverterNoPad() noexcept {
  579. struct TCvt: public DoubleToStringConverter {
  580. inline TCvt() noexcept
  581. : DoubleToStringConverter(EMIT_POSITIVE_EXPONENT_SIGN, "inf", "nan", 'e', -10, 21, 4, 0)
  582. {
  583. }
  584. };
  585. return *SingletonWithPriority<TCvt, 0>();
  586. }
  587. struct TBuilder {
  588. alignas(StringBuilder) char Store[sizeof(StringBuilder)];
  589. StringBuilder* SB;
  590. inline TBuilder(char* buf, size_t len) noexcept
  591. : SB(new (Store) StringBuilder(buf, len))
  592. {
  593. }
  594. };
  595. static inline size_t FixZeros(char* buf, size_t len) noexcept {
  596. auto end = buf + len;
  597. auto point = (char*)memchr(buf, '.', len);
  598. if (!point) {
  599. return len;
  600. }
  601. auto exp = (char*)memchr(point, 'e', end - point);
  602. if (!exp) {
  603. exp = end;
  604. }
  605. auto c = exp;
  606. c -= 1;
  607. while (point < c && *c == '0') {
  608. --c;
  609. }
  610. if (*c == '.') {
  611. --c;
  612. }
  613. memmove(c + 1, exp, end - exp);
  614. return c - buf + 1 + end - exp;
  615. }
  616. static inline size_t FixEnd(char* buf, size_t len) noexcept {
  617. if (len > 2) {
  618. auto sign = buf[len - 2];
  619. if (sign == '-' || sign == '+') {
  620. buf[len] = buf[len - 1];
  621. buf[len - 1] = '0';
  622. ++len;
  623. }
  624. }
  625. buf[len] = 0;
  626. return len;
  627. }
  628. static inline size_t DoDtoa(double d, char* buf, size_t len, int prec) noexcept {
  629. TBuilder sb(buf, len);
  630. Y_VERIFY(ToStringConverterNoPad().ToPrecision(d, prec, sb.SB), "conversion failed");
  631. return FixEnd(buf, FixZeros(buf, sb.SB->position()));
  632. }
  633. }
  634. template <>
  635. size_t ToStringImpl<double>(double d, char* buf, size_t len) {
  636. return DoDtoa(d, buf, len, 10);
  637. }
  638. template <>
  639. size_t ToStringImpl<float>(float f, char* buf, size_t len) {
  640. return DoDtoa(f, buf, len, 6);
  641. }
  642. size_t FloatToString(float t, char* buf, size_t len, EFloatToStringMode mode, int ndigits) {
  643. if (mode == PREC_AUTO) {
  644. TBuilder sb(buf, len);
  645. Y_VERIFY(ToStringConverterNoPad().ToShortestSingle(t, sb.SB), "conversion failed");
  646. return FixEnd(buf, sb.SB->position());
  647. }
  648. return FloatToString((double)t, buf, len, mode, ndigits);
  649. }
  650. size_t FloatToString(double t, char* buf, size_t len, EFloatToStringMode mode, int ndigits) {
  651. if (mode == PREC_NDIGITS) {
  652. auto minDigits = DoubleToStringConverter::kMinPrecisionDigits;
  653. auto maxDigits = DoubleToStringConverter::kMaxPrecisionDigits;
  654. return DoDtoa(t, buf, len, ClampVal(ndigits, minDigits, maxDigits));
  655. }
  656. TBuilder sb(buf, len);
  657. if (mode == PREC_AUTO) {
  658. Y_VERIFY(ToStringConverterNoPad().ToShortest(t, sb.SB), "conversion failed");
  659. return FixEnd(buf, sb.SB->position());
  660. }
  661. if (!ToStringConverterNoPad().ToFixed(t, ndigits, sb.SB)) {
  662. return FloatToString(t, buf, len, PREC_AUTO);
  663. }
  664. if (mode == PREC_POINT_DIGITS_STRIP_ZEROES) {
  665. return FixZeros(buf, sb.SB->position());
  666. }
  667. return sb.SB->position();
  668. }