/* auto-generated on 2023-07-23 15:03:22 -0400. Do not edit! */ /* begin file include/ada.h */ /** * @file ada.h * @brief Includes all definitions for Ada. */ #ifndef ADA_H #define ADA_H /* begin file include/ada/ada_idna.h */ /* auto-generated on 2023-05-07 19:12:14 -0400. Do not edit! */ /* begin file include/idna.h */ #ifndef ADA_IDNA_H #define ADA_IDNA_H /* begin file include/ada/idna/unicode_transcoding.h */ #ifndef ADA_IDNA_UNICODE_TRANSCODING_H #define ADA_IDNA_UNICODE_TRANSCODING_H #include #include namespace ada::idna { size_t utf8_to_utf32(const char* buf, size_t len, char32_t* utf32_output); size_t utf8_length_from_utf32(const char32_t* buf, size_t len); size_t utf32_length_from_utf8(const char* buf, size_t len); size_t utf32_to_utf8(const char32_t* buf, size_t len, char* utf8_output); } // namespace ada::idna #endif // ADA_IDNA_UNICODE_TRANSCODING_H /* end file include/ada/idna/unicode_transcoding.h */ /* begin file include/ada/idna/mapping.h */ #ifndef ADA_IDNA_MAPPING_H #define ADA_IDNA_MAPPING_H #include #include namespace ada::idna { // If the input is ascii, then the mapping is just -> lower case. void ascii_map(char* input, size_t length); // check whether an ascii string needs mapping bool ascii_has_upper_case(char* input, size_t length); // Map the characters according to IDNA, returning the empty string on error. std::u32string map(std::u32string_view input); } // namespace ada::idna #endif /* end file include/ada/idna/mapping.h */ /* begin file include/ada/idna/normalization.h */ #ifndef ADA_IDNA_NORMALIZATION_H #define ADA_IDNA_NORMALIZATION_H #include #include namespace ada::idna { // Normalize the characters according to IDNA (Unicode Normalization Form C). void normalize(std::u32string& input); } // namespace ada::idna #endif /* end file include/ada/idna/normalization.h */ /* begin file include/ada/idna/punycode.h */ #ifndef ADA_IDNA_PUNYCODE_H #define ADA_IDNA_PUNYCODE_H #include #include namespace ada::idna { bool punycode_to_utf32(std::string_view input, std::u32string& out); bool verify_punycode(std::string_view input); bool utf32_to_punycode(std::u32string_view input, std::string& out); } // namespace ada::idna #endif // ADA_IDNA_PUNYCODE_H /* end file include/ada/idna/punycode.h */ /* begin file include/ada/idna/validity.h */ #ifndef ADA_IDNA_VALIDITY_H #define ADA_IDNA_VALIDITY_H #include #include namespace ada::idna { /** * @see https://www.unicode.org/reports/tr46/#Validity_Criteria */ bool is_label_valid(const std::u32string_view label); } // namespace ada::idna #endif // ADA_IDNA_VALIDITY_H /* end file include/ada/idna/validity.h */ /* begin file include/ada/idna/to_ascii.h */ #ifndef ADA_IDNA_TO_ASCII_H #define ADA_IDNA_TO_ASCII_H #include #include namespace ada::idna { // Converts a domain (e.g., www.google.com) possibly containing international // characters to an ascii domain (with punycode). It will not do percent // decoding: percent decoding should be done prior to calling this function. We // do not remove tabs and spaces, they should have been removed prior to calling // this function. We also do not trim control characters. We also assume that // the input is not empty. We return "" on error. // // // This function may accept or even produce invalid domains. std::string to_ascii(std::string_view ut8_string); // Returns true if the string contains a forbidden code point according to the // WHATGL URL specification: // https://url.spec.whatwg.org/#forbidden-domain-code-point bool contains_forbidden_domain_code_point(std::string_view ascii_string); bool constexpr begins_with(std::u32string_view view, std::u32string_view prefix); bool constexpr begins_with(std::string_view view, std::string_view prefix); bool constexpr is_ascii(std::u32string_view view); bool constexpr is_ascii(std::string_view view); } // namespace ada::idna #endif // ADA_IDNA_TO_ASCII_H /* end file include/ada/idna/to_ascii.h */ /* begin file include/ada/idna/to_unicode.h */ #ifndef ADA_IDNA_TO_UNICODE_H #define ADA_IDNA_TO_UNICODE_H #include namespace ada::idna { std::string to_unicode(std::string_view input); } // namespace ada::idna #endif // ADA_IDNA_TO_UNICODE_H /* end file include/ada/idna/to_unicode.h */ #endif /* end file include/idna.h */ /* end file include/ada/ada_idna.h */ /* begin file include/ada/character_sets-inl.h */ /** * @file character_sets-inl.h * @brief Definitions of the character sets used by unicode functions. * @author Node.js * @see https://github.com/nodejs/node/blob/main/src/node_url_tables.cc */ #ifndef ADA_CHARACTER_SETS_INL_H #define ADA_CHARACTER_SETS_INL_H /* begin file include/ada/character_sets.h */ /** * @file character_sets.h * @brief Declaration of the character sets used by unicode functions. * @author Node.js * @see https://github.com/nodejs/node/blob/main/src/node_url_tables.cc */ #ifndef ADA_CHARACTER_SETS_H #define ADA_CHARACTER_SETS_H /* begin file include/ada/common_defs.h */ /** * @file common_defs.h * @brief Common definitions for cross-platform compiler support. */ #ifndef ADA_COMMON_DEFS_H #define ADA_COMMON_DEFS_H #ifdef _MSC_VER #define ADA_VISUAL_STUDIO 1 /** * We want to differentiate carefully between * clang under visual studio and regular visual * studio. */ #ifdef __clang__ // clang under visual studio #define ADA_CLANG_VISUAL_STUDIO 1 #else // just regular visual studio (best guess) #define ADA_REGULAR_VISUAL_STUDIO 1 #endif // __clang__ #endif // _MSC_VER #if defined(__GNUC__) // Marks a block with a name so that MCA analysis can see it. #define ADA_BEGIN_DEBUG_BLOCK(name) __asm volatile("# LLVM-MCA-BEGIN " #name); #define ADA_END_DEBUG_BLOCK(name) __asm volatile("# LLVM-MCA-END " #name); #define ADA_DEBUG_BLOCK(name, block) \ BEGIN_DEBUG_BLOCK(name); \ block; \ END_DEBUG_BLOCK(name); #else #define ADA_BEGIN_DEBUG_BLOCK(name) #define ADA_END_DEBUG_BLOCK(name) #define ADA_DEBUG_BLOCK(name, block) #endif // Align to N-byte boundary #define ADA_ROUNDUP_N(a, n) (((a) + ((n)-1)) & ~((n)-1)) #define ADA_ROUNDDOWN_N(a, n) ((a) & ~((n)-1)) #define ADA_ISALIGNED_N(ptr, n) (((uintptr_t)(ptr) & ((n)-1)) == 0) #if defined(ADA_REGULAR_VISUAL_STUDIO) #define ada_really_inline __forceinline #define ada_never_inline __declspec(noinline) #define ada_unused #define ada_warn_unused #ifndef ada_likely #define ada_likely(x) x #endif #ifndef ada_unlikely #define ada_unlikely(x) x #endif #define ADA_PUSH_DISABLE_WARNINGS __pragma(warning(push)) #define ADA_PUSH_DISABLE_ALL_WARNINGS __pragma(warning(push, 0)) #define ADA_DISABLE_VS_WARNING(WARNING_NUMBER) \ __pragma(warning(disable : WARNING_NUMBER)) // Get rid of Intellisense-only warnings (Code Analysis) // Though __has_include is C++17, it is supported in Visual Studio 2017 or // better (_MSC_VER>=1910). #ifdef __has_include #if __has_include() #include #define ADA_DISABLE_UNDESIRED_WARNINGS \ ADA_DISABLE_VS_WARNING(ALL_CPPCORECHECK_WARNINGS) #endif #endif #ifndef ADA_DISABLE_UNDESIRED_WARNINGS #define ADA_DISABLE_UNDESIRED_WARNINGS #endif #define ADA_DISABLE_DEPRECATED_WARNING ADA_DISABLE_VS_WARNING(4996) #define ADA_DISABLE_STRICT_OVERFLOW_WARNING #define ADA_POP_DISABLE_WARNINGS __pragma(warning(pop)) #else // ADA_REGULAR_VISUAL_STUDIO #define ada_really_inline inline __attribute__((always_inline)) #define ada_never_inline inline __attribute__((noinline)) #define ada_unused __attribute__((unused)) #define ada_warn_unused __attribute__((warn_unused_result)) #ifndef ada_likely #define ada_likely(x) __builtin_expect(!!(x), 1) #endif #ifndef ada_unlikely #define ada_unlikely(x) __builtin_expect(!!(x), 0) #endif #define ADA_PUSH_DISABLE_WARNINGS _Pragma("GCC diagnostic push") // gcc doesn't seem to disable all warnings with all and extra, add warnings // here as necessary #define ADA_PUSH_DISABLE_ALL_WARNINGS \ ADA_PUSH_DISABLE_WARNINGS \ ADA_DISABLE_GCC_WARNING("-Weffc++") \ ADA_DISABLE_GCC_WARNING("-Wall") \ ADA_DISABLE_GCC_WARNING("-Wconversion") \ ADA_DISABLE_GCC_WARNING("-Wextra") \ ADA_DISABLE_GCC_WARNING("-Wattributes") \ ADA_DISABLE_GCC_WARNING("-Wimplicit-fallthrough") \ ADA_DISABLE_GCC_WARNING("-Wnon-virtual-dtor") \ ADA_DISABLE_GCC_WARNING("-Wreturn-type") \ ADA_DISABLE_GCC_WARNING("-Wshadow") \ ADA_DISABLE_GCC_WARNING("-Wunused-parameter") \ ADA_DISABLE_GCC_WARNING("-Wunused-variable") #define ADA_PRAGMA(P) _Pragma(#P) #define ADA_DISABLE_GCC_WARNING(WARNING) \ ADA_PRAGMA(GCC diagnostic ignored WARNING) #if defined(ADA_CLANG_VISUAL_STUDIO) #define ADA_DISABLE_UNDESIRED_WARNINGS \ ADA_DISABLE_GCC_WARNING("-Wmicrosoft-include") #else #define ADA_DISABLE_UNDESIRED_WARNINGS #endif #define ADA_DISABLE_DEPRECATED_WARNING \ ADA_DISABLE_GCC_WARNING("-Wdeprecated-declarations") #define ADA_DISABLE_STRICT_OVERFLOW_WARNING \ ADA_DISABLE_GCC_WARNING("-Wstrict-overflow") #define ADA_POP_DISABLE_WARNINGS _Pragma("GCC diagnostic pop") #endif // MSC_VER #if defined(ADA_VISUAL_STUDIO) /** * It does not matter here whether you are using * the regular visual studio or clang under visual * studio. */ #if ADA_USING_LIBRARY #define ADA_DLLIMPORTEXPORT __declspec(dllimport) #else #define ADA_DLLIMPORTEXPORT __declspec(dllexport) #endif #else #define ADA_DLLIMPORTEXPORT #endif /// If EXPR is an error, returns it. #define ADA_TRY(EXPR) \ { \ auto _err = (EXPR); \ if (_err) { \ return _err; \ } \ } // __has_cpp_attribute is part of C++20 #if !defined(__has_cpp_attribute) #define __has_cpp_attribute(x) 0 #endif #if __has_cpp_attribute(gnu::noinline) #define ADA_ATTRIBUTE_NOINLINE [[gnu::noinline]] #else #define ADA_ATTRIBUTE_NOINLINE #endif namespace ada { [[noreturn]] inline void unreachable() { #ifdef __GNUC__ __builtin_unreachable(); #elif defined(_MSC_VER) __assume(false); #else #endif } } // namespace ada #if defined(__GNUC__) && !defined(__clang__) #if __GNUC__ <= 8 #define ADA_OLD_GCC 1 #endif // __GNUC__ <= 8 #endif // defined(__GNUC__) && !defined(__clang__) #if ADA_OLD_GCC #define ada_constexpr #else #define ada_constexpr constexpr #endif #if defined(__BYTE_ORDER__) && defined(__ORDER_BIG_ENDIAN__) #define ADA_IS_BIG_ENDIAN (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__) #elif defined(_WIN32) #define ADA_IS_BIG_ENDIAN 0 #else #if defined(__APPLE__) || \ defined(__FreeBSD__) // defined __BYTE_ORDER__ && defined // __ORDER_BIG_ENDIAN__ #include #elif defined(sun) || \ defined(__sun) // defined(__APPLE__) || defined(__FreeBSD__) #include #else // defined(__APPLE__) || defined(__FreeBSD__) #ifdef __has_include #if __has_include() #include #endif //__has_include() #endif //__has_include #endif // defined(__APPLE__) || defined(__FreeBSD__) #ifndef !defined(__BYTE_ORDER__) || !defined(__ORDER_LITTLE_ENDIAN__) #define ADA_IS_BIG_ENDIAN 0 #endif #if __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ #define ADA_IS_BIG_ENDIAN 0 #else // __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ #define ADA_IS_BIG_ENDIAN 1 #endif // __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__ #endif // defined __BYTE_ORDER__ && defined __ORDER_BIG_ENDIAN__ // Unless the programmer has already set ADA_DEVELOPMENT_CHECKS, // we want to set it under debug builds. We detect a debug build // under Visual Studio when the _DEBUG macro is set. Under the other // compilers, we use the fact that they define __OPTIMIZE__ whenever // they allow optimizations. // It is possible that this could miss some cases where ADA_DEVELOPMENT_CHECKS // is helpful, but the programmer can set the macro ADA_DEVELOPMENT_CHECKS. // It could also wrongly set ADA_DEVELOPMENT_CHECKS (e.g., if the programmer // sets _DEBUG in a release build under Visual Studio, or if some compiler fails // to set the __OPTIMIZE__ macro). #if !defined(ADA_DEVELOPMENT_CHECKS) && !defined(NDEBUG) #ifdef _MSC_VER // Visual Studio seems to set _DEBUG for debug builds. #ifdef _DEBUG #define ADA_DEVELOPMENT_CHECKS 1 #endif // _DEBUG #else // _MSC_VER // All other compilers appear to set __OPTIMIZE__ to a positive integer // when the compiler is optimizing. #ifndef __OPTIMIZE__ #define ADA_DEVELOPMENT_CHECKS 1 #endif // __OPTIMIZE__ #endif // _MSC_VER #endif // ADA_DEVELOPMENT_CHECKS #define ADA_STR(x) #x #if ADA_DEVELOPMENT_CHECKS #define ADA_REQUIRE(EXPR) \ { \ if (!(EXPR) { abort(); }) } #define ADA_FAIL(MESSAGE) \ do { \ std::cerr << "FAIL: " << (MESSAGE) << std::endl; \ abort(); \ } while (0); #define ADA_ASSERT_EQUAL(LHS, RHS, MESSAGE) \ do { \ if (LHS != RHS) { \ std::cerr << "Mismatch: '" << LHS << "' - '" << RHS << "'" << std::endl; \ ADA_FAIL(MESSAGE); \ } \ } while (0); #define ADA_ASSERT_TRUE(COND) \ do { \ if (!(COND)) { \ std::cerr << "Assert at line " << __LINE__ << " of file " << __FILE__ \ << std::endl; \ ADA_FAIL(ADA_STR(COND)); \ } \ } while (0); #else #define ADA_FAIL(MESSAGE) #define ADA_ASSERT_EQUAL(LHS, RHS, MESSAGE) #define ADA_ASSERT_TRUE(COND) #endif #ifdef ADA_VISUAL_STUDIO #define ADA_ASSUME(COND) __assume(COND) #else #define ADA_ASSUME(COND) \ do { \ if (!(COND)) __builtin_unreachable(); \ } while (0) #endif #if defined(__SSE2__) || defined(__x86_64__) || defined(__x86_64) || \ (defined(_M_AMD64) || defined(_M_X64) || \ (defined(_M_IX86_FP) && _M_IX86_FP == 2)) #define ADA_SSE2 1 #endif #if defined(__aarch64__) || defined(_M_ARM64) #define ADA_NEON 1 #endif #endif // ADA_COMMON_DEFS_H /* end file include/ada/common_defs.h */ #include /** * @namespace ada::character_sets * @brief Includes the definitions for unicode character sets. */ namespace ada::character_sets { ada_really_inline bool bit_at(const uint8_t a[], const uint8_t i); } // namespace ada::character_sets #endif // ADA_CHARACTER_SETS_H /* end file include/ada/character_sets.h */ namespace ada::character_sets { constexpr char hex[1024] = "%00\0%01\0%02\0%03\0%04\0%05\0%06\0%07\0" "%08\0%09\0%0A\0%0B\0%0C\0%0D\0%0E\0%0F\0" "%10\0%11\0%12\0%13\0%14\0%15\0%16\0%17\0" "%18\0%19\0%1A\0%1B\0%1C\0%1D\0%1E\0%1F\0" "%20\0%21\0%22\0%23\0%24\0%25\0%26\0%27\0" "%28\0%29\0%2A\0%2B\0%2C\0%2D\0%2E\0%2F\0" "%30\0%31\0%32\0%33\0%34\0%35\0%36\0%37\0" "%38\0%39\0%3A\0%3B\0%3C\0%3D\0%3E\0%3F\0" "%40\0%41\0%42\0%43\0%44\0%45\0%46\0%47\0" "%48\0%49\0%4A\0%4B\0%4C\0%4D\0%4E\0%4F\0" "%50\0%51\0%52\0%53\0%54\0%55\0%56\0%57\0" "%58\0%59\0%5A\0%5B\0%5C\0%5D\0%5E\0%5F\0" "%60\0%61\0%62\0%63\0%64\0%65\0%66\0%67\0" "%68\0%69\0%6A\0%6B\0%6C\0%6D\0%6E\0%6F\0" "%70\0%71\0%72\0%73\0%74\0%75\0%76\0%77\0" "%78\0%79\0%7A\0%7B\0%7C\0%7D\0%7E\0%7F\0" "%80\0%81\0%82\0%83\0%84\0%85\0%86\0%87\0" "%88\0%89\0%8A\0%8B\0%8C\0%8D\0%8E\0%8F\0" "%90\0%91\0%92\0%93\0%94\0%95\0%96\0%97\0" "%98\0%99\0%9A\0%9B\0%9C\0%9D\0%9E\0%9F\0" "%A0\0%A1\0%A2\0%A3\0%A4\0%A5\0%A6\0%A7\0" "%A8\0%A9\0%AA\0%AB\0%AC\0%AD\0%AE\0%AF\0" "%B0\0%B1\0%B2\0%B3\0%B4\0%B5\0%B6\0%B7\0" "%B8\0%B9\0%BA\0%BB\0%BC\0%BD\0%BE\0%BF\0" "%C0\0%C1\0%C2\0%C3\0%C4\0%C5\0%C6\0%C7\0" "%C8\0%C9\0%CA\0%CB\0%CC\0%CD\0%CE\0%CF\0" "%D0\0%D1\0%D2\0%D3\0%D4\0%D5\0%D6\0%D7\0" "%D8\0%D9\0%DA\0%DB\0%DC\0%DD\0%DE\0%DF\0" "%E0\0%E1\0%E2\0%E3\0%E4\0%E5\0%E6\0%E7\0" "%E8\0%E9\0%EA\0%EB\0%EC\0%ED\0%EE\0%EF\0" "%F0\0%F1\0%F2\0%F3\0%F4\0%F5\0%F6\0%F7\0" "%F8\0%F9\0%FA\0%FB\0%FC\0%FD\0%FE\0%FF"; constexpr uint8_t C0_CONTROL_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 28 29 2A 2B 2C 2D 2E 2F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 40 41 42 43 44 45 46 47 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 60 61 62 63 64 65 66 67 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; constexpr uint8_t SPECIAL_QUERY_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x01 | 0x00 | 0x04 | 0x08 | 0x00 | 0x00 | 0x00 | 0x80, // 28 29 2A 2B 2C 2D 2E 2F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x00 | 0x00 | 0x10 | 0x00 | 0x40 | 0x00, // 40 41 42 43 44 45 46 47 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 60 61 62 63 64 65 66 67 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; constexpr uint8_t QUERY_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x01 | 0x00 | 0x04 | 0x08 | 0x00 | 0x00 | 0x00 | 0x00, // 28 29 2A 2B 2C 2D 2E 2F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x00 | 0x00 | 0x10 | 0x00 | 0x40 | 0x00, // 40 41 42 43 44 45 46 47 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 60 61 62 63 64 65 66 67 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; constexpr uint8_t FRAGMENT_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x01 | 0x00 | 0x04 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 28 29 2A 2B 2C 2D 2E 2F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x00 | 0x00 | 0x10 | 0x00 | 0x40 | 0x00, // 40 41 42 43 44 45 46 47 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 60 61 62 63 64 65 66 67 0x01 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; constexpr uint8_t USERINFO_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x01 | 0x00 | 0x04 | 0x08 | 0x00 | 0x00 | 0x00 | 0x00, // 28 29 2A 2B 2C 2D 2E 2F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x80, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 40 41 42 43 44 45 46 47 0x01 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x08 | 0x10 | 0x20 | 0x40 | 0x00, // 60 61 62 63 64 65 66 67 0x01 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x08 | 0x10 | 0x20 | 0x00 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; constexpr uint8_t PATH_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x01 | 0x00 | 0x04 | 0x08 | 0x00 | 0x00 | 0x00 | 0x00, // 28 29 2A 2B 2C 2D 2E 2F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x00 | 0x00 | 0x10 | 0x00 | 0x40 | 0x80, // 40 41 42 43 44 45 46 47 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 60 61 62 63 64 65 66 67 0x01 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x08 | 0x00 | 0x20 | 0x00 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; constexpr uint8_t WWW_FORM_URLENCODED_PERCENT_ENCODE[32] = { // 00 01 02 03 04 05 06 07 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 08 09 0A 0B 0C 0D 0E 0F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 10 11 12 13 14 15 16 17 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 18 19 1A 1B 1C 1D 1E 1F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 20 21 22 23 24 25 26 27 0x00 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 28 29 2A 2B 2C 2D 2E 2F 0x01 | 0x02 | 0x00 | 0x08 | 0x10 | 0x00 | 0x00 | 0x00, // 30 31 32 33 34 35 36 37 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 38 39 3A 3B 3C 3D 3E 3F 0x00 | 0x00 | 0x00 | 0x00 | 0x10 | 0x00 | 0x40 | 0x80, // 40 41 42 43 44 45 46 47 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 48 49 4A 4B 4C 4D 4E 4F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 50 51 52 53 54 55 56 57 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 58 59 5A 5B 5C 5D 5E 5F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 60 61 62 63 64 65 66 67 0x01 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 68 69 6A 6B 6C 6D 6E 6F 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 70 71 72 73 74 75 76 77 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00 | 0x00, // 78 79 7A 7B 7C 7D 7E 7F 0x00 | 0x00 | 0x00 | 0x08 | 0x00 | 0x20 | 0x40 | 0x80, // 80 81 82 83 84 85 86 87 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 88 89 8A 8B 8C 8D 8E 8F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 90 91 92 93 94 95 96 97 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // 98 99 9A 9B 9C 9D 9E 9F 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A0 A1 A2 A3 A4 A5 A6 A7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // A8 A9 AA AB AC AD AE AF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B0 B1 B2 B3 B4 B5 B6 B7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // B8 B9 BA BB BC BD BE BF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C0 C1 C2 C3 C4 C5 C6 C7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // C8 C9 CA CB CC CD CE CF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D0 D1 D2 D3 D4 D5 D6 D7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // D8 D9 DA DB DC DD DE DF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E0 E1 E2 E3 E4 E5 E6 E7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // E8 E9 EA EB EC ED EE EF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F0 F1 F2 F3 F4 F5 F6 F7 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80, // F8 F9 FA FB FC FD FE FF 0x01 | 0x02 | 0x04 | 0x08 | 0x10 | 0x20 | 0x40 | 0x80}; ada_really_inline bool bit_at(const uint8_t a[], const uint8_t i) { return !!(a[i >> 3] & (1 << (i & 7))); } } // namespace ada::character_sets #endif // ADA_CHARACTER_SETS_H /* end file include/ada/character_sets-inl.h */ /* begin file include/ada/checkers-inl.h */ /** * @file checkers-inl.h * @brief Definitions for URL specific checkers used within Ada. */ #ifndef ADA_CHECKERS_INL_H #define ADA_CHECKERS_INL_H #include #include namespace ada::checkers { inline bool has_hex_prefix_unsafe(std::string_view input) { // This is actually efficient code, see has_hex_prefix for the assembly. uint32_t value_one = 1; bool is_little_endian = (reinterpret_cast(&value_one)[0] == 1); uint16_t word0x{}; std::memcpy(&word0x, "0x", 2); // we would use bit_cast in C++20 and the // function could be constexpr. uint16_t two_first_bytes{}; std::memcpy(&two_first_bytes, input.data(), 2); if (is_little_endian) { two_first_bytes |= 0x2000; } else { two_first_bytes |= 0x020; } return two_first_bytes == word0x; } inline bool has_hex_prefix(std::string_view input) { return input.size() >= 2 && has_hex_prefix_unsafe(input); } constexpr bool is_digit(char x) noexcept { return (x >= '0') & (x <= '9'); } constexpr char to_lower(char x) noexcept { return (x | 0x20); } constexpr bool is_alpha(char x) noexcept { return (to_lower(x) >= 'a') && (to_lower(x) <= 'z'); } inline constexpr bool is_windows_drive_letter(std::string_view input) noexcept { return input.size() >= 2 && (is_alpha(input[0]) && ((input[1] == ':') || (input[1] == '|'))) && ((input.size() == 2) || (input[2] == '/' || input[2] == '\\' || input[2] == '?' || input[2] == '#')); } inline constexpr bool is_normalized_windows_drive_letter( std::string_view input) noexcept { return input.size() >= 2 && (is_alpha(input[0]) && (input[1] == ':')); } ada_really_inline constexpr bool begins_with(std::string_view view, std::string_view prefix) { // in C++20, you have view.begins_with(prefix) return view.size() >= prefix.size() && (view.substr(0, prefix.size()) == prefix); } } // namespace ada::checkers #endif // ADA_CHECKERS_H /* end file include/ada/checkers-inl.h */ /* begin file include/ada/log.h */ /** * @file log.h * @brief Includes the definitions for logging. * @private Excluded from docs through the doxygen file. */ #ifndef ADA_LOG_H #define ADA_LOG_H #include // To enable logging, set ADA_LOGGING to 1: #ifndef ADA_LOGGING #define ADA_LOGGING 0 #endif namespace ada { /** * Private function used for logging messages. * @private */ template ada_really_inline void inner_log([[maybe_unused]] T t) { #if ADA_LOGGING std::cout << t << std::endl; #endif } /** * Private function used for logging messages. * @private */ template ada_really_inline void inner_log([[maybe_unused]] T t, [[maybe_unused]] Args... args) { #if ADA_LOGGING std::cout << t; inner_log(args...); #endif } /** * Log a message. * @private */ template ada_really_inline void log([[maybe_unused]] T t, [[maybe_unused]] Args... args) { #if ADA_LOGGING std::cout << "ADA_LOG: " << t; inner_log(args...); #endif } /** * Log a message. * @private */ template ada_really_inline void log([[maybe_unused]] T t) { #if ADA_LOGGING std::cout << "ADA_LOG: " << t << std::endl; #endif } } // namespace ada #if ADA_LOGGING #ifndef ada_log #define ada_log(...) \ do { \ ada::log(__VA_ARGS__); \ } while (0) #endif // ada_log #else #define ada_log(...) #endif // ADA_LOGGING #endif // ADA_LOG_H /* end file include/ada/log.h */ /* begin file include/ada/encoding_type.h */ /** * @file encoding_type.h * @brief Definition for supported encoding types. */ #ifndef ADA_ENCODING_TYPE_H #define ADA_ENCODING_TYPE_H #include namespace ada { /** * This specification defines three encodings with the same names as encoding * schemes defined in the Unicode standard: UTF-8, UTF-16LE, and UTF-16BE. * * @see https://encoding.spec.whatwg.org/#encodings */ enum class encoding_type { UTF8, UTF_16LE, UTF_16BE, }; /** * Convert a encoding_type to string. */ ada_warn_unused std::string to_string(encoding_type type); } // namespace ada #endif // ADA_ENCODING_TYPE_H /* end file include/ada/encoding_type.h */ /* begin file include/ada/helpers.h */ /** * @file helpers.h * @brief Definitions for helper functions used within Ada. */ #ifndef ADA_HELPERS_H #define ADA_HELPERS_H /* begin file include/ada/state.h */ /** * @file state.h * @brief Definitions for the states of the URL state machine. */ #ifndef ADA_STATE_H #define ADA_STATE_H #include namespace ada { /** * @see https://url.spec.whatwg.org/#url-parsing */ enum class state { AUTHORITY, SCHEME_START, SCHEME, HOST, NO_SCHEME, FRAGMENT, RELATIVE_SCHEME, RELATIVE_SLASH, FILE, FILE_HOST, FILE_SLASH, PATH_OR_AUTHORITY, SPECIAL_AUTHORITY_IGNORE_SLASHES, SPECIAL_AUTHORITY_SLASHES, SPECIAL_RELATIVE_OR_AUTHORITY, QUERY, PATH, PATH_START, OPAQUE_PATH, PORT, }; /** * Stringify a URL state machine state. */ ada_warn_unused std::string to_string(ada::state s); } // namespace ada #endif // ADA_STATE_H /* end file include/ada/state.h */ /* begin file include/ada/url_base.h */ /** * @file url_base.h * @brief Declaration for the basic URL definitions */ #ifndef ADA_URL_BASE_H #define ADA_URL_BASE_H /* begin file include/ada/url_components.h */ /** * @file url_components.h * @brief Declaration for the URL Components */ #ifndef ADA_URL_COMPONENTS_H #define ADA_URL_COMPONENTS_H #include #include namespace ada { /** * @brief URL Component representations using offsets. * * @details We design the url_components struct so that it is as small * and simple as possible. This version uses 32 bytes. * * This struct is used to extract components from a single 'href'. */ struct url_components { constexpr static uint32_t omitted = uint32_t(-1); url_components() = default; url_components(const url_components &u) = default; url_components(url_components &&u) noexcept = default; url_components &operator=(url_components &&u) noexcept = default; url_components &operator=(const url_components &u) = default; ~url_components() = default; /* * By using 32-bit integers, we implicitly assume that the URL string * cannot exceed 4 GB. * * https://user:pass@example.com:1234/foo/bar?baz#quux * | | | | ^^^^| | | * | | | | | | | `----- hash_start * | | | | | | `--------- search_start * | | | | | `----------------- pathname_start * | | | | `--------------------- port * | | | `----------------------- host_end * | | `---------------------------------- host_start * | `--------------------------------------- username_end * `--------------------------------------------- protocol_end */ uint32_t protocol_end{0}; /** * Username end is not `omitted` by default to make username and password * getters less costly to implement. */ uint32_t username_end{0}; uint32_t host_start{0}; uint32_t host_end{0}; uint32_t port{omitted}; uint32_t pathname_start{0}; uint32_t search_start{omitted}; uint32_t hash_start{omitted}; /** * Check the following conditions: * protocol_end < username_end < ... < hash_start, * expect when a value is omitted. It also computes * a lower bound on the possible string length that may match these * offsets. * @return true if the offset values are * consistent with a possible URL string */ bool check_offset_consistency() const noexcept; /** * Converts a url_components to JSON stringified version. */ std::string to_string() const; }; // struct url_components } // namespace ada #endif /* end file include/ada/url_components.h */ /* begin file include/ada/scheme.h */ /** * @file scheme.h * @brief Declarations for the URL scheme. */ #ifndef ADA_SCHEME_H #define ADA_SCHEME_H #include #include #include /** * @namespace ada::scheme * @brief Includes the scheme declarations */ namespace ada::scheme { /** * Type of the scheme as an enum. * Using strings to represent a scheme type is not ideal because * checking for types involves string comparisons. It is faster to use * a simple integer. * In C++11, we are allowed to specify the underlying type of the enum. * We pick an 8-bit integer (which allows up to 256 types). Specifying the * type of the enum may help integration with other systems if the type * variable is exposed (since its value will not depend on the compiler). */ enum type : uint8_t { HTTP = 0, NOT_SPECIAL = 1, HTTPS = 2, WS = 3, FTP = 4, WSS = 5, FILE = 6 }; /** * A special scheme is an ASCII string that is listed in the first column of the * following table. The default port for a special scheme is listed in the * second column on the same row. The default port for any other ASCII string is * null. * * @see https://url.spec.whatwg.org/#url-miscellaneous * @param scheme * @return If scheme is a special scheme */ ada_really_inline constexpr bool is_special(std::string_view scheme); /** * A special scheme is an ASCII string that is listed in the first column of the * following table. The default port for a special scheme is listed in the * second column on the same row. The default port for any other ASCII string is * null. * * @see https://url.spec.whatwg.org/#url-miscellaneous * @param scheme * @return The special port */ constexpr uint16_t get_special_port(std::string_view scheme) noexcept; /** * Returns the port number of a special scheme. * @see https://url.spec.whatwg.org/#special-scheme */ constexpr uint16_t get_special_port(ada::scheme::type type) noexcept; /** * Returns the scheme of an input, or NOT_SPECIAL if it's not a special scheme * defined by the spec. */ constexpr ada::scheme::type get_scheme_type(std::string_view scheme) noexcept; } // namespace ada::scheme #endif // ADA_SCHEME_H /* end file include/ada/scheme.h */ #include namespace ada { /** * @brief Base class of URL implementations * * @details A url_base contains a few attributes: is_valid, has_opaque_path and * type. All non-trivial implementation details are in derived classes such as * ada::url and ada::url_aggregator. * * It is an abstract class that cannot be instantiated directly. */ struct url_base { virtual ~url_base() = default; /** * Used for returning the validity from the result of the URL parser. */ bool is_valid{true}; /** * A URL has an opaque path if its path is a string. */ bool has_opaque_path{false}; /** * @private */ ada::scheme::type type{ada::scheme::type::NOT_SPECIAL}; /** * A URL is special if its scheme is a special scheme. A URL is not special if * its scheme is not a special scheme. */ [[nodiscard]] ada_really_inline bool is_special() const noexcept; /** * The origin getter steps are to return the serialization of this's URL's * origin. [HTML] * @return a newly allocated string. * @see https://url.spec.whatwg.org/#concept-url-origin */ [[nodiscard]] virtual std::string get_origin() const noexcept = 0; /** * Returns true if this URL has a valid domain as per RFC 1034 and * corresponding specifications. Among other things, it requires * that the domain string has fewer than 255 octets. */ [[nodiscard]] virtual bool has_valid_domain() const noexcept = 0; /** * @private * * Return the 'special port' if the URL is special and not 'file'. * Returns 0 otherwise. */ [[nodiscard]] inline uint16_t get_special_port() const noexcept; /** * @private * * Get the default port if the url's scheme has one, returns 0 otherwise. */ [[nodiscard]] ada_really_inline uint16_t scheme_default_port() const noexcept; /** * @private * * Parse a port (16-bit decimal digit) from the provided input. * We assume that the input does not contain spaces or tabs * within the ASCII digits. * It returns how many bytes were consumed when a number is successfully * parsed. * @return On failure, it returns zero. * @see https://url.spec.whatwg.org/#host-parsing */ virtual ada_really_inline size_t parse_port( std::string_view view, bool check_trailing_content = false) noexcept = 0; /** * Returns a JSON string representation of this URL. */ virtual std::string to_string() const = 0; /** @private */ virtual inline void clear_pathname() = 0; /** @private */ virtual inline void clear_search() = 0; /** @private */ virtual inline bool has_hash() const noexcept = 0; /** @private */ virtual inline bool has_search() const noexcept = 0; }; // url_base } // namespace ada #endif /* end file include/ada/url_base.h */ #include #include /** * @private * @namespace ada::helpers * @brief Includes the definitions for helper functions */ namespace ada::helpers { /** * @private */ template void encode_json(std::string_view view, out_iter out); /** * @private * This function is used to prune a fragment from a url, and returning the * removed string if input has fragment. * * @details prune_hash seeks the first '#' and returns everything after it * as a string_view, and modifies (in place) the input so that it points at * everything before the '#'. If no '#' is found, the input is left unchanged * and std::nullopt is returned. * * @attention The function is non-allocating and it does not throw. * @returns Note that the returned string_view might be empty! */ ada_really_inline std::optional prune_hash( std::string_view& input) noexcept; /** * @private * Defined by the URL specification, shorten a URLs paths. * @see https://url.spec.whatwg.org/#shorten-a-urls-path * @returns Returns true if path is shortened. */ ada_really_inline bool shorten_path(std::string& path, ada::scheme::type type) noexcept; /** * @private * Defined by the URL specification, shorten a URLs paths. * @see https://url.spec.whatwg.org/#shorten-a-urls-path * @returns Returns true if path is shortened. */ ada_really_inline bool shorten_path(std::string_view& path, ada::scheme::type type) noexcept; /** * @private * * Parse the path from the provided input and append to the existing * (possibly empty) path. The input cannot contain tabs and spaces: it * is the user's responsibility to check. * * The input is expected to be UTF-8. * * @see https://url.spec.whatwg.org/ */ ada_really_inline void parse_prepared_path(const std::string_view input, ada::scheme::type type, std::string& path); /** * @private * Remove and mutate all ASCII tab or newline characters from an input. */ ada_really_inline void remove_ascii_tab_or_newline(std::string& input) noexcept; /** * @private * Return the substring from input going from index pos to the end. * This function cannot throw. */ ada_really_inline std::string_view substring(std::string_view input, size_t pos) noexcept; /** * @private * Returns true if the string_view points within the string. */ bool overlaps(std::string_view input1, const std::string& input2) noexcept; /** * @private * Return the substring from input going from index pos1 to the pos2 (non * included). The length of the substring is pos2 - pos1. */ ada_really_inline std::string_view substring(const std::string& input, size_t pos1, size_t pos2) noexcept { #if ADA_DEVELOPMENT_CHECKS if (pos2 < pos1) { std::cerr << "Negative-length substring: [" << pos1 << " to " << pos2 << ")" << std::endl; abort(); } #endif return std::string_view(input.data() + pos1, pos2 - pos1); } /** * @private * Modify the string_view so that it has the new size pos, assuming that pos <= * input.size(). This function cannot throw. */ ada_really_inline void resize(std::string_view& input, size_t pos) noexcept; /** * @private * Returns a host's delimiter location depending on the state of the instance, * and whether a colon was found outside brackets. Used by the host parser. */ ada_really_inline std::pair get_host_delimiter_location( const bool is_special, std::string_view& view) noexcept; /** * @private * Removes leading and trailing C0 control and whitespace characters from * string. */ ada_really_inline void trim_c0_whitespace(std::string_view& input) noexcept; /** * @private * @see * https://url.spec.whatwg.org/#potentially-strip-trailing-spaces-from-an-opaque-path */ template ada_really_inline void strip_trailing_spaces_from_opaque_path( url_type& url) noexcept; /** * @private * Reverse the order of the bytes. */ ada_really_inline uint64_t swap_bytes(uint64_t val) noexcept; /** * @private * Reverse the order of the bytes but only if the system is big endian */ ada_really_inline uint64_t swap_bytes_if_big_endian(uint64_t val) noexcept; /** * @private * Finds the delimiter of a view in authority state. */ ada_really_inline size_t find_authority_delimiter_special(std::string_view view) noexcept; /** * @private * Finds the delimiter of a view in authority state. */ ada_really_inline size_t find_authority_delimiter(std::string_view view) noexcept; /** * @private */ template inline void inner_concat(std::string& buffer, T t) { buffer.append(t); } /** * @private */ template inline void inner_concat(std::string& buffer, T t, Args... args) { buffer.append(t); return inner_concat(buffer, args...); } /** * Concatenate the arguments and return a string. * @returns a string */ template std::string concat(Args... args) { std::string answer; inner_concat(answer, args...); return answer; } /** * @return Number of leading zeroes. */ inline int leading_zeroes(uint32_t input_num) noexcept { #if ADA_REGULAR_VISUAL_STUDIO unsigned long leading_zero(0); unsigned long in(input_num); return _BitScanReverse(&leading_zero, in) ? int(31 - leading_zero) : 32; #else return __builtin_clz(input_num); #endif // ADA_REGULAR_VISUAL_STUDIO } /** * Counts the number of decimal digits necessary to represent x. * faster than std::to_string(x).size(). * @return digit count */ inline int fast_digit_count(uint32_t x) noexcept { auto int_log2 = [](uint32_t z) -> int { return 31 - ada::helpers::leading_zeroes(z | 1); }; // Compiles to very few instructions. Note that the // table is static and thus effectively a constant. // We leave it inside the function because it is meaningless // outside of it (this comes at no performance cost). const static uint64_t table[] = { 4294967296, 8589934582, 8589934582, 8589934582, 12884901788, 12884901788, 12884901788, 17179868184, 17179868184, 17179868184, 21474826480, 21474826480, 21474826480, 21474826480, 25769703776, 25769703776, 25769703776, 30063771072, 30063771072, 30063771072, 34349738368, 34349738368, 34349738368, 34349738368, 38554705664, 38554705664, 38554705664, 41949672960, 41949672960, 41949672960, 42949672960, 42949672960}; return int((x + table[int_log2(x)]) >> 32); } } // namespace ada::helpers #endif // ADA_HELPERS_H /* end file include/ada/helpers.h */ /* begin file include/ada/parser.h */ /** * @file parser.h * @brief Definitions for the parser. */ #ifndef ADA_PARSER_H #define ADA_PARSER_H /* begin file include/ada/expected.h */ /** * @file expected.h * @brief Definitions for std::expected * @private Excluded from docs through the doxygen file. */ /// // expected - An implementation of std::expected with extensions // Written in 2017 by Sy Brand (tartanllama@gmail.com, @TartanLlama) // // Documentation available at http://tl.tartanllama.xyz/ // // To the extent possible under law, the author(s) have dedicated all // copyright and related and neighboring rights to this software to the // public domain worldwide. This software is distributed without any warranty. // // You should have received a copy of the CC0 Public Domain Dedication // along with this software. If not, see // . /// #ifndef TL_EXPECTED_HPP #define TL_EXPECTED_HPP #define TL_EXPECTED_VERSION_MAJOR 1 #define TL_EXPECTED_VERSION_MINOR 0 #define TL_EXPECTED_VERSION_PATCH 1 #include #include #include #include #if defined(__EXCEPTIONS) || defined(_CPPUNWIND) #define TL_EXPECTED_EXCEPTIONS_ENABLED #endif #if (defined(_MSC_VER) && _MSC_VER == 1900) #define TL_EXPECTED_MSVC2015 #define TL_EXPECTED_MSVC2015_CONSTEXPR #else #define TL_EXPECTED_MSVC2015_CONSTEXPR constexpr #endif #if (defined(__GNUC__) && __GNUC__ == 4 && __GNUC_MINOR__ <= 9 && \ !defined(__clang__)) #define TL_EXPECTED_GCC49 #endif #if (defined(__GNUC__) && __GNUC__ == 5 && __GNUC_MINOR__ <= 4 && \ !defined(__clang__)) #define TL_EXPECTED_GCC54 #endif #if (defined(__GNUC__) && __GNUC__ == 5 && __GNUC_MINOR__ <= 5 && \ !defined(__clang__)) #define TL_EXPECTED_GCC55 #endif #if (defined(__GNUC__) && __GNUC__ == 4 && __GNUC_MINOR__ <= 9 && \ !defined(__clang__)) // GCC < 5 doesn't support overloading on const&& for member functions #define TL_EXPECTED_NO_CONSTRR // GCC < 5 doesn't support some standard C++11 type traits #define TL_EXPECTED_IS_TRIVIALLY_COPY_CONSTRUCTIBLE(T) \ std::has_trivial_copy_constructor #define TL_EXPECTED_IS_TRIVIALLY_COPY_ASSIGNABLE(T) \ std::has_trivial_copy_assign // This one will be different for GCC 5.7 if it's ever supported #define TL_EXPECTED_IS_TRIVIALLY_DESTRUCTIBLE(T) \ std::is_trivially_destructible // GCC 5 < v < 8 has a bug in is_trivially_copy_constructible which breaks // std::vector for non-copyable types #elif (defined(__GNUC__) && __GNUC__ < 8 && !defined(__clang__)) #ifndef TL_GCC_LESS_8_TRIVIALLY_COPY_CONSTRUCTIBLE_MUTEX #define TL_GCC_LESS_8_TRIVIALLY_COPY_CONSTRUCTIBLE_MUTEX namespace tl { namespace detail { template struct is_trivially_copy_constructible : std::is_trivially_copy_constructible {}; #ifdef _GLIBCXX_VECTOR template struct is_trivially_copy_constructible> : std::false_type {}; #endif } // namespace detail } // namespace tl #endif #define TL_EXPECTED_IS_TRIVIALLY_COPY_CONSTRUCTIBLE(T) \ tl::detail::is_trivially_copy_constructible #define TL_EXPECTED_IS_TRIVIALLY_COPY_ASSIGNABLE(T) \ std::is_trivially_copy_assignable #define TL_EXPECTED_IS_TRIVIALLY_DESTRUCTIBLE(T) \ std::is_trivially_destructible #else #define TL_EXPECTED_IS_TRIVIALLY_COPY_CONSTRUCTIBLE(T) \ std::is_trivially_copy_constructible #define TL_EXPECTED_IS_TRIVIALLY_COPY_ASSIGNABLE(T) \ std::is_trivially_copy_assignable #define TL_EXPECTED_IS_TRIVIALLY_DESTRUCTIBLE(T) \ std::is_trivially_destructible #endif #if __cplusplus > 201103L #define TL_EXPECTED_CXX14 #endif #ifdef TL_EXPECTED_GCC49 #define TL_EXPECTED_GCC49_CONSTEXPR #else #define TL_EXPECTED_GCC49_CONSTEXPR constexpr #endif #if (__cplusplus == 201103L || defined(TL_EXPECTED_MSVC2015) || \ defined(TL_EXPECTED_GCC49)) #define TL_EXPECTED_11_CONSTEXPR #else #define TL_EXPECTED_11_CONSTEXPR constexpr #endif namespace tl { template class expected; #ifndef TL_MONOSTATE_INPLACE_MUTEX #define TL_MONOSTATE_INPLACE_MUTEX class monostate {}; struct in_place_t { explicit in_place_t() = default; }; static constexpr in_place_t in_place{}; #endif template class unexpected { public: static_assert(!std::is_same::value, "E must not be void"); unexpected() = delete; constexpr explicit unexpected(const E &e) : m_val(e) {} constexpr explicit unexpected(E &&e) : m_val(std::move(e)) {} template ::value>::type * = nullptr> constexpr explicit unexpected(Args &&...args) : m_val(std::forward(args)...) {} template < class U, class... Args, typename std::enable_if &, Args &&...>::value>::type * = nullptr> constexpr explicit unexpected(std::initializer_list l, Args &&...args) : m_val(l, std::forward(args)...) {} constexpr const E &value() const & { return m_val; } TL_EXPECTED_11_CONSTEXPR E &value() & { return m_val; } TL_EXPECTED_11_CONSTEXPR E &&value() && { return std::move(m_val); } constexpr const E &&value() const && { return std::move(m_val); } private: E m_val; }; #ifdef __cpp_deduction_guides template unexpected(E) -> unexpected; #endif template constexpr bool operator==(const unexpected &lhs, const unexpected &rhs) { return lhs.value() == rhs.value(); } template constexpr bool operator!=(const unexpected &lhs, const unexpected &rhs) { return lhs.value() != rhs.value(); } template constexpr bool operator<(const unexpected &lhs, const unexpected &rhs) { return lhs.value() < rhs.value(); } template constexpr bool operator<=(const unexpected &lhs, const unexpected &rhs) { return lhs.value() <= rhs.value(); } template constexpr bool operator>(const unexpected &lhs, const unexpected &rhs) { return lhs.value() > rhs.value(); } template constexpr bool operator>=(const unexpected &lhs, const unexpected &rhs) { return lhs.value() >= rhs.value(); } template unexpected::type> make_unexpected(E &&e) { return unexpected::type>(std::forward(e)); } struct unexpect_t { unexpect_t() = default; }; static constexpr unexpect_t unexpect{}; namespace detail { template [[noreturn]] TL_EXPECTED_11_CONSTEXPR void throw_exception(E &&e) { #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED throw std::forward(e); #else #ifdef _MSC_VER __assume(0); #else __builtin_unreachable(); #endif #endif } #ifndef TL_TRAITS_MUTEX #define TL_TRAITS_MUTEX // C++14-style aliases for brevity template using remove_const_t = typename std::remove_const::type; template using remove_reference_t = typename std::remove_reference::type; template using decay_t = typename std::decay::type; template using enable_if_t = typename std::enable_if::type; template using conditional_t = typename std::conditional::type; // std::conjunction from C++17 template struct conjunction : std::true_type {}; template struct conjunction : B {}; template struct conjunction : std::conditional, B>::type {}; #if defined(_LIBCPP_VERSION) && __cplusplus == 201103L #define TL_TRAITS_LIBCXX_MEM_FN_WORKAROUND #endif // In C++11 mode, there's an issue in libc++'s std::mem_fn // which results in a hard-error when using it in a noexcept expression // in some cases. This is a check to workaround the common failing case. #ifdef TL_TRAITS_LIBCXX_MEM_FN_WORKAROUND template struct is_pointer_to_non_const_member_func : std::false_type {}; template struct is_pointer_to_non_const_member_func : std::true_type {}; template struct is_pointer_to_non_const_member_func : std::true_type {}; template struct is_pointer_to_non_const_member_func : std::true_type {}; template struct is_pointer_to_non_const_member_func : std::true_type {}; template struct is_pointer_to_non_const_member_func : std::true_type {}; template struct is_pointer_to_non_const_member_func : std::true_type {}; template struct is_const_or_const_ref : std::false_type {}; template struct is_const_or_const_ref : std::true_type {}; template struct is_const_or_const_ref : std::true_type {}; #endif // std::invoke from C++17 // https://stackoverflow.com/questions/38288042/c11-14-invoke-workaround template < typename Fn, typename... Args, #ifdef TL_TRAITS_LIBCXX_MEM_FN_WORKAROUND typename = enable_if_t::value && is_const_or_const_ref::value)>, #endif typename = enable_if_t>::value>, int = 0> constexpr auto invoke(Fn &&f, Args &&...args) noexcept( noexcept(std::mem_fn(f)(std::forward(args)...))) -> decltype(std::mem_fn(f)(std::forward(args)...)) { return std::mem_fn(f)(std::forward(args)...); } template >::value>> constexpr auto invoke(Fn &&f, Args &&...args) noexcept( noexcept(std::forward(f)(std::forward(args)...))) -> decltype(std::forward(f)(std::forward(args)...)) { return std::forward(f)(std::forward(args)...); } // std::invoke_result from C++17 template struct invoke_result_impl; template struct invoke_result_impl< F, decltype(detail::invoke(std::declval(), std::declval()...), void()), Us...> { using type = decltype(detail::invoke(std::declval(), std::declval()...)); }; template using invoke_result = invoke_result_impl; template using invoke_result_t = typename invoke_result::type; #if defined(_MSC_VER) && _MSC_VER <= 1900 // TODO make a version which works with MSVC 2015 template struct is_swappable : std::true_type {}; template struct is_nothrow_swappable : std::true_type {}; #else // https://stackoverflow.com/questions/26744589/what-is-a-proper-way-to-implement-is-swappable-to-test-for-the-swappable-concept namespace swap_adl_tests { // if swap ADL finds this then it would call std::swap otherwise (same // signature) struct tag {}; template tag swap(T &, T &); template tag swap(T (&a)[N], T (&b)[N]); // helper functions to test if an unqualified swap is possible, and if it // becomes std::swap template std::false_type can_swap(...) noexcept(false); template (), std::declval()))> std::true_type can_swap(int) noexcept(noexcept(swap(std::declval(), std::declval()))); template std::false_type uses_std(...); template std::is_same(), std::declval())), tag> uses_std(int); template struct is_std_swap_noexcept : std::integral_constant::value && std::is_nothrow_move_assignable::value> {}; template struct is_std_swap_noexcept : is_std_swap_noexcept {}; template struct is_adl_swap_noexcept : std::integral_constant(0))> {}; } // namespace swap_adl_tests template struct is_swappable : std::integral_constant< bool, decltype(detail::swap_adl_tests::can_swap(0))::value && (!decltype(detail::swap_adl_tests::uses_std(0))::value || (std::is_move_assignable::value && std::is_move_constructible::value))> {}; template struct is_swappable : std::integral_constant< bool, decltype(detail::swap_adl_tests::can_swap(0))::value && (!decltype(detail::swap_adl_tests::uses_std( 0))::value || is_swappable::value)> {}; template struct is_nothrow_swappable : std::integral_constant< bool, is_swappable::value && ((decltype(detail::swap_adl_tests::uses_std(0))::value && detail::swap_adl_tests::is_std_swap_noexcept::value) || (!decltype(detail::swap_adl_tests::uses_std(0))::value && detail::swap_adl_tests::is_adl_swap_noexcept::value))> {}; #endif #endif // Trait for checking if a type is a tl::expected template struct is_expected_impl : std::false_type {}; template struct is_expected_impl> : std::true_type {}; template using is_expected = is_expected_impl>; template using expected_enable_forward_value = detail::enable_if_t< std::is_constructible::value && !std::is_same, in_place_t>::value && !std::is_same, detail::decay_t>::value && !std::is_same, detail::decay_t>::value>; template using expected_enable_from_other = detail::enable_if_t< std::is_constructible::value && std::is_constructible::value && !std::is_constructible &>::value && !std::is_constructible &&>::value && !std::is_constructible &>::value && !std::is_constructible &&>::value && !std::is_convertible &, T>::value && !std::is_convertible &&, T>::value && !std::is_convertible &, T>::value && !std::is_convertible &&, T>::value>; template using is_void_or = conditional_t::value, std::true_type, U>; template using is_copy_constructible_or_void = is_void_or>; template using is_move_constructible_or_void = is_void_or>; template using is_copy_assignable_or_void = is_void_or>; template using is_move_assignable_or_void = is_void_or>; } // namespace detail namespace detail { struct no_init_t {}; static constexpr no_init_t no_init{}; // Implements the storage of the values, and ensures that the destructor is // trivial if it can be. // // This specialization is for where neither `T` or `E` is trivially // destructible, so the destructors must be called on destruction of the // `expected` template ::value, bool = std::is_trivially_destructible::value> struct expected_storage_base { constexpr expected_storage_base() : m_val(T{}), m_has_val(true) {} constexpr expected_storage_base(no_init_t) : m_no_init(), m_has_val(false) {} template ::value> * = nullptr> constexpr expected_storage_base(in_place_t, Args &&...args) : m_val(std::forward(args)...), m_has_val(true) {} template &, Args &&...>::value> * = nullptr> constexpr expected_storage_base(in_place_t, std::initializer_list il, Args &&...args) : m_val(il, std::forward(args)...), m_has_val(true) {} template ::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, Args &&...args) : m_unexpect(std::forward(args)...), m_has_val(false) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, std::initializer_list il, Args &&...args) : m_unexpect(il, std::forward(args)...), m_has_val(false) {} ~expected_storage_base() { if (m_has_val) { m_val.~T(); } else { m_unexpect.~unexpected(); } } union { T m_val; unexpected m_unexpect; char m_no_init; }; bool m_has_val; }; // This specialization is for when both `T` and `E` are trivially-destructible, // so the destructor of the `expected` can be trivial. template struct expected_storage_base { constexpr expected_storage_base() : m_val(T{}), m_has_val(true) {} constexpr expected_storage_base(no_init_t) : m_no_init(), m_has_val(false) {} template ::value> * = nullptr> constexpr expected_storage_base(in_place_t, Args &&...args) : m_val(std::forward(args)...), m_has_val(true) {} template &, Args &&...>::value> * = nullptr> constexpr expected_storage_base(in_place_t, std::initializer_list il, Args &&...args) : m_val(il, std::forward(args)...), m_has_val(true) {} template ::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, Args &&...args) : m_unexpect(std::forward(args)...), m_has_val(false) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, std::initializer_list il, Args &&...args) : m_unexpect(il, std::forward(args)...), m_has_val(false) {} ~expected_storage_base() = default; union { T m_val; unexpected m_unexpect; char m_no_init; }; bool m_has_val; }; // T is trivial, E is not. template struct expected_storage_base { constexpr expected_storage_base() : m_val(T{}), m_has_val(true) {} TL_EXPECTED_MSVC2015_CONSTEXPR expected_storage_base(no_init_t) : m_no_init(), m_has_val(false) {} template ::value> * = nullptr> constexpr expected_storage_base(in_place_t, Args &&...args) : m_val(std::forward(args)...), m_has_val(true) {} template &, Args &&...>::value> * = nullptr> constexpr expected_storage_base(in_place_t, std::initializer_list il, Args &&...args) : m_val(il, std::forward(args)...), m_has_val(true) {} template ::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, Args &&...args) : m_unexpect(std::forward(args)...), m_has_val(false) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, std::initializer_list il, Args &&...args) : m_unexpect(il, std::forward(args)...), m_has_val(false) {} ~expected_storage_base() { if (!m_has_val) { m_unexpect.~unexpected(); } } union { T m_val; unexpected m_unexpect; char m_no_init; }; bool m_has_val; }; // E is trivial, T is not. template struct expected_storage_base { constexpr expected_storage_base() : m_val(T{}), m_has_val(true) {} constexpr expected_storage_base(no_init_t) : m_no_init(), m_has_val(false) {} template ::value> * = nullptr> constexpr expected_storage_base(in_place_t, Args &&...args) : m_val(std::forward(args)...), m_has_val(true) {} template &, Args &&...>::value> * = nullptr> constexpr expected_storage_base(in_place_t, std::initializer_list il, Args &&...args) : m_val(il, std::forward(args)...), m_has_val(true) {} template ::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, Args &&...args) : m_unexpect(std::forward(args)...), m_has_val(false) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, std::initializer_list il, Args &&...args) : m_unexpect(il, std::forward(args)...), m_has_val(false) {} ~expected_storage_base() { if (m_has_val) { m_val.~T(); } } union { T m_val; unexpected m_unexpect; char m_no_init; }; bool m_has_val; }; // `T` is `void`, `E` is trivially-destructible template struct expected_storage_base { #if __GNUC__ <= 5 // no constexpr for GCC 4/5 bug #else TL_EXPECTED_MSVC2015_CONSTEXPR #endif expected_storage_base() : m_has_val(true) {} constexpr expected_storage_base(no_init_t) : m_val(), m_has_val(false) {} constexpr expected_storage_base(in_place_t) : m_has_val(true) {} template ::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, Args &&...args) : m_unexpect(std::forward(args)...), m_has_val(false) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, std::initializer_list il, Args &&...args) : m_unexpect(il, std::forward(args)...), m_has_val(false) {} ~expected_storage_base() = default; struct dummy {}; union { unexpected m_unexpect; dummy m_val; }; bool m_has_val; }; // `T` is `void`, `E` is not trivially-destructible template struct expected_storage_base { constexpr expected_storage_base() : m_dummy(), m_has_val(true) {} constexpr expected_storage_base(no_init_t) : m_dummy(), m_has_val(false) {} constexpr expected_storage_base(in_place_t) : m_dummy(), m_has_val(true) {} template ::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, Args &&...args) : m_unexpect(std::forward(args)...), m_has_val(false) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected_storage_base(unexpect_t, std::initializer_list il, Args &&...args) : m_unexpect(il, std::forward(args)...), m_has_val(false) {} ~expected_storage_base() { if (!m_has_val) { m_unexpect.~unexpected(); } } union { unexpected m_unexpect; char m_dummy; }; bool m_has_val; }; // This base class provides some handy member functions which can be used in // further derived classes template struct expected_operations_base : expected_storage_base { using expected_storage_base::expected_storage_base; template void construct(Args &&...args) noexcept { new (std::addressof(this->m_val)) T(std::forward(args)...); this->m_has_val = true; } template void construct_with(Rhs &&rhs) noexcept { new (std::addressof(this->m_val)) T(std::forward(rhs).get()); this->m_has_val = true; } template void construct_error(Args &&...args) noexcept { new (std::addressof(this->m_unexpect)) unexpected(std::forward(args)...); this->m_has_val = false; } #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED // These assign overloads ensure that the most efficient assignment // implementation is used while maintaining the strong exception guarantee. // The problematic case is where rhs has a value, but *this does not. // // This overload handles the case where we can just copy-construct `T` // directly into place without throwing. template ::value> * = nullptr> void assign(const expected_operations_base &rhs) noexcept { if (!this->m_has_val && rhs.m_has_val) { geterr().~unexpected(); construct(rhs.get()); } else { assign_common(rhs); } } // This overload handles the case where we can attempt to create a copy of // `T`, then no-throw move it into place if the copy was successful. template ::value && std::is_nothrow_move_constructible::value> * = nullptr> void assign(const expected_operations_base &rhs) noexcept { if (!this->m_has_val && rhs.m_has_val) { T tmp = rhs.get(); geterr().~unexpected(); construct(std::move(tmp)); } else { assign_common(rhs); } } // This overload is the worst-case, where we have to move-construct the // unexpected value into temporary storage, then try to copy the T into place. // If the construction succeeds, then everything is fine, but if it throws, // then we move the old unexpected value back into place before rethrowing the // exception. template ::value && !std::is_nothrow_move_constructible::value> * = nullptr> void assign(const expected_operations_base &rhs) { if (!this->m_has_val && rhs.m_has_val) { auto tmp = std::move(geterr()); geterr().~unexpected(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { construct(rhs.get()); } catch (...) { geterr() = std::move(tmp); throw; } #else construct(rhs.get()); #endif } else { assign_common(rhs); } } // These overloads do the same as above, but for rvalues template ::value> * = nullptr> void assign(expected_operations_base &&rhs) noexcept { if (!this->m_has_val && rhs.m_has_val) { geterr().~unexpected(); construct(std::move(rhs).get()); } else { assign_common(std::move(rhs)); } } template ::value> * = nullptr> void assign(expected_operations_base &&rhs) { if (!this->m_has_val && rhs.m_has_val) { auto tmp = std::move(geterr()); geterr().~unexpected(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { construct(std::move(rhs).get()); } catch (...) { geterr() = std::move(tmp); throw; } #else construct(std::move(rhs).get()); #endif } else { assign_common(std::move(rhs)); } } #else // If exceptions are disabled then we can just copy-construct void assign(const expected_operations_base &rhs) noexcept { if (!this->m_has_val && rhs.m_has_val) { geterr().~unexpected(); construct(rhs.get()); } else { assign_common(rhs); } } void assign(expected_operations_base &&rhs) noexcept { if (!this->m_has_val && rhs.m_has_val) { geterr().~unexpected(); construct(std::move(rhs).get()); } else { assign_common(rhs); } } #endif // The common part of move/copy assigning template void assign_common(Rhs &&rhs) { if (this->m_has_val) { if (rhs.m_has_val) { get() = std::forward(rhs).get(); } else { destroy_val(); construct_error(std::forward(rhs).geterr()); } } else { if (!rhs.m_has_val) { geterr() = std::forward(rhs).geterr(); } } } bool has_value() const { return this->m_has_val; } TL_EXPECTED_11_CONSTEXPR T &get() & { return this->m_val; } constexpr const T &get() const & { return this->m_val; } TL_EXPECTED_11_CONSTEXPR T &&get() && { return std::move(this->m_val); } #ifndef TL_EXPECTED_NO_CONSTRR constexpr const T &&get() const && { return std::move(this->m_val); } #endif TL_EXPECTED_11_CONSTEXPR unexpected &geterr() & { return this->m_unexpect; } constexpr const unexpected &geterr() const & { return this->m_unexpect; } TL_EXPECTED_11_CONSTEXPR unexpected &&geterr() && { return std::move(this->m_unexpect); } #ifndef TL_EXPECTED_NO_CONSTRR constexpr const unexpected &&geterr() const && { return std::move(this->m_unexpect); } #endif TL_EXPECTED_11_CONSTEXPR void destroy_val() { get().~T(); } }; // This base class provides some handy member functions which can be used in // further derived classes template struct expected_operations_base : expected_storage_base { using expected_storage_base::expected_storage_base; template void construct() noexcept { this->m_has_val = true; } // This function doesn't use its argument, but needs it so that code in // levels above this can work independently of whether T is void template void construct_with(Rhs &&) noexcept { this->m_has_val = true; } template void construct_error(Args &&...args) noexcept { new (std::addressof(this->m_unexpect)) unexpected(std::forward(args)...); this->m_has_val = false; } template void assign(Rhs &&rhs) noexcept { if (!this->m_has_val) { if (rhs.m_has_val) { geterr().~unexpected(); construct(); } else { geterr() = std::forward(rhs).geterr(); } } else { if (!rhs.m_has_val) { construct_error(std::forward(rhs).geterr()); } } } bool has_value() const { return this->m_has_val; } TL_EXPECTED_11_CONSTEXPR unexpected &geterr() & { return this->m_unexpect; } constexpr const unexpected &geterr() const & { return this->m_unexpect; } TL_EXPECTED_11_CONSTEXPR unexpected &&geterr() && { return std::move(this->m_unexpect); } #ifndef TL_EXPECTED_NO_CONSTRR constexpr const unexpected &&geterr() const && { return std::move(this->m_unexpect); } #endif TL_EXPECTED_11_CONSTEXPR void destroy_val() { // no-op } }; // This class manages conditionally having a trivial copy constructor // This specialization is for when T and E are trivially copy constructible template :: value &&TL_EXPECTED_IS_TRIVIALLY_COPY_CONSTRUCTIBLE(E)::value> struct expected_copy_base : expected_operations_base { using expected_operations_base::expected_operations_base; }; // This specialization is for when T or E are not trivially copy constructible template struct expected_copy_base : expected_operations_base { using expected_operations_base::expected_operations_base; expected_copy_base() = default; expected_copy_base(const expected_copy_base &rhs) : expected_operations_base(no_init) { if (rhs.has_value()) { this->construct_with(rhs); } else { this->construct_error(rhs.geterr()); } } expected_copy_base(expected_copy_base &&rhs) = default; expected_copy_base &operator=(const expected_copy_base &rhs) = default; expected_copy_base &operator=(expected_copy_base &&rhs) = default; }; // This class manages conditionally having a trivial move constructor // Unfortunately there's no way to achieve this in GCC < 5 AFAIK, since it // doesn't implement an analogue to std::is_trivially_move_constructible. We // have to make do with a non-trivial move constructor even if T is trivially // move constructible #ifndef TL_EXPECTED_GCC49 template >::value &&std::is_trivially_move_constructible::value> struct expected_move_base : expected_copy_base { using expected_copy_base::expected_copy_base; }; #else template struct expected_move_base; #endif template struct expected_move_base : expected_copy_base { using expected_copy_base::expected_copy_base; expected_move_base() = default; expected_move_base(const expected_move_base &rhs) = default; expected_move_base(expected_move_base &&rhs) noexcept( std::is_nothrow_move_constructible::value) : expected_copy_base(no_init) { if (rhs.has_value()) { this->construct_with(std::move(rhs)); } else { this->construct_error(std::move(rhs.geterr())); } } expected_move_base &operator=(const expected_move_base &rhs) = default; expected_move_base &operator=(expected_move_base &&rhs) = default; }; // This class manages conditionally having a trivial copy assignment operator template >::value &&TL_EXPECTED_IS_TRIVIALLY_COPY_ASSIGNABLE(E)::value &&TL_EXPECTED_IS_TRIVIALLY_COPY_CONSTRUCTIBLE(E)::value &&TL_EXPECTED_IS_TRIVIALLY_DESTRUCTIBLE(E)::value> struct expected_copy_assign_base : expected_move_base { using expected_move_base::expected_move_base; }; template struct expected_copy_assign_base : expected_move_base { using expected_move_base::expected_move_base; expected_copy_assign_base() = default; expected_copy_assign_base(const expected_copy_assign_base &rhs) = default; expected_copy_assign_base(expected_copy_assign_base &&rhs) = default; expected_copy_assign_base &operator=(const expected_copy_assign_base &rhs) { this->assign(rhs); return *this; } expected_copy_assign_base &operator=(expected_copy_assign_base &&rhs) = default; }; // This class manages conditionally having a trivial move assignment operator // Unfortunately there's no way to achieve this in GCC < 5 AFAIK, since it // doesn't implement an analogue to std::is_trivially_move_assignable. We have // to make do with a non-trivial move assignment operator even if T is trivially // move assignable #ifndef TL_EXPECTED_GCC49 template , std::is_trivially_move_constructible, std::is_trivially_move_assignable>>:: value &&std::is_trivially_destructible::value &&std::is_trivially_move_constructible::value &&std::is_trivially_move_assignable::value> struct expected_move_assign_base : expected_copy_assign_base { using expected_copy_assign_base::expected_copy_assign_base; }; #else template struct expected_move_assign_base; #endif template struct expected_move_assign_base : expected_copy_assign_base { using expected_copy_assign_base::expected_copy_assign_base; expected_move_assign_base() = default; expected_move_assign_base(const expected_move_assign_base &rhs) = default; expected_move_assign_base(expected_move_assign_base &&rhs) = default; expected_move_assign_base &operator=(const expected_move_assign_base &rhs) = default; expected_move_assign_base & operator=(expected_move_assign_base &&rhs) noexcept( std::is_nothrow_move_constructible::value &&std::is_nothrow_move_assignable::value) { this->assign(std::move(rhs)); return *this; } }; // expected_delete_ctor_base will conditionally delete copy and move // constructors depending on whether T is copy/move constructible template ::value && std::is_copy_constructible::value), bool EnableMove = (is_move_constructible_or_void::value && std::is_move_constructible::value)> struct expected_delete_ctor_base { expected_delete_ctor_base() = default; expected_delete_ctor_base(const expected_delete_ctor_base &) = default; expected_delete_ctor_base(expected_delete_ctor_base &&) noexcept = default; expected_delete_ctor_base &operator=(const expected_delete_ctor_base &) = default; expected_delete_ctor_base &operator=(expected_delete_ctor_base &&) noexcept = default; }; template struct expected_delete_ctor_base { expected_delete_ctor_base() = default; expected_delete_ctor_base(const expected_delete_ctor_base &) = default; expected_delete_ctor_base(expected_delete_ctor_base &&) noexcept = delete; expected_delete_ctor_base &operator=(const expected_delete_ctor_base &) = default; expected_delete_ctor_base &operator=(expected_delete_ctor_base &&) noexcept = default; }; template struct expected_delete_ctor_base { expected_delete_ctor_base() = default; expected_delete_ctor_base(const expected_delete_ctor_base &) = delete; expected_delete_ctor_base(expected_delete_ctor_base &&) noexcept = default; expected_delete_ctor_base &operator=(const expected_delete_ctor_base &) = default; expected_delete_ctor_base &operator=(expected_delete_ctor_base &&) noexcept = default; }; template struct expected_delete_ctor_base { expected_delete_ctor_base() = default; expected_delete_ctor_base(const expected_delete_ctor_base &) = delete; expected_delete_ctor_base(expected_delete_ctor_base &&) noexcept = delete; expected_delete_ctor_base &operator=(const expected_delete_ctor_base &) = default; expected_delete_ctor_base &operator=(expected_delete_ctor_base &&) noexcept = default; }; // expected_delete_assign_base will conditionally delete copy and move // constructors depending on whether T and E are copy/move constructible + // assignable template ::value && std::is_copy_constructible::value && is_copy_assignable_or_void::value && std::is_copy_assignable::value), bool EnableMove = (is_move_constructible_or_void::value && std::is_move_constructible::value && is_move_assignable_or_void::value && std::is_move_assignable::value)> struct expected_delete_assign_base { expected_delete_assign_base() = default; expected_delete_assign_base(const expected_delete_assign_base &) = default; expected_delete_assign_base(expected_delete_assign_base &&) noexcept = default; expected_delete_assign_base &operator=(const expected_delete_assign_base &) = default; expected_delete_assign_base &operator=( expected_delete_assign_base &&) noexcept = default; }; template struct expected_delete_assign_base { expected_delete_assign_base() = default; expected_delete_assign_base(const expected_delete_assign_base &) = default; expected_delete_assign_base(expected_delete_assign_base &&) noexcept = default; expected_delete_assign_base &operator=(const expected_delete_assign_base &) = default; expected_delete_assign_base &operator=( expected_delete_assign_base &&) noexcept = delete; }; template struct expected_delete_assign_base { expected_delete_assign_base() = default; expected_delete_assign_base(const expected_delete_assign_base &) = default; expected_delete_assign_base(expected_delete_assign_base &&) noexcept = default; expected_delete_assign_base &operator=(const expected_delete_assign_base &) = delete; expected_delete_assign_base &operator=( expected_delete_assign_base &&) noexcept = default; }; template struct expected_delete_assign_base { expected_delete_assign_base() = default; expected_delete_assign_base(const expected_delete_assign_base &) = default; expected_delete_assign_base(expected_delete_assign_base &&) noexcept = default; expected_delete_assign_base &operator=(const expected_delete_assign_base &) = delete; expected_delete_assign_base &operator=( expected_delete_assign_base &&) noexcept = delete; }; // This is needed to be able to construct the expected_default_ctor_base which // follows, while still conditionally deleting the default constructor. struct default_constructor_tag { explicit constexpr default_constructor_tag() = default; }; // expected_default_ctor_base will ensure that expected has a deleted default // constructor if T is not default constructible. // This specialization is for when T is default constructible template ::value || std::is_void::value> struct expected_default_ctor_base { constexpr expected_default_ctor_base() noexcept = default; constexpr expected_default_ctor_base( expected_default_ctor_base const &) noexcept = default; constexpr expected_default_ctor_base(expected_default_ctor_base &&) noexcept = default; expected_default_ctor_base &operator=( expected_default_ctor_base const &) noexcept = default; expected_default_ctor_base &operator=( expected_default_ctor_base &&) noexcept = default; constexpr explicit expected_default_ctor_base(default_constructor_tag) {} }; // This specialization is for when T is not default constructible template struct expected_default_ctor_base { constexpr expected_default_ctor_base() noexcept = delete; constexpr expected_default_ctor_base( expected_default_ctor_base const &) noexcept = default; constexpr expected_default_ctor_base(expected_default_ctor_base &&) noexcept = default; expected_default_ctor_base &operator=( expected_default_ctor_base const &) noexcept = default; expected_default_ctor_base &operator=( expected_default_ctor_base &&) noexcept = default; constexpr explicit expected_default_ctor_base(default_constructor_tag) {} }; } // namespace detail template class bad_expected_access : public std::exception { public: explicit bad_expected_access(E e) : m_val(std::move(e)) {} virtual const char *what() const noexcept override { return "Bad expected access"; } const E &error() const & { return m_val; } E &error() & { return m_val; } const E &&error() const && { return std::move(m_val); } E &&error() && { return std::move(m_val); } private: E m_val; }; /// An `expected` object is an object that contains the storage for /// another object and manages the lifetime of this contained object `T`. /// Alternatively it could contain the storage for another unexpected object /// `E`. The contained object may not be initialized after the expected object /// has been initialized, and may not be destroyed before the expected object /// has been destroyed. The initialization state of the contained object is /// tracked by the expected object. template class expected : private detail::expected_move_assign_base, private detail::expected_delete_ctor_base, private detail::expected_delete_assign_base, private detail::expected_default_ctor_base { static_assert(!std::is_reference::value, "T must not be a reference"); static_assert(!std::is_same::type>::value, "T must not be in_place_t"); static_assert(!std::is_same::type>::value, "T must not be unexpect_t"); static_assert( !std::is_same>::type>::value, "T must not be unexpected"); static_assert(!std::is_reference::value, "E must not be a reference"); T *valptr() { return std::addressof(this->m_val); } const T *valptr() const { return std::addressof(this->m_val); } unexpected *errptr() { return std::addressof(this->m_unexpect); } const unexpected *errptr() const { return std::addressof(this->m_unexpect); } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR U &val() { return this->m_val; } TL_EXPECTED_11_CONSTEXPR unexpected &err() { return this->m_unexpect; } template ::value> * = nullptr> constexpr const U &val() const { return this->m_val; } constexpr const unexpected &err() const { return this->m_unexpect; } using impl_base = detail::expected_move_assign_base; using ctor_base = detail::expected_default_ctor_base; public: typedef T value_type; typedef E error_type; typedef unexpected unexpected_type; #if defined(TL_EXPECTED_CXX14) && !defined(TL_EXPECTED_GCC49) && \ !defined(TL_EXPECTED_GCC54) && !defined(TL_EXPECTED_GCC55) template TL_EXPECTED_11_CONSTEXPR auto and_then(F &&f) & { return and_then_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR auto and_then(F &&f) && { return and_then_impl(std::move(*this), std::forward(f)); } template constexpr auto and_then(F &&f) const & { return and_then_impl(*this, std::forward(f)); } #ifndef TL_EXPECTED_NO_CONSTRR template constexpr auto and_then(F &&f) const && { return and_then_impl(std::move(*this), std::forward(f)); } #endif #else template TL_EXPECTED_11_CONSTEXPR auto and_then(F &&f) & -> decltype(and_then_impl( std::declval(), std::forward(f))) { return and_then_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR auto and_then(F &&f) && -> decltype(and_then_impl( std::declval(), std::forward(f))) { return and_then_impl(std::move(*this), std::forward(f)); } template constexpr auto and_then(F &&f) const & -> decltype(and_then_impl( std::declval(), std::forward(f))) { return and_then_impl(*this, std::forward(f)); } #ifndef TL_EXPECTED_NO_CONSTRR template constexpr auto and_then(F &&f) const && -> decltype(and_then_impl( std::declval(), std::forward(f))) { return and_then_impl(std::move(*this), std::forward(f)); } #endif #endif #if defined(TL_EXPECTED_CXX14) && !defined(TL_EXPECTED_GCC49) && \ !defined(TL_EXPECTED_GCC54) && !defined(TL_EXPECTED_GCC55) template TL_EXPECTED_11_CONSTEXPR auto map(F &&f) & { return expected_map_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR auto map(F &&f) && { return expected_map_impl(std::move(*this), std::forward(f)); } template constexpr auto map(F &&f) const & { return expected_map_impl(*this, std::forward(f)); } template constexpr auto map(F &&f) const && { return expected_map_impl(std::move(*this), std::forward(f)); } #else template TL_EXPECTED_11_CONSTEXPR decltype(expected_map_impl( std::declval(), std::declval())) map(F &&f) & { return expected_map_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR decltype(expected_map_impl(std::declval(), std::declval())) map(F &&f) && { return expected_map_impl(std::move(*this), std::forward(f)); } template constexpr decltype(expected_map_impl(std::declval(), std::declval())) map(F &&f) const & { return expected_map_impl(*this, std::forward(f)); } #ifndef TL_EXPECTED_NO_CONSTRR template constexpr decltype(expected_map_impl(std::declval(), std::declval())) map(F &&f) const && { return expected_map_impl(std::move(*this), std::forward(f)); } #endif #endif #if defined(TL_EXPECTED_CXX14) && !defined(TL_EXPECTED_GCC49) && \ !defined(TL_EXPECTED_GCC54) && !defined(TL_EXPECTED_GCC55) template TL_EXPECTED_11_CONSTEXPR auto transform(F &&f) & { return expected_map_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR auto transform(F &&f) && { return expected_map_impl(std::move(*this), std::forward(f)); } template constexpr auto transform(F &&f) const & { return expected_map_impl(*this, std::forward(f)); } template constexpr auto transform(F &&f) const && { return expected_map_impl(std::move(*this), std::forward(f)); } #else template TL_EXPECTED_11_CONSTEXPR decltype(expected_map_impl( std::declval(), std::declval())) transform(F &&f) & { return expected_map_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR decltype(expected_map_impl(std::declval(), std::declval())) transform(F &&f) && { return expected_map_impl(std::move(*this), std::forward(f)); } template constexpr decltype(expected_map_impl(std::declval(), std::declval())) transform(F &&f) const & { return expected_map_impl(*this, std::forward(f)); } #ifndef TL_EXPECTED_NO_CONSTRR template constexpr decltype(expected_map_impl(std::declval(), std::declval())) transform(F &&f) const && { return expected_map_impl(std::move(*this), std::forward(f)); } #endif #endif #if defined(TL_EXPECTED_CXX14) && !defined(TL_EXPECTED_GCC49) && \ !defined(TL_EXPECTED_GCC54) && !defined(TL_EXPECTED_GCC55) template TL_EXPECTED_11_CONSTEXPR auto map_error(F &&f) & { return map_error_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR auto map_error(F &&f) && { return map_error_impl(std::move(*this), std::forward(f)); } template constexpr auto map_error(F &&f) const & { return map_error_impl(*this, std::forward(f)); } template constexpr auto map_error(F &&f) const && { return map_error_impl(std::move(*this), std::forward(f)); } #else template TL_EXPECTED_11_CONSTEXPR decltype(map_error_impl(std::declval(), std::declval())) map_error(F &&f) & { return map_error_impl(*this, std::forward(f)); } template TL_EXPECTED_11_CONSTEXPR decltype(map_error_impl(std::declval(), std::declval())) map_error(F &&f) && { return map_error_impl(std::move(*this), std::forward(f)); } template constexpr decltype(map_error_impl(std::declval(), std::declval())) map_error(F &&f) const & { return map_error_impl(*this, std::forward(f)); } #ifndef TL_EXPECTED_NO_CONSTRR template constexpr decltype(map_error_impl(std::declval(), std::declval())) map_error(F &&f) const && { return map_error_impl(std::move(*this), std::forward(f)); } #endif #endif template expected TL_EXPECTED_11_CONSTEXPR or_else(F &&f) & { return or_else_impl(*this, std::forward(f)); } template expected TL_EXPECTED_11_CONSTEXPR or_else(F &&f) && { return or_else_impl(std::move(*this), std::forward(f)); } template expected constexpr or_else(F &&f) const & { return or_else_impl(*this, std::forward(f)); } #ifndef TL_EXPECTED_NO_CONSTRR template expected constexpr or_else(F &&f) const && { return or_else_impl(std::move(*this), std::forward(f)); } #endif constexpr expected() = default; constexpr expected(const expected &rhs) = default; constexpr expected(expected &&rhs) = default; expected &operator=(const expected &rhs) = default; expected &operator=(expected &&rhs) = default; template ::value> * = nullptr> constexpr expected(in_place_t, Args &&...args) : impl_base(in_place, std::forward(args)...), ctor_base(detail::default_constructor_tag{}) {} template &, Args &&...>::value> * = nullptr> constexpr expected(in_place_t, std::initializer_list il, Args &&...args) : impl_base(in_place, il, std::forward(args)...), ctor_base(detail::default_constructor_tag{}) {} template ::value> * = nullptr, detail::enable_if_t::value> * = nullptr> explicit constexpr expected(const unexpected &e) : impl_base(unexpect, e.value()), ctor_base(detail::default_constructor_tag{}) {} template < class G = E, detail::enable_if_t::value> * = nullptr, detail::enable_if_t::value> * = nullptr> constexpr expected(unexpected const &e) : impl_base(unexpect, e.value()), ctor_base(detail::default_constructor_tag{}) {} template < class G = E, detail::enable_if_t::value> * = nullptr, detail::enable_if_t::value> * = nullptr> explicit constexpr expected(unexpected &&e) noexcept( std::is_nothrow_constructible::value) : impl_base(unexpect, std::move(e.value())), ctor_base(detail::default_constructor_tag{}) {} template < class G = E, detail::enable_if_t::value> * = nullptr, detail::enable_if_t::value> * = nullptr> constexpr expected(unexpected &&e) noexcept( std::is_nothrow_constructible::value) : impl_base(unexpect, std::move(e.value())), ctor_base(detail::default_constructor_tag{}) {} template ::value> * = nullptr> constexpr explicit expected(unexpect_t, Args &&...args) : impl_base(unexpect, std::forward(args)...), ctor_base(detail::default_constructor_tag{}) {} template &, Args &&...>::value> * = nullptr> constexpr explicit expected(unexpect_t, std::initializer_list il, Args &&...args) : impl_base(unexpect, il, std::forward(args)...), ctor_base(detail::default_constructor_tag{}) {} template ::value && std::is_convertible::value)> * = nullptr, detail::expected_enable_from_other * = nullptr> explicit TL_EXPECTED_11_CONSTEXPR expected(const expected &rhs) : ctor_base(detail::default_constructor_tag{}) { if (rhs.has_value()) { this->construct(*rhs); } else { this->construct_error(rhs.error()); } } template ::value && std::is_convertible::value)> * = nullptr, detail::expected_enable_from_other * = nullptr> TL_EXPECTED_11_CONSTEXPR expected(const expected &rhs) : ctor_base(detail::default_constructor_tag{}) { if (rhs.has_value()) { this->construct(*rhs); } else { this->construct_error(rhs.error()); } } template < class U, class G, detail::enable_if_t::value && std::is_convertible::value)> * = nullptr, detail::expected_enable_from_other * = nullptr> explicit TL_EXPECTED_11_CONSTEXPR expected(expected &&rhs) : ctor_base(detail::default_constructor_tag{}) { if (rhs.has_value()) { this->construct(std::move(*rhs)); } else { this->construct_error(std::move(rhs.error())); } } template < class U, class G, detail::enable_if_t<(std::is_convertible::value && std::is_convertible::value)> * = nullptr, detail::expected_enable_from_other * = nullptr> TL_EXPECTED_11_CONSTEXPR expected(expected &&rhs) : ctor_base(detail::default_constructor_tag{}) { if (rhs.has_value()) { this->construct(std::move(*rhs)); } else { this->construct_error(std::move(rhs.error())); } } template < class U = T, detail::enable_if_t::value> * = nullptr, detail::expected_enable_forward_value * = nullptr> explicit TL_EXPECTED_MSVC2015_CONSTEXPR expected(U &&v) : expected(in_place, std::forward(v)) {} template < class U = T, detail::enable_if_t::value> * = nullptr, detail::expected_enable_forward_value * = nullptr> TL_EXPECTED_MSVC2015_CONSTEXPR expected(U &&v) : expected(in_place, std::forward(v)) {} template < class U = T, class G = T, detail::enable_if_t::value> * = nullptr, detail::enable_if_t::value> * = nullptr, detail::enable_if_t< (!std::is_same, detail::decay_t>::value && !detail::conjunction, std::is_same>>::value && std::is_constructible::value && std::is_assignable::value && std::is_nothrow_move_constructible::value)> * = nullptr> expected &operator=(U &&v) { if (has_value()) { val() = std::forward(v); } else { err().~unexpected(); ::new (valptr()) T(std::forward(v)); this->m_has_val = true; } return *this; } template < class U = T, class G = T, detail::enable_if_t::value> * = nullptr, detail::enable_if_t::value> * = nullptr, detail::enable_if_t< (!std::is_same, detail::decay_t>::value && !detail::conjunction, std::is_same>>::value && std::is_constructible::value && std::is_assignable::value && std::is_nothrow_move_constructible::value)> * = nullptr> expected &operator=(U &&v) { if (has_value()) { val() = std::forward(v); } else { auto tmp = std::move(err()); err().~unexpected(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { ::new (valptr()) T(std::forward(v)); this->m_has_val = true; } catch (...) { err() = std::move(tmp); throw; } #else ::new (valptr()) T(std::forward(v)); this->m_has_val = true; #endif } return *this; } template ::value && std::is_assignable::value> * = nullptr> expected &operator=(const unexpected &rhs) { if (!has_value()) { err() = rhs; } else { this->destroy_val(); ::new (errptr()) unexpected(rhs); this->m_has_val = false; } return *this; } template ::value && std::is_move_assignable::value> * = nullptr> expected &operator=(unexpected &&rhs) noexcept { if (!has_value()) { err() = std::move(rhs); } else { this->destroy_val(); ::new (errptr()) unexpected(std::move(rhs)); this->m_has_val = false; } return *this; } template ::value> * = nullptr> void emplace(Args &&...args) { if (has_value()) { val().~T(); } else { err().~unexpected(); this->m_has_val = true; } ::new (valptr()) T(std::forward(args)...); } template ::value> * = nullptr> void emplace(Args &&...args) { if (has_value()) { val().~T(); ::new (valptr()) T(std::forward(args)...); } else { auto tmp = std::move(err()); err().~unexpected(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { ::new (valptr()) T(std::forward(args)...); this->m_has_val = true; } catch (...) { err() = std::move(tmp); throw; } #else ::new (valptr()) T(std::forward(args)...); this->m_has_val = true; #endif } } template &, Args &&...>::value> * = nullptr> void emplace(std::initializer_list il, Args &&...args) { if (has_value()) { T t(il, std::forward(args)...); val() = std::move(t); } else { err().~unexpected(); ::new (valptr()) T(il, std::forward(args)...); this->m_has_val = true; } } template &, Args &&...>::value> * = nullptr> void emplace(std::initializer_list il, Args &&...args) { if (has_value()) { T t(il, std::forward(args)...); val() = std::move(t); } else { auto tmp = std::move(err()); err().~unexpected(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { ::new (valptr()) T(il, std::forward(args)...); this->m_has_val = true; } catch (...) { err() = std::move(tmp); throw; } #else ::new (valptr()) T(il, std::forward(args)...); this->m_has_val = true; #endif } } private: using t_is_void = std::true_type; using t_is_not_void = std::false_type; using t_is_nothrow_move_constructible = std::true_type; using move_constructing_t_can_throw = std::false_type; using e_is_nothrow_move_constructible = std::true_type; using move_constructing_e_can_throw = std::false_type; void swap_where_both_have_value(expected & /*rhs*/, t_is_void) noexcept { // swapping void is a no-op } void swap_where_both_have_value(expected &rhs, t_is_not_void) { using std::swap; swap(val(), rhs.val()); } void swap_where_only_one_has_value(expected &rhs, t_is_void) noexcept( std::is_nothrow_move_constructible::value) { ::new (errptr()) unexpected_type(std::move(rhs.err())); rhs.err().~unexpected_type(); std::swap(this->m_has_val, rhs.m_has_val); } void swap_where_only_one_has_value(expected &rhs, t_is_not_void) { swap_where_only_one_has_value_and_t_is_not_void( rhs, typename std::is_nothrow_move_constructible::type{}, typename std::is_nothrow_move_constructible::type{}); } void swap_where_only_one_has_value_and_t_is_not_void( expected &rhs, t_is_nothrow_move_constructible, e_is_nothrow_move_constructible) noexcept { auto temp = std::move(val()); val().~T(); ::new (errptr()) unexpected_type(std::move(rhs.err())); rhs.err().~unexpected_type(); ::new (rhs.valptr()) T(std::move(temp)); std::swap(this->m_has_val, rhs.m_has_val); } void swap_where_only_one_has_value_and_t_is_not_void( expected &rhs, t_is_nothrow_move_constructible, move_constructing_e_can_throw) { auto temp = std::move(val()); val().~T(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { ::new (errptr()) unexpected_type(std::move(rhs.err())); rhs.err().~unexpected_type(); ::new (rhs.valptr()) T(std::move(temp)); std::swap(this->m_has_val, rhs.m_has_val); } catch (...) { val() = std::move(temp); throw; } #else ::new (errptr()) unexpected_type(std::move(rhs.err())); rhs.err().~unexpected_type(); ::new (rhs.valptr()) T(std::move(temp)); std::swap(this->m_has_val, rhs.m_has_val); #endif } void swap_where_only_one_has_value_and_t_is_not_void( expected &rhs, move_constructing_t_can_throw, e_is_nothrow_move_constructible) { auto temp = std::move(rhs.err()); rhs.err().~unexpected_type(); #ifdef TL_EXPECTED_EXCEPTIONS_ENABLED try { ::new (rhs.valptr()) T(std::move(val())); val().~T(); ::new (errptr()) unexpected_type(std::move(temp)); std::swap(this->m_has_val, rhs.m_has_val); } catch (...) { rhs.err() = std::move(temp); throw; } #else ::new (rhs.valptr()) T(std::move(val())); val().~T(); ::new (errptr()) unexpected_type(std::move(temp)); std::swap(this->m_has_val, rhs.m_has_val); #endif } public: template detail::enable_if_t::value && detail::is_swappable::value && (std::is_nothrow_move_constructible::value || std::is_nothrow_move_constructible::value)> swap(expected &rhs) noexcept( std::is_nothrow_move_constructible::value &&detail::is_nothrow_swappable::value &&std::is_nothrow_move_constructible::value &&detail::is_nothrow_swappable::value) { if (has_value() && rhs.has_value()) { swap_where_both_have_value(rhs, typename std::is_void::type{}); } else if (!has_value() && rhs.has_value()) { rhs.swap(*this); } else if (has_value()) { swap_where_only_one_has_value(rhs, typename std::is_void::type{}); } else { using std::swap; swap(err(), rhs.err()); } } constexpr const T *operator->() const { return valptr(); } TL_EXPECTED_11_CONSTEXPR T *operator->() { return valptr(); } template ::value> * = nullptr> constexpr const U &operator*() const & { return val(); } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR U &operator*() & { return val(); } template ::value> * = nullptr> constexpr const U &&operator*() const && { return std::move(val()); } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR U &&operator*() && { return std::move(val()); } constexpr bool has_value() const noexcept { return this->m_has_val; } constexpr explicit operator bool() const noexcept { return this->m_has_val; } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR const U &value() const & { if (!has_value()) detail::throw_exception(bad_expected_access(err().value())); return val(); } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR U &value() & { if (!has_value()) detail::throw_exception(bad_expected_access(err().value())); return val(); } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR const U &&value() const && { if (!has_value()) detail::throw_exception(bad_expected_access(std::move(err()).value())); return std::move(val()); } template ::value> * = nullptr> TL_EXPECTED_11_CONSTEXPR U &&value() && { if (!has_value()) detail::throw_exception(bad_expected_access(std::move(err()).value())); return std::move(val()); } constexpr const E &error() const & { return err().value(); } TL_EXPECTED_11_CONSTEXPR E &error() & { return err().value(); } constexpr const E &&error() const && { return std::move(err().value()); } TL_EXPECTED_11_CONSTEXPR E &&error() && { return std::move(err().value()); } template constexpr T value_or(U &&v) const & { static_assert(std::is_copy_constructible::value && std::is_convertible::value, "T must be copy-constructible and convertible to from U&&"); return bool(*this) ? **this : static_cast(std::forward(v)); } template TL_EXPECTED_11_CONSTEXPR T value_or(U &&v) && { static_assert(std::is_move_constructible::value && std::is_convertible::value, "T must be move-constructible and convertible to from U&&"); return bool(*this) ? std::move(**this) : static_cast(std::forward(v)); } }; namespace detail { template using exp_t = typename detail::decay_t::value_type; template using err_t = typename detail::decay_t::error_type; template using ret_t = expected>; #ifdef TL_EXPECTED_CXX14 template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), *std::declval()))> constexpr auto and_then_impl(Exp &&exp, F &&f) { static_assert(detail::is_expected::value, "F must return an expected"); return exp.has_value() ? detail::invoke(std::forward(f), *std::forward(exp)) : Ret(unexpect, std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval()))> constexpr auto and_then_impl(Exp &&exp, F &&f) { static_assert(detail::is_expected::value, "F must return an expected"); return exp.has_value() ? detail::invoke(std::forward(f)) : Ret(unexpect, std::forward(exp).error()); } #else template struct TC; template (), *std::declval())), detail::enable_if_t>::value> * = nullptr> auto and_then_impl(Exp &&exp, F &&f) -> Ret { static_assert(detail::is_expected::value, "F must return an expected"); return exp.has_value() ? detail::invoke(std::forward(f), *std::forward(exp)) : Ret(unexpect, std::forward(exp).error()); } template ())), detail::enable_if_t>::value> * = nullptr> constexpr auto and_then_impl(Exp &&exp, F &&f) -> Ret { static_assert(detail::is_expected::value, "F must return an expected"); return exp.has_value() ? detail::invoke(std::forward(f)) : Ret(unexpect, std::forward(exp).error()); } #endif #ifdef TL_EXPECTED_CXX14 template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), *std::declval())), detail::enable_if_t::value> * = nullptr> constexpr auto expected_map_impl(Exp &&exp, F &&f) { using result = ret_t>; return exp.has_value() ? result(detail::invoke(std::forward(f), *std::forward(exp))) : result(unexpect, std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), *std::declval())), detail::enable_if_t::value> * = nullptr> auto expected_map_impl(Exp &&exp, F &&f) { using result = expected>; if (exp.has_value()) { detail::invoke(std::forward(f), *std::forward(exp)); return result(); } return result(unexpect, std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval())), detail::enable_if_t::value> * = nullptr> constexpr auto expected_map_impl(Exp &&exp, F &&f) { using result = ret_t>; return exp.has_value() ? result(detail::invoke(std::forward(f))) : result(unexpect, std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval())), detail::enable_if_t::value> * = nullptr> auto expected_map_impl(Exp &&exp, F &&f) { using result = expected>; if (exp.has_value()) { detail::invoke(std::forward(f)); return result(); } return result(unexpect, std::forward(exp).error()); } #else template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), *std::declval())), detail::enable_if_t::value> * = nullptr> constexpr auto expected_map_impl(Exp &&exp, F &&f) -> ret_t> { using result = ret_t>; return exp.has_value() ? result(detail::invoke(std::forward(f), *std::forward(exp))) : result(unexpect, std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), *std::declval())), detail::enable_if_t::value> * = nullptr> auto expected_map_impl(Exp &&exp, F &&f) -> expected> { if (exp.has_value()) { detail::invoke(std::forward(f), *std::forward(exp)); return {}; } return unexpected>(std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval())), detail::enable_if_t::value> * = nullptr> constexpr auto expected_map_impl(Exp &&exp, F &&f) -> ret_t> { using result = ret_t>; return exp.has_value() ? result(detail::invoke(std::forward(f))) : result(unexpect, std::forward(exp).error()); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval())), detail::enable_if_t::value> * = nullptr> auto expected_map_impl(Exp &&exp, F &&f) -> expected> { if (exp.has_value()) { detail::invoke(std::forward(f)); return {}; } return unexpected>(std::forward(exp).error()); } #endif #if defined(TL_EXPECTED_CXX14) && !defined(TL_EXPECTED_GCC49) && \ !defined(TL_EXPECTED_GCC54) && !defined(TL_EXPECTED_GCC55) template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> constexpr auto map_error_impl(Exp &&exp, F &&f) { using result = expected, detail::decay_t>; return exp.has_value() ? result(*std::forward(exp)) : result(unexpect, detail::invoke(std::forward(f), std::forward(exp).error())); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> auto map_error_impl(Exp &&exp, F &&f) { using result = expected, monostate>; if (exp.has_value()) { return result(*std::forward(exp)); } detail::invoke(std::forward(f), std::forward(exp).error()); return result(unexpect, monostate{}); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> constexpr auto map_error_impl(Exp &&exp, F &&f) { using result = expected, detail::decay_t>; return exp.has_value() ? result() : result(unexpect, detail::invoke(std::forward(f), std::forward(exp).error())); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> auto map_error_impl(Exp &&exp, F &&f) { using result = expected, monostate>; if (exp.has_value()) { return result(); } detail::invoke(std::forward(f), std::forward(exp).error()); return result(unexpect, monostate{}); } #else template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> constexpr auto map_error_impl(Exp &&exp, F &&f) -> expected, detail::decay_t> { using result = expected, detail::decay_t>; return exp.has_value() ? result(*std::forward(exp)) : result(unexpect, detail::invoke(std::forward(f), std::forward(exp).error())); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> auto map_error_impl(Exp &&exp, F &&f) -> expected, monostate> { using result = expected, monostate>; if (exp.has_value()) { return result(*std::forward(exp)); } detail::invoke(std::forward(f), std::forward(exp).error()); return result(unexpect, monostate{}); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> constexpr auto map_error_impl(Exp &&exp, F &&f) -> expected, detail::decay_t> { using result = expected, detail::decay_t>; return exp.has_value() ? result() : result(unexpect, detail::invoke(std::forward(f), std::forward(exp).error())); } template >::value> * = nullptr, class Ret = decltype(detail::invoke(std::declval(), std::declval().error())), detail::enable_if_t::value> * = nullptr> auto map_error_impl(Exp &&exp, F &&f) -> expected, monostate> { using result = expected, monostate>; if (exp.has_value()) { return result(); } detail::invoke(std::forward(f), std::forward(exp).error()); return result(unexpect, monostate{}); } #endif #ifdef TL_EXPECTED_CXX14 template (), std::declval().error())), detail::enable_if_t::value> * = nullptr> constexpr auto or_else_impl(Exp &&exp, F &&f) { static_assert(detail::is_expected::value, "F must return an expected"); return exp.has_value() ? std::forward(exp) : detail::invoke(std::forward(f), std::forward(exp).error()); } template (), std::declval().error())), detail::enable_if_t::value> * = nullptr> detail::decay_t or_else_impl(Exp &&exp, F &&f) { return exp.has_value() ? std::forward(exp) : (detail::invoke(std::forward(f), std::forward(exp).error()), std::forward(exp)); } #else template (), std::declval().error())), detail::enable_if_t::value> * = nullptr> auto or_else_impl(Exp &&exp, F &&f) -> Ret { static_assert(detail::is_expected::value, "F must return an expected"); return exp.has_value() ? std::forward(exp) : detail::invoke(std::forward(f), std::forward(exp).error()); } template (), std::declval().error())), detail::enable_if_t::value> * = nullptr> detail::decay_t or_else_impl(Exp &&exp, F &&f) { return exp.has_value() ? std::forward(exp) : (detail::invoke(std::forward(f), std::forward(exp).error()), std::forward(exp)); } #endif } // namespace detail template constexpr bool operator==(const expected &lhs, const expected &rhs) { return (lhs.has_value() != rhs.has_value()) ? false : (!lhs.has_value() ? lhs.error() == rhs.error() : *lhs == *rhs); } template constexpr bool operator!=(const expected &lhs, const expected &rhs) { return (lhs.has_value() != rhs.has_value()) ? true : (!lhs.has_value() ? lhs.error() != rhs.error() : *lhs != *rhs); } template constexpr bool operator==(const expected &lhs, const expected &rhs) { return (lhs.has_value() != rhs.has_value()) ? false : (!lhs.has_value() ? lhs.error() == rhs.error() : true); } template constexpr bool operator!=(const expected &lhs, const expected &rhs) { return (lhs.has_value() != rhs.has_value()) ? true : (!lhs.has_value() ? lhs.error() == rhs.error() : false); } template constexpr bool operator==(const expected &x, const U &v) { return x.has_value() ? *x == v : false; } template constexpr bool operator==(const U &v, const expected &x) { return x.has_value() ? *x == v : false; } template constexpr bool operator!=(const expected &x, const U &v) { return x.has_value() ? *x != v : true; } template constexpr bool operator!=(const U &v, const expected &x) { return x.has_value() ? *x != v : true; } template constexpr bool operator==(const expected &x, const unexpected &e) { return x.has_value() ? false : x.error() == e.value(); } template constexpr bool operator==(const unexpected &e, const expected &x) { return x.has_value() ? false : x.error() == e.value(); } template constexpr bool operator!=(const expected &x, const unexpected &e) { return x.has_value() ? true : x.error() != e.value(); } template constexpr bool operator!=(const unexpected &e, const expected &x) { return x.has_value() ? true : x.error() != e.value(); } template ::value || std::is_move_constructible::value) && detail::is_swappable::value && std::is_move_constructible::value && detail::is_swappable::value> * = nullptr> void swap(expected &lhs, expected &rhs) noexcept(noexcept(lhs.swap(rhs))) { lhs.swap(rhs); } } // namespace tl #endif /* end file include/ada/expected.h */ #include #include /** * @private */ namespace ada { struct url_aggregator; struct url; } // namespace ada /** * @namespace ada::parser * @brief Includes the definitions for supported parsers */ namespace ada::parser { /** * Parses a url. */ template result_type parse_url(std::string_view user_input, const result_type* base_url = nullptr); extern template url_aggregator parse_url( std::string_view user_input, const url_aggregator* base_url); extern template url parse_url(std::string_view user_input, const url* base_url); } // namespace ada::parser #endif // ADA_PARSER_H /* end file include/ada/parser.h */ /* begin file include/ada/scheme-inl.h */ /** * @file scheme-inl.h * @brief Definitions for the URL scheme. */ #ifndef ADA_SCHEME_INL_H #define ADA_SCHEME_INL_H namespace ada::scheme { /** * @namespace ada::scheme::details * @brief Includes the definitions for scheme specific entities */ namespace details { // for use with is_special and get_special_port // Spaces, if present, are removed from URL. constexpr std::string_view is_special_list[] = {"http", " ", "https", "ws", "ftp", "wss", "file", " "}; // for use with get_special_port constexpr uint16_t special_ports[] = {80, 0, 443, 80, 21, 443, 0, 0}; } // namespace details ada_really_inline constexpr bool is_special(std::string_view scheme) { if (scheme.empty()) { return false; } int hash_value = (2 * scheme.size() + (unsigned)(scheme[0])) & 7; const std::string_view target = details::is_special_list[hash_value]; return (target[0] == scheme[0]) && (target.substr(1) == scheme.substr(1)); } constexpr uint16_t get_special_port(std::string_view scheme) noexcept { if (scheme.empty()) { return 0; } int hash_value = (2 * scheme.size() + (unsigned)(scheme[0])) & 7; const std::string_view target = details::is_special_list[hash_value]; if ((target[0] == scheme[0]) && (target.substr(1) == scheme.substr(1))) { return details::special_ports[hash_value]; } else { return 0; } } constexpr uint16_t get_special_port(ada::scheme::type type) noexcept { return details::special_ports[int(type)]; } constexpr ada::scheme::type get_scheme_type(std::string_view scheme) noexcept { if (scheme.empty()) { return ada::scheme::NOT_SPECIAL; } int hash_value = (2 * scheme.size() + (unsigned)(scheme[0])) & 7; const std::string_view target = details::is_special_list[hash_value]; if ((target[0] == scheme[0]) && (target.substr(1) == scheme.substr(1))) { return ada::scheme::type(hash_value); } else { return ada::scheme::NOT_SPECIAL; } } } // namespace ada::scheme #endif // ADA_SCHEME_H /* end file include/ada/scheme-inl.h */ /* begin file include/ada/serializers.h */ /** * @file serializers.h * @brief Definitions for the URL serializers. */ #ifndef ADA_SERIALIZERS_H #define ADA_SERIALIZERS_H #include #include #include /** * @namespace ada::serializers * @brief Includes the definitions for URL serializers */ namespace ada::serializers { /** * Finds and returns the longest sequence of 0 values in a ipv6 input. */ void find_longest_sequence_of_ipv6_pieces( const std::array& address, size_t& compress, size_t& compress_length) noexcept; /** * Serializes an ipv6 address. * @details An IPv6 address is a 128-bit unsigned integer that identifies a * network address. * @see https://url.spec.whatwg.org/#concept-ipv6-serializer */ std::string ipv6(const std::array& address) noexcept; /** * Serializes an ipv4 address. * @details An IPv4 address is a 32-bit unsigned integer that identifies a * network address. * @see https://url.spec.whatwg.org/#concept-ipv4-serializer */ std::string ipv4(const uint64_t address) noexcept; } // namespace ada::serializers #endif // ADA_SERIALIZERS_H /* end file include/ada/serializers.h */ /* begin file include/ada/unicode.h */ /** * @file unicode.h * @brief Definitions for all unicode specific functions. */ #ifndef ADA_UNICODE_H #define ADA_UNICODE_H #include #include /** * @namespace ada::unicode * @brief Includes the definitions for unicode operations */ namespace ada::unicode { /** * We receive a UTF-8 string representing a domain name. * If the string is percent encoded, we apply percent decoding. * * Given a domain, we need to identify its labels. * They are separated by label-separators: * * U+002E (.) FULL STOP * U+FF0E FULLWIDTH FULL STOP * U+3002 IDEOGRAPHIC FULL STOP * U+FF61 HALFWIDTH IDEOGRAPHIC FULL STOP * * They are all mapped to U+002E. * * We process each label into a string that should not exceed 63 octets. * If the string is already punycode (starts with "xn--"), then we must * scan it to look for unallowed code points. * Otherwise, if the string is not pure ASCII, we need to transcode it * to punycode by following RFC 3454 which requires us to * - Map characters (see section 3), * - Normalize (see section 4), * - Reject forbidden characters, * - Check for right-to-left characters and if so, check all requirements (see * section 6), * - Optionally reject based on unassigned code points (section 7). * * The Unicode standard provides a table of code points with a mapping, a list * of forbidden code points and so forth. This table is subject to change and * will vary based on the implementation. For Unicode 15, the table is at * https://www.unicode.org/Public/idna/15.0.0/IdnaMappingTable.txt * If you use ICU, they parse this table and map it to code using a Python * script. * * The resulting strings should not exceed 255 octets according to RFC 1035 * section 2.3.4. ICU checks for label size and domain size, but these errors * are ignored. * * @see https://url.spec.whatwg.org/#concept-domain-to-ascii * */ bool to_ascii(std::optional& out, std::string_view plain, size_t first_percent); /** * @see https://www.unicode.org/reports/tr46/#ToUnicode */ std::string to_unicode(std::string_view input); /** * Checks if the input has tab or newline characters. * * @attention The has_tabs_or_newline function is a bottleneck and it is simple * enough that compilers like GCC can 'autovectorize it'. */ ada_really_inline bool has_tabs_or_newline( std::string_view user_input) noexcept; /** * Checks if the input is a forbidden host code point. * @see https://url.spec.whatwg.org/#forbidden-host-code-point */ ada_really_inline constexpr bool is_forbidden_host_code_point( const char c) noexcept; /** * Checks if the input contains a forbidden domain code point. * @see https://url.spec.whatwg.org/#forbidden-domain-code-point */ ada_really_inline constexpr bool contains_forbidden_domain_code_point( const char* input, size_t length) noexcept; /** * Checks if the input contains a forbidden domain code point in which case * the first bit is set to 1. If the input contains an upper case ASCII letter, * then the second bit is set to 1. * @see https://url.spec.whatwg.org/#forbidden-domain-code-point */ ada_really_inline constexpr uint8_t contains_forbidden_domain_code_point_or_upper(const char* input, size_t length) noexcept; /** * Checks if the input is a forbidden domain code point. * @see https://url.spec.whatwg.org/#forbidden-domain-code-point */ ada_really_inline constexpr bool is_forbidden_domain_code_point( const char c) noexcept; /** * Checks if the input is alphanumeric, '+', '-' or '.' */ ada_really_inline constexpr bool is_alnum_plus(const char c) noexcept; /** * @details An ASCII hex digit is an ASCII upper hex digit or ASCII lower hex * digit. An ASCII upper hex digit is an ASCII digit or a code point in the * range U+0041 (A) to U+0046 (F), inclusive. An ASCII lower hex digit is an * ASCII digit or a code point in the range U+0061 (a) to U+0066 (f), inclusive. */ ada_really_inline constexpr bool is_ascii_hex_digit(const char c) noexcept; /** * Checks if the input is a C0 control or space character. * * @details A C0 control or space is a C0 control or U+0020 SPACE. * A C0 control is a code point in the range U+0000 NULL to U+001F INFORMATION * SEPARATOR ONE, inclusive. */ ada_really_inline constexpr bool is_c0_control_or_space(const char c) noexcept; /** * Checks if the input is a ASCII tab or newline character. * * @details An ASCII tab or newline is U+0009 TAB, U+000A LF, or U+000D CR. */ ada_really_inline constexpr bool is_ascii_tab_or_newline(const char c) noexcept; /** * @details A double-dot path segment must be ".." or an ASCII case-insensitive * match for ".%2e", "%2e.", or "%2e%2e". */ ada_really_inline ada_constexpr bool is_double_dot_path_segment( const std::string_view input) noexcept; /** * @details A single-dot path segment must be "." or an ASCII case-insensitive * match for "%2e". */ ada_really_inline constexpr bool is_single_dot_path_segment( const std::string_view input) noexcept; /** * @details ipv4 character might contain 0-9 or a-f character ranges. */ ada_really_inline constexpr bool is_lowercase_hex(const char c) noexcept; /** * @details Convert hex to binary. */ unsigned constexpr convert_hex_to_binary(char c) noexcept; /** * first_percent should be = input.find('%') * * @todo It would be faster as noexcept maybe, but it could be unsafe since. * @author Node.js * @see https://github.com/nodejs/node/blob/main/src/node_url.cc#L245 * @see https://encoding.spec.whatwg.org/#utf-8-decode-without-bom */ std::string percent_decode(const std::string_view input, size_t first_percent); /** * Returns a percent-encoding string whether percent encoding was needed or not. * @see https://github.com/nodejs/node/blob/main/src/node_url.cc#L226 */ std::string percent_encode(const std::string_view input, const uint8_t character_set[]); /** * Returns a percent-encoded string version of input, while starting the percent * encoding at the provided index. * @see https://github.com/nodejs/node/blob/main/src/node_url.cc#L226 */ std::string percent_encode(const std::string_view input, const uint8_t character_set[], size_t index); /** * Returns true if percent encoding was needed, in which case, we store * the percent-encoded content in 'out'. If the boolean 'append' is set to * true, the content is appended to 'out'. * If percent encoding is not needed, out is left unchanged. * @see https://github.com/nodejs/node/blob/main/src/node_url.cc#L226 */ template bool percent_encode(const std::string_view input, const uint8_t character_set[], std::string& out); /** * Returns the index at which percent encoding should start, or (equivalently), * the length of the prefix that does not require percent encoding. */ ada_really_inline size_t percent_encode_index(const std::string_view input, const uint8_t character_set[]); /** * Lowers the string in-place, assuming that the content is ASCII. * Return true if the content was ASCII. */ constexpr bool to_lower_ascii(char* input, size_t length) noexcept; } // namespace ada::unicode #endif // ADA_UNICODE_H /* end file include/ada/unicode.h */ /* begin file include/ada/url_base-inl.h */ /** * @file url_base-inl.h * @brief Inline functions for url base */ #ifndef ADA_URL_BASE_INL_H #define ADA_URL_BASE_INL_H /* begin file include/ada/url_aggregator.h */ /** * @file url_aggregator.h * @brief Declaration for the basic URL definitions */ #ifndef ADA_URL_AGGREGATOR_H #define ADA_URL_AGGREGATOR_H #include #include namespace ada { /** * @brief Lightweight URL struct. * * @details The url_aggregator class aims to minimize temporary memory * allocation while representing a parsed URL. Internally, it contains a single * normalized URL (the href), and it makes available the components, mostly * using std::string_view. */ struct url_aggregator : url_base { url_aggregator() = default; url_aggregator(const url_aggregator &u) = default; url_aggregator(url_aggregator &&u) noexcept = default; url_aggregator &operator=(url_aggregator &&u) noexcept = default; url_aggregator &operator=(const url_aggregator &u) = default; ~url_aggregator() = default; bool set_href(const std::string_view input); bool set_host(const std::string_view input); bool set_hostname(const std::string_view input); bool set_protocol(const std::string_view input); bool set_username(const std::string_view input); bool set_password(const std::string_view input); bool set_port(const std::string_view input); bool set_pathname(const std::string_view input); void set_search(const std::string_view input); void set_hash(const std::string_view input); [[nodiscard]] bool has_valid_domain() const noexcept override; /** * The origin getter steps are to return the serialization of this's URL's * origin. [HTML] * @return a newly allocated string. * @see https://url.spec.whatwg.org/#concept-url-origin */ [[nodiscard]] std::string get_origin() const noexcept override; /** * Return the normalized string. * This function does not allocate memory. * It is highly efficient. * @return a constant reference to the underlying normalized URL. * @see https://url.spec.whatwg.org/#dom-url-href * @see https://url.spec.whatwg.org/#concept-url-serializer */ inline std::string_view get_href() const noexcept; /** * The username getter steps are to return this's URL's username. * This function does not allocate memory. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-username */ [[nodiscard]] std::string_view get_username() const noexcept; /** * The password getter steps are to return this's URL's password. * This function does not allocate memory. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-password */ [[nodiscard]] std::string_view get_password() const noexcept; /** * Return this's URL's port, serialized. * This function does not allocate memory. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-port */ [[nodiscard]] std::string_view get_port() const noexcept; /** * Return U+0023 (#), followed by this's URL's fragment. * This function does not allocate memory. * @return a lightweight std::string_view.. * @see https://url.spec.whatwg.org/#dom-url-hash */ [[nodiscard]] std::string_view get_hash() const noexcept; /** * Return url's host, serialized, followed by U+003A (:) and url's port, * serialized. * This function does not allocate memory. * When there is no host, this function returns the empty view. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-host */ [[nodiscard]] std::string_view get_host() const noexcept; /** * Return this's URL's host, serialized. * This function does not allocate memory. * When there is no host, this function returns the empty view. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-hostname */ [[nodiscard]] std::string_view get_hostname() const noexcept; /** * The pathname getter steps are to return the result of URL path serializing * this's URL. * This function does not allocate memory. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-pathname */ [[nodiscard]] std::string_view get_pathname() const noexcept; /** * Compute the pathname length in bytes without instantiating a view or a * string. * @return size of the pathname in bytes * @see https://url.spec.whatwg.org/#dom-url-pathname */ ada_really_inline uint32_t get_pathname_length() const noexcept; /** * Return U+003F (?), followed by this's URL's query. * This function does not allocate memory. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-search */ [[nodiscard]] std::string_view get_search() const noexcept; /** * The protocol getter steps are to return this's URL's scheme, followed by * U+003A (:). * This function does not allocate memory. * @return a lightweight std::string_view. * @see https://url.spec.whatwg.org/#dom-url-protocol */ [[nodiscard]] std::string_view get_protocol() const noexcept; /** * A URL includes credentials if its username or password is not the empty * string. */ [[nodiscard]] ada_really_inline bool has_credentials() const noexcept; /** * Useful for implementing efficient serialization for the URL. * * https://user:pass@example.com:1234/foo/bar?baz#quux * | | | | ^^^^| | | * | | | | | | | `----- hash_start * | | | | | | `--------- search_start * | | | | | `----------------- pathname_start * | | | | `--------------------- port * | | | `----------------------- host_end * | | `---------------------------------- host_start * | `--------------------------------------- username_end * `--------------------------------------------- protocol_end * * Inspired after servo/url * * @return a constant reference to the underlying component attribute. * * @see * https://github.com/servo/rust-url/blob/b65a45515c10713f6d212e6726719a020203cc98/url/src/quirks.rs#L31 */ [[nodiscard]] ada_really_inline const ada::url_components &get_components() const noexcept; /** * Returns a string representation of this URL. */ std::string to_string() const override; /** * Returns a string diagram of this URL. */ std::string to_diagram() const; /** * Verifies that the parsed URL could be valid. Useful for debugging purposes. * @return true if the URL is valid, otherwise return true of the offsets are * possible. */ bool validate() const noexcept; /** @return true if it has an host but it is the empty string */ [[nodiscard]] inline bool has_empty_hostname() const noexcept; /** @return true if it has a host (included an empty host) */ [[nodiscard]] inline bool has_hostname() const noexcept; /** @return true if the URL has a non-empty username */ [[nodiscard]] inline bool has_non_empty_username() const noexcept; /** @return true if the URL has a non-empty password */ [[nodiscard]] inline bool has_non_empty_password() const noexcept; /** @return true if the URL has a (non default) port */ [[nodiscard]] inline bool has_port() const noexcept; /** @return true if the URL has a password */ [[nodiscard]] inline bool has_password() const noexcept; /** @return true if the URL has a hash component */ [[nodiscard]] inline bool has_hash() const noexcept override; /** @return true if the URL has a search component */ [[nodiscard]] inline bool has_search() const noexcept override; private: friend ada::url_aggregator ada::parser::parse_url( std::string_view, const ada::url_aggregator *); friend void ada::helpers::strip_trailing_spaces_from_opaque_path< ada::url_aggregator>(ada::url_aggregator &url) noexcept; std::string buffer{}; url_components components{}; /** * Returns true if neither the search, nor the hash nor the pathname * have been set. * @return true if the buffer is ready to receive the path. */ [[nodiscard]] ada_really_inline bool is_at_path() const noexcept; inline void add_authority_slashes_if_needed() noexcept; /** * To optimize performance, you may indicate how much memory to allocate * within this instance. */ inline void reserve(uint32_t capacity); ada_really_inline size_t parse_port(std::string_view view, bool check_trailing_content = false) noexcept override; /** * Return true on success. * @see https://url.spec.whatwg.org/#concept-ipv4-parser */ [[nodiscard]] bool parse_ipv4(std::string_view input); /** * Return true on success. * @see https://url.spec.whatwg.org/#concept-ipv6-parser */ [[nodiscard]] bool parse_ipv6(std::string_view input); /** * Return true on success. * @see https://url.spec.whatwg.org/#concept-opaque-host-parser */ [[nodiscard]] bool parse_opaque_host(std::string_view input); ada_really_inline void parse_path(std::string_view input); /** * A URL cannot have a username/password/port if its host is null or the empty * string, or its scheme is "file". */ [[nodiscard]] inline bool cannot_have_credentials_or_port() const; template bool set_host_or_hostname(const std::string_view input); ada_really_inline bool parse_host(std::string_view input); inline void update_base_authority(std::string_view base_buffer, const ada::url_components &base); inline void update_unencoded_base_hash(std::string_view input); inline void update_base_hostname(std::string_view input); inline void update_base_search(std::string_view input); inline void update_base_search(std::string_view input, const uint8_t *query_percent_encode_set); inline void update_base_pathname(const std::string_view input); inline void update_base_username(const std::string_view input); inline void append_base_username(const std::string_view input); inline void update_base_password(const std::string_view input); inline void append_base_password(const std::string_view input); inline void update_base_port(uint32_t input); inline void append_base_pathname(const std::string_view input); inline uint32_t retrieve_base_port() const; inline void clear_port(); inline void clear_hostname(); inline void clear_hash(); inline void clear_pathname() override; inline void clear_search() override; inline void clear_password(); inline bool has_dash_dot() const noexcept; void delete_dash_dot(); inline void consume_prepared_path(std::string_view input); template [[nodiscard]] ada_really_inline bool parse_scheme_with_colon( const std::string_view input); ada_really_inline uint32_t replace_and_resize(uint32_t start, uint32_t end, std::string_view input); inline bool has_authority() const noexcept; inline void set_protocol_as_file(); inline void set_scheme(std::string_view new_scheme) noexcept; /** * Fast function to set the scheme from a view with a colon in the * buffer, does not change type. */ inline void set_scheme_from_view_with_colon( std::string_view new_scheme_with_colon) noexcept; inline void copy_scheme(const url_aggregator &u) noexcept; }; // url_aggregator inline std::ostream &operator<<(std::ostream &out, const ada::url &u); } // namespace ada #endif /* end file include/ada/url_aggregator.h */ /* begin file include/ada/checkers.h */ /** * @file checkers.h * @brief Declarations for URL specific checkers used within Ada. */ #ifndef ADA_CHECKERS_H #define ADA_CHECKERS_H #include #include /** * @namespace ada::checkers * @brief Includes the definitions for validation functions */ namespace ada::checkers { /** * Assuming that x is an ASCII letter, this function returns the lower case * equivalent. * @details More likely to be inlined by the compiler and constexpr. */ constexpr char to_lower(char x) noexcept; /** * Returns true if the character is an ASCII letter. Equivalent to std::isalpha * but more likely to be inlined by the compiler. * * @attention std::isalpha is not constexpr generally. */ constexpr bool is_alpha(char x) noexcept; /** * Check whether a string starts with 0x or 0X. The function is only * safe if input.size() >=2. * * @see has_hex_prefix */ inline bool has_hex_prefix_unsafe(std::string_view input); /** * Check whether a string starts with 0x or 0X. */ inline bool has_hex_prefix(std::string_view input); /** * Check whether x is an ASCII digit. More likely to be inlined than * std::isdigit. */ constexpr bool is_digit(char x) noexcept; /** * @details A string starts with a Windows drive letter if all of the following * are true: * * - its length is greater than or equal to 2 * - its first two code points are a Windows drive letter * - its length is 2 or its third code point is U+002F (/), U+005C (\), U+003F * (?), or U+0023 (#). * * https://url.spec.whatwg.org/#start-with-a-windows-drive-letter */ inline constexpr bool is_windows_drive_letter(std::string_view input) noexcept; /** * @details A normalized Windows drive letter is a Windows drive letter of which * the second code point is U+003A (:). */ inline constexpr bool is_normalized_windows_drive_letter( std::string_view input) noexcept; /** * @warning Will be removed when Ada supports C++20. */ ada_really_inline constexpr bool begins_with(std::string_view view, std::string_view prefix); /** * Returns true if an input is an ipv4 address. */ ada_really_inline ada_constexpr bool is_ipv4(std::string_view view) noexcept; /** * Returns a bitset. If the first bit is set, then at least one character needs * percent encoding. If the second bit is set, a \\ is found. If the third bit * is set then we have a dot. If the fourth bit is set, then we have a percent * character. */ ada_really_inline constexpr uint8_t path_signature( std::string_view input) noexcept; /** * Returns true if the length of the domain name and its labels are according to * the specifications. The length of the domain must be 255 octets (253 * characters not including the last 2 which are the empty label reserved at the * end). When the empty label is included (a dot at the end), the domain name * can have 254 characters. The length of a label must be at least 1 and at most * 63 characters. * @see section 3.1. of https://www.rfc-editor.org/rfc/rfc1034 * @see https://www.unicode.org/reports/tr46/#ToASCII */ ada_really_inline constexpr bool verify_dns_length( std::string_view input) noexcept; } // namespace ada::checkers #endif // ADA_CHECKERS_H /* end file include/ada/checkers.h */ /* begin file include/ada/url.h */ /** * @file url.h * @brief Declaration for the URL */ #ifndef ADA_URL_H #define ADA_URL_H #include #include #include #include #include #include namespace ada { /** * @brief Generic URL struct reliant on std::string instantiation. * * @details To disambiguate from a valid URL string it can also be referred to * as a URL record. A URL is a struct that represents a universal identifier. * Unlike the url_aggregator, the ada::url represents the different components * of a parsed URL as independent std::string instances. This makes the * structure heavier and more reliant on memory allocations. When getting * components from the parsed URL, a new std::string is typically constructed. * * @see https://url.spec.whatwg.org/#url-representation */ struct url : url_base { url() = default; url(const url &u) = default; url(url &&u) noexcept = default; url &operator=(url &&u) noexcept = default; url &operator=(const url &u) = default; ~url() = default; /** * @private * A URL's username is an ASCII string identifying a username. It is initially * the empty string. */ std::string username{}; /** * @private * A URL's password is an ASCII string identifying a password. It is initially * the empty string. */ std::string password{}; /** * @private * A URL's host is null or a host. It is initially null. */ std::optional host{}; /** * @private * A URL's port is either null or a 16-bit unsigned integer that identifies a * networking port. It is initially null. */ std::optional port{}; /** * @private * A URL's path is either an ASCII string or a list of zero or more ASCII * strings, usually identifying a location. */ std::string path{}; /** * @private * A URL's query is either null or an ASCII string. It is initially null. */ std::optional query{}; /** * @private * A URL's fragment is either null or an ASCII string that can be used for * further processing on the resource the URL's other components identify. It * is initially null. */ std::optional hash{}; /** @return true if it has an host but it is the empty string */ [[nodiscard]] inline bool has_empty_hostname() const noexcept; /** @return true if the URL has a (non default) port */ [[nodiscard]] inline bool has_port() const noexcept; /** @return true if it has a host (included an empty host) */ [[nodiscard]] inline bool has_hostname() const noexcept; [[nodiscard]] bool has_valid_domain() const noexcept override; /** * Returns a JSON string representation of this URL. */ std::string to_string() const override; /** * @see https://url.spec.whatwg.org/#dom-url-href * @see https://url.spec.whatwg.org/#concept-url-serializer */ [[nodiscard]] ada_really_inline std::string get_href() const noexcept; /** * The origin getter steps are to return the serialization of this's URL's * origin. [HTML] * @return a newly allocated string. * @see https://url.spec.whatwg.org/#concept-url-origin */ [[nodiscard]] std::string get_origin() const noexcept override; /** * The protocol getter steps are to return this's URL's scheme, followed by * U+003A (:). * @return a newly allocated string. * @see https://url.spec.whatwg.org/#dom-url-protocol */ [[nodiscard]] std::string get_protocol() const noexcept; /** * Return url's host, serialized, followed by U+003A (:) and url's port, * serialized. * When there is no host, this function returns the empty string. * @return a newly allocated string. * @see https://url.spec.whatwg.org/#dom-url-host */ [[nodiscard]] std::string get_host() const noexcept; /** * Return this's URL's host, serialized. * When there is no host, this function returns the empty string. * @return a newly allocated string. * @see https://url.spec.whatwg.org/#dom-url-hostname */ [[nodiscard]] std::string get_hostname() const noexcept; /** * The pathname getter steps are to return the result of URL path serializing * this's URL. * @return a newly allocated string. * @see https://url.spec.whatwg.org/#dom-url-pathname */ [[nodiscard]] const std::string_view get_pathname() const noexcept; /** * Compute the pathname length in bytes without instantiating a view or a * string. * @return size of the pathname in bytes * @see https://url.spec.whatwg.org/#dom-url-pathname */ ada_really_inline size_t get_pathname_length() const noexcept; /** * Return U+003F (?), followed by this's URL's query. * @return a newly allocated string. * @see https://url.spec.whatwg.org/#dom-url-search */ [[nodiscard]] std::string get_search() const noexcept; /** * The username getter steps are to return this's URL's username. * @return a constant reference to the underlying string. * @see https://url.spec.whatwg.org/#dom-url-username */ [[nodiscard]] const std::string &get_username() const noexcept; /** * @return Returns true on successful operation. * @see https://url.spec.whatwg.org/#dom-url-username */ bool set_username(const std::string_view input); /** * @return Returns true on success. * @see https://url.spec.whatwg.org/#dom-url-password */ bool set_password(const std::string_view input); /** * @return Returns true on success. * @see https://url.spec.whatwg.org/#dom-url-port */ bool set_port(const std::string_view input); /** * This function always succeeds. * @see https://url.spec.whatwg.org/#dom-url-hash */ void set_hash(const std::string_view input); /** * This function always succeeds. * @see https://url.spec.whatwg.org/#dom-url-search */ void set_search(const std::string_view input); /** * @return Returns true on success. * @see https://url.spec.whatwg.org/#dom-url-search */ bool set_pathname(const std::string_view input); /** * @return Returns true on success. * @see https://url.spec.whatwg.org/#dom-url-host */ bool set_host(const std::string_view input); /** * @return Returns true on success. * @see https://url.spec.whatwg.org/#dom-url-hostname */ bool set_hostname(const std::string_view input); /** * @return Returns true on success. * @see https://url.spec.whatwg.org/#dom-url-protocol */ bool set_protocol(const std::string_view input); /** * @see https://url.spec.whatwg.org/#dom-url-href */ bool set_href(const std::string_view input); /** * The password getter steps are to return this's URL's password. * @return a constant reference to the underlying string. * @see https://url.spec.whatwg.org/#dom-url-password */ [[nodiscard]] const std::string &get_password() const noexcept; /** * Return this's URL's port, serialized. * @return a newly constructed string representing the port. * @see https://url.spec.whatwg.org/#dom-url-port */ [[nodiscard]] std::string get_port() const noexcept; /** * Return U+0023 (#), followed by this's URL's fragment. * @return a newly constructed string representing the hash. * @see https://url.spec.whatwg.org/#dom-url-hash */ [[nodiscard]] std::string get_hash() const noexcept; /** * A URL includes credentials if its username or password is not the empty * string. */ [[nodiscard]] ada_really_inline bool has_credentials() const noexcept; /** * Useful for implementing efficient serialization for the URL. * * https://user:pass@example.com:1234/foo/bar?baz#quux * | | | | ^^^^| | | * | | | | | | | `----- hash_start * | | | | | | `--------- search_start * | | | | | `----------------- pathname_start * | | | | `--------------------- port * | | | `----------------------- host_end * | | `---------------------------------- host_start * | `--------------------------------------- username_end * `--------------------------------------------- protocol_end * * Inspired after servo/url * * @return a newly constructed component. * * @see * https://github.com/servo/rust-url/blob/b65a45515c10713f6d212e6726719a020203cc98/url/src/quirks.rs#L31 */ [[nodiscard]] ada_really_inline ada::url_components get_components() const noexcept; /** @return true if the URL has a hash component */ [[nodiscard]] inline bool has_hash() const noexcept override; /** @return true if the URL has a search component */ [[nodiscard]] inline bool has_search() const noexcept override; private: friend ada::url ada::parser::parse_url(std::string_view, const ada::url *); friend ada::url_aggregator ada::parser::parse_url( std::string_view, const ada::url_aggregator *); friend void ada::helpers::strip_trailing_spaces_from_opaque_path( ada::url &url) noexcept; inline void update_unencoded_base_hash(std::string_view input); inline void update_base_hostname(std::string_view input); inline void update_base_search(std::string_view input); inline void update_base_search(std::string_view input, const uint8_t query_percent_encode_set[]); inline void update_base_search(std::optional input); inline void update_base_pathname(const std::string_view input); inline void update_base_username(const std::string_view input); inline void update_base_password(const std::string_view input); inline void update_base_port(std::optional input); /** * Sets the host or hostname according to override condition. * Return true on success. * @see https://url.spec.whatwg.org/#hostname-state */ template bool set_host_or_hostname(std::string_view input); /** * Return true on success. * @see https://url.spec.whatwg.org/#concept-ipv4-parser */ [[nodiscard]] bool parse_ipv4(std::string_view input); /** * Return true on success. * @see https://url.spec.whatwg.org/#concept-ipv6-parser */ [[nodiscard]] bool parse_ipv6(std::string_view input); /** * Return true on success. * @see https://url.spec.whatwg.org/#concept-opaque-host-parser */ [[nodiscard]] bool parse_opaque_host(std::string_view input); /** * A URL's scheme is an ASCII string that identifies the type of URL and can * be used to dispatch a URL for further processing after parsing. It is * initially the empty string. We only set non_special_scheme when the scheme * is non-special, otherwise we avoid constructing string. * * Special schemes are stored in ada::scheme::details::is_special_list so we * typically do not need to store them in each url instance. */ std::string non_special_scheme{}; /** * A URL cannot have a username/password/port if its host is null or the empty * string, or its scheme is "file". */ [[nodiscard]] inline bool cannot_have_credentials_or_port() const; ada_really_inline size_t parse_port(std::string_view view, bool check_trailing_content = false) noexcept override; /** * Take the scheme from another URL. The scheme string is copied from the * provided url. */ inline void copy_scheme(const ada::url &u); /** * Parse the host from the provided input. We assume that * the input does not contain spaces or tabs. Control * characters and spaces are not trimmed (they should have * been removed if needed). * Return true on success. * @see https://url.spec.whatwg.org/#host-parsing */ [[nodiscard]] ada_really_inline bool parse_host(std::string_view input); template [[nodiscard]] ada_really_inline bool parse_scheme( const std::string_view input); inline void clear_pathname() override; inline void clear_search() override; inline void set_protocol_as_file(); /** * Parse the path from the provided input. * Return true on success. Control characters not * trimmed from the ends (they should have * been removed if needed). * * The input is expected to be UTF-8. * * @see https://url.spec.whatwg.org/ */ ada_really_inline void parse_path(const std::string_view input); /** * Set the scheme for this URL. The provided scheme should be a valid * scheme string, be lower-cased, not contain spaces or tabs. It should * have no spurious trailing or leading content. */ inline void set_scheme(std::string &&new_scheme) noexcept; /** * Take the scheme from another URL. The scheme string is moved from the * provided url. */ inline void copy_scheme(ada::url &&u) noexcept; }; // struct url inline std::ostream &operator<<(std::ostream &out, const ada::url &u); } // namespace ada #endif // ADA_URL_H /* end file include/ada/url.h */ #include #include #if ADA_REGULAR_VISUAL_STUDIO #include #endif // ADA_REGULAR_VISUAL_STUDIO namespace ada { [[nodiscard]] ada_really_inline bool url_base::is_special() const noexcept { return type != ada::scheme::NOT_SPECIAL; } [[nodiscard]] inline uint16_t url_base::get_special_port() const noexcept { return ada::scheme::get_special_port(type); } [[nodiscard]] ada_really_inline uint16_t url_base::scheme_default_port() const noexcept { return scheme::get_special_port(type); } } // namespace ada #endif // ADA_URL_BASE_INL_H /* end file include/ada/url_base-inl.h */ /* begin file include/ada/url-inl.h */ /** * @file url-inl.h * @brief Definitions for the URL */ #ifndef ADA_URL_INL_H #define ADA_URL_INL_H #include #include #if ADA_REGULAR_VISUAL_STUDIO #include #endif // ADA_REGULAR_VISUAL_STUDIO namespace ada { [[nodiscard]] ada_really_inline bool url::has_credentials() const noexcept { return !username.empty() || !password.empty(); } [[nodiscard]] ada_really_inline bool url::has_port() const noexcept { return port.has_value(); } [[nodiscard]] inline bool url::cannot_have_credentials_or_port() const { return !host.has_value() || host.value().empty() || type == ada::scheme::type::FILE; } [[nodiscard]] inline bool url::has_empty_hostname() const noexcept { if (!host.has_value()) { return false; } return host.value().empty(); } [[nodiscard]] inline bool url::has_hostname() const noexcept { return host.has_value(); } inline std::ostream &operator<<(std::ostream &out, const ada::url &u) { return out << u.to_string(); } size_t url::get_pathname_length() const noexcept { return path.size(); } [[nodiscard]] ada_really_inline ada::url_components url::get_components() const noexcept { url_components out{}; // protocol ends with ':'. for example: "https:" out.protocol_end = uint32_t(get_protocol().size()); // Trailing index is always the next character of the current one. size_t running_index = out.protocol_end; if (host.has_value()) { // 2 characters for "//" and 1 character for starting index out.host_start = out.protocol_end + 2; if (has_credentials()) { out.username_end = uint32_t(out.host_start + username.size()); out.host_start += uint32_t(username.size()); if (!password.empty()) { out.host_start += uint32_t(password.size() + 1); } out.host_end = uint32_t(out.host_start + host.value().size()); } else { out.username_end = out.host_start; // Host does not start with "@" if it does not include credentials. out.host_end = uint32_t(out.host_start + host.value().size()) - 1; } running_index = out.host_end + 1; } else { // Update host start and end date to the same index, since it does not // exist. out.host_start = out.protocol_end; out.host_end = out.host_start; if (!has_opaque_path && checkers::begins_with(path, "//")) { // If url's host is null, url does not have an opaque path, url's path's // size is greater than 1, and url's path[0] is the empty string, then // append U+002F (/) followed by U+002E (.) to output. running_index = out.protocol_end + 2; } else { running_index = out.protocol_end; } } if (port.has_value()) { out.port = *port; running_index += helpers::fast_digit_count(*port) + 1; // Port omits ':' } out.pathname_start = uint32_t(running_index); running_index += path.size(); if (query.has_value()) { out.search_start = uint32_t(running_index); running_index += get_search().size(); if (get_search().size() == 0) { running_index++; } } if (hash.has_value()) { out.hash_start = uint32_t(running_index); } return out; } inline void url::update_base_hostname(std::string_view input) { host = input; } inline void url::update_unencoded_base_hash(std::string_view input) { // We do the percent encoding hash = unicode::percent_encode(input, ada::character_sets::FRAGMENT_PERCENT_ENCODE); } inline void url::update_base_search(std::string_view input, const uint8_t query_percent_encode_set[]) { query = ada::unicode::percent_encode(input, query_percent_encode_set); } inline void url::update_base_search(std::optional input) { query = input; } inline void url::update_base_pathname(const std::string_view input) { path = input; } inline void url::update_base_username(const std::string_view input) { username = input; } inline void url::update_base_password(const std::string_view input) { password = input; } inline void url::update_base_port(std::optional input) { port = input; } inline void url::clear_pathname() { path.clear(); } inline void url::clear_search() { query = std::nullopt; } [[nodiscard]] inline bool url::has_hash() const noexcept { return hash.has_value(); } [[nodiscard]] inline bool url::has_search() const noexcept { return query.has_value(); } inline void url::set_protocol_as_file() { type = ada::scheme::type::FILE; } inline void url::set_scheme(std::string &&new_scheme) noexcept { type = ada::scheme::get_scheme_type(new_scheme); // We only move the 'scheme' if it is non-special. if (!is_special()) { non_special_scheme = new_scheme; } } inline void url::copy_scheme(ada::url &&u) noexcept { non_special_scheme = u.non_special_scheme; type = u.type; } inline void url::copy_scheme(const ada::url &u) { non_special_scheme = u.non_special_scheme; type = u.type; } [[nodiscard]] ada_really_inline std::string url::get_href() const noexcept { std::string output = get_protocol(); if (host.has_value()) { output += "//"; if (has_credentials()) { output += username; if (!password.empty()) { output += ":" + get_password(); } output += "@"; } output += host.value(); if (port.has_value()) { output += ":" + get_port(); } } else if (!has_opaque_path && checkers::begins_with(path, "//")) { // If url's host is null, url does not have an opaque path, url's path's // size is greater than 1, and url's path[0] is the empty string, then // append U+002F (/) followed by U+002E (.) to output. output += "/."; } output += path; if (query.has_value()) { output += "?" + query.value(); } if (hash.has_value()) { output += "#" + hash.value(); } return output; } ada_really_inline size_t url::parse_port(std::string_view view, bool check_trailing_content) noexcept { ada_log("parse_port('", view, "') ", view.size()); uint16_t parsed_port{}; auto r = std::from_chars(view.data(), view.data() + view.size(), parsed_port); if (r.ec == std::errc::result_out_of_range) { ada_log("parse_port: std::errc::result_out_of_range"); is_valid = false; return 0; } ada_log("parse_port: ", parsed_port); const size_t consumed = size_t(r.ptr - view.data()); ada_log("parse_port: consumed ", consumed); if (check_trailing_content) { is_valid &= (consumed == view.size() || view[consumed] == '/' || view[consumed] == '?' || (is_special() && view[consumed] == '\\')); } ada_log("parse_port: is_valid = ", is_valid); if (is_valid) { // scheme_default_port can return 0, and we should allow 0 as a base port. auto default_port = scheme_default_port(); bool is_port_valid = (default_port == 0 && parsed_port == 0) || (default_port != parsed_port); port = (r.ec == std::errc() && is_port_valid) ? std::optional(parsed_port) : std::nullopt; } return consumed; } } // namespace ada #endif // ADA_URL_H /* end file include/ada/url-inl.h */ /* begin file include/ada/url_aggregator-inl.h */ /** * @file url_aggregator-inl.h * @brief Inline functions for url aggregator */ #ifndef ADA_URL_AGGREGATOR_INL_H #define ADA_URL_AGGREGATOR_INL_H /* begin file include/ada/unicode-inl.h */ /** * @file unicode-inl.h * @brief Definitions for unicode operations. */ #ifndef ADA_UNICODE_INL_H #define ADA_UNICODE_INL_H #include /** * @namespace ada::unicode * @brief Includes the declarations for unicode operations */ namespace ada::unicode { ada_really_inline size_t percent_encode_index(const std::string_view input, const uint8_t character_set[]) { return std::distance( input.begin(), std::find_if(input.begin(), input.end(), [character_set](const char c) { return character_sets::bit_at(character_set, c); })); } } // namespace ada::unicode #endif // ADA_UNICODE_INL_H /* end file include/ada/unicode-inl.h */ #include #include namespace ada { inline void url_aggregator::update_base_authority( std::string_view base_buffer, const ada::url_components &base) { std::string_view input = base_buffer.substr( base.protocol_end, base.host_start - base.protocol_end); ada_log("url_aggregator::update_base_authority ", input); bool input_starts_with_dash = checkers::begins_with(input, "//"); uint32_t diff = components.host_start - components.protocol_end; buffer.erase(components.protocol_end, components.host_start - components.protocol_end); components.username_end = components.protocol_end; if (input_starts_with_dash) { input.remove_prefix(2); diff += 2; // add "//" buffer.insert(components.protocol_end, "//"); components.username_end += 2; } size_t password_delimiter = input.find(':'); // Check if input contains both username and password by checking the // delimiter: ":" A typical input that contains authority would be "user:pass" if (password_delimiter != std::string_view::npos) { // Insert both username and password std::string_view username = input.substr(0, password_delimiter); std::string_view password = input.substr(password_delimiter + 1); buffer.insert(components.protocol_end + diff, username); diff += uint32_t(username.size()); buffer.insert(components.protocol_end + diff, ":"); components.username_end = components.protocol_end + diff; buffer.insert(components.protocol_end + diff + 1, password); diff += uint32_t(password.size()) + 1; } else if (!input.empty()) { // Insert only username buffer.insert(components.protocol_end + diff, input); components.username_end = components.protocol_end + diff + uint32_t(input.size()); diff += uint32_t(input.size()); } components.host_start += diff; if (buffer.size() > base.host_start && buffer[base.host_start] != '@') { buffer.insert(components.host_start, "@"); diff++; } components.host_end += diff; components.pathname_start += diff; if (components.search_start != url_components::omitted) { components.search_start += diff; } if (components.hash_start != url_components::omitted) { components.hash_start += diff; } } inline void url_aggregator::update_unencoded_base_hash(std::string_view input) { ada_log("url_aggregator::update_unencoded_base_hash ", input, " [", input.size(), " bytes], buffer is '", buffer, "' [", buffer.size(), " bytes] components.hash_start = ", components.hash_start); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); if (components.hash_start != url_components::omitted) { buffer.resize(components.hash_start); } components.hash_start = uint32_t(buffer.size()); buffer += "#"; bool encoding_required = unicode::percent_encode( input, ada::character_sets::FRAGMENT_PERCENT_ENCODE, buffer); // When encoding_required is false, then buffer is left unchanged, and percent // encoding was not deemed required. if (!encoding_required) { buffer.append(input); } ada_log("url_aggregator::update_unencoded_base_hash final buffer is '", buffer, "' [", buffer.size(), " bytes]"); ADA_ASSERT_TRUE(validate()); } ada_really_inline uint32_t url_aggregator::replace_and_resize( uint32_t start, uint32_t end, std::string_view input) { uint32_t current_length = end - start; uint32_t input_size = uint32_t(input.size()); uint32_t new_difference = input_size - current_length; if (current_length == 0) { buffer.insert(start, input); } else if (input_size == current_length) { buffer.replace(start, input_size, input); } else if (input_size < current_length) { buffer.erase(start, current_length - input_size); buffer.replace(start, input_size, input); } else { buffer.replace(start, current_length, input.substr(0, current_length)); buffer.insert(start + current_length, input.substr(current_length)); } return new_difference; } inline void url_aggregator::update_base_hostname(const std::string_view input) { ada_log("url_aggregator::update_base_hostname ", input, " [", input.size(), " bytes], buffer is '", buffer, "' [", buffer.size(), " bytes]"); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); // This next line is required for when parsing a URL like `foo://` add_authority_slashes_if_needed(); bool has_credentials = components.protocol_end + 2 < components.host_start; uint32_t new_difference = replace_and_resize(components.host_start, components.host_end, input); if (has_credentials) { buffer.insert(components.host_start, "@"); new_difference++; } components.host_end += new_difference; components.pathname_start += new_difference; if (components.search_start != url_components::omitted) { components.search_start += new_difference; } if (components.hash_start != url_components::omitted) { components.hash_start += new_difference; } ADA_ASSERT_TRUE(validate()); } ada_really_inline uint32_t url_aggregator::get_pathname_length() const noexcept { ada_log("url_aggregator::get_pathname_length"); uint32_t ending_index = uint32_t(buffer.size()); if (components.search_start != url_components::omitted) { ending_index = components.search_start; } else if (components.hash_start != url_components::omitted) { ending_index = components.hash_start; } return ending_index - components.pathname_start; } [[nodiscard]] ada_really_inline bool url_aggregator::is_at_path() const noexcept { return buffer.size() == components.pathname_start; } inline void url_aggregator::update_base_search(std::string_view input) { ada_log("url_aggregator::update_base_search ", input); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); if (input.empty()) { clear_search(); return; } if (input[0] == '?') { input.remove_prefix(1); } if (components.hash_start == url_components::omitted) { if (components.search_start == url_components::omitted) { components.search_start = uint32_t(buffer.size()); buffer += "?"; } else { buffer.resize(components.search_start + 1); } buffer.append(input); } else { if (components.search_start == url_components::omitted) { components.search_start = components.hash_start; } else { buffer.erase(components.search_start, components.hash_start - components.search_start); components.hash_start = components.search_start; } buffer.insert(components.search_start, "?"); buffer.insert(components.search_start + 1, input); components.hash_start += uint32_t(input.size() + 1); // Do not forget `?` } ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::update_base_search( std::string_view input, const uint8_t query_percent_encode_set[]) { ada_log("url_aggregator::update_base_search ", input, " with encoding parameter ", to_string(), "\n", to_diagram()); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); if (components.hash_start == url_components::omitted) { if (components.search_start == url_components::omitted) { components.search_start = uint32_t(buffer.size()); buffer += "?"; } else { buffer.resize(components.search_start + 1); } bool encoding_required = unicode::percent_encode(input, query_percent_encode_set, buffer); // When encoding_required is false, then buffer is left unchanged, and // percent encoding was not deemed required. if (!encoding_required) { buffer.append(input); } } else { if (components.search_start == url_components::omitted) { components.search_start = components.hash_start; } else { buffer.erase(components.search_start, components.hash_start - components.search_start); components.hash_start = components.search_start; } buffer.insert(components.search_start, "?"); size_t idx = ada::unicode::percent_encode_index(input, query_percent_encode_set); if (idx == input.size()) { buffer.insert(components.search_start + 1, input); components.hash_start += uint32_t(input.size() + 1); // Do not forget `?` } else { buffer.insert(components.search_start + 1, input, 0, idx); input.remove_prefix(idx); // We only create a temporary string if we need percent encoding and // we attempt to create as small a temporary string as we can. std::string encoded = ada::unicode::percent_encode(input, query_percent_encode_set); buffer.insert(components.search_start + idx + 1, encoded); components.hash_start += uint32_t(encoded.size() + idx + 1); // Do not forget `?` } } ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::update_base_pathname(const std::string_view input) { ada_log("url_aggregator::update_base_pathname '", input, "' [", input.size(), " bytes] \n", to_diagram()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); ADA_ASSERT_TRUE(validate()); const bool begins_with_dashdash = checkers::begins_with(input, "//"); if (!begins_with_dashdash && has_dash_dot()) { ada_log("url_aggregator::update_base_pathname has /.: \n", to_diagram()); // We must delete the ./ delete_dash_dot(); } if (begins_with_dashdash && !has_opaque_path && !has_authority() && !has_dash_dot()) { // If url's host is null, url does not have an opaque path, url's path's // size is greater than 1, then append U+002F (/) followed by U+002E (.) to // output. buffer.insert(components.pathname_start, "/."); components.pathname_start += 2; } uint32_t difference = replace_and_resize( components.pathname_start, components.pathname_start + get_pathname_length(), input); if (components.search_start != url_components::omitted) { components.search_start += difference; } if (components.hash_start != url_components::omitted) { components.hash_start += difference; } ada_log("url_aggregator::update_base_pathname end '", input, "' [", input.size(), " bytes] \n", to_diagram()); ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::append_base_pathname(const std::string_view input) { ada_log("url_aggregator::append_base_pathname ", input, " ", to_string(), "\n", to_diagram()); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); #if ADA_DEVELOPMENT_CHECKS // computing the expected password. std::string path_expected = std::string(get_pathname()); path_expected.append(input); #endif // ADA_DEVELOPMENT_CHECKS uint32_t ending_index = uint32_t(buffer.size()); if (components.search_start != url_components::omitted) { ending_index = components.search_start; } else if (components.hash_start != url_components::omitted) { ending_index = components.hash_start; } buffer.insert(ending_index, input); if (components.search_start != url_components::omitted) { components.search_start += uint32_t(input.size()); } if (components.hash_start != url_components::omitted) { components.hash_start += uint32_t(input.size()); } #if ADA_DEVELOPMENT_CHECKS std::string path_after = std::string(get_pathname()); ADA_ASSERT_EQUAL( path_expected, path_after, "append_base_pathname problem after inserting " + std::string(input)); #endif // ADA_DEVELOPMENT_CHECKS ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::update_base_username(const std::string_view input) { ada_log("url_aggregator::update_base_username '", input, "' ", to_string(), "\n", to_diagram()); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); add_authority_slashes_if_needed(); bool has_password = has_non_empty_password(); bool host_starts_with_at = buffer.size() > components.host_start && buffer[components.host_start] == '@'; uint32_t diff = replace_and_resize(components.protocol_end + 2, components.username_end, input); components.username_end += diff; components.host_start += diff; if (!input.empty() && !host_starts_with_at) { buffer.insert(components.host_start, "@"); diff++; } else if (input.empty() && host_starts_with_at && !has_password) { // Input is empty, there is no password, and we need to remove "@" from // hostname buffer.erase(components.host_start, 1); diff--; } components.host_end += diff; components.pathname_start += diff; if (components.search_start != url_components::omitted) { components.search_start += diff; } if (components.hash_start != url_components::omitted) { components.hash_start += diff; } ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::append_base_username(const std::string_view input) { ada_log("url_aggregator::append_base_username ", input); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); #if ADA_DEVELOPMENT_CHECKS // computing the expected password. std::string username_expected = std::string(get_username()); username_expected.append(input); #endif // ADA_DEVELOPMENT_CHECKS add_authority_slashes_if_needed(); // If input is empty, do nothing. if (input.empty()) { return; } uint32_t difference = uint32_t(input.size()); buffer.insert(components.username_end, input); components.username_end += difference; components.host_start += difference; if (buffer[components.host_start] != '@' && components.host_start != components.host_end) { buffer.insert(components.host_start, "@"); difference++; } components.host_end += difference; components.pathname_start += difference; if (components.search_start != url_components::omitted) { components.search_start += difference; } if (components.hash_start != url_components::omitted) { components.hash_start += difference; } #if ADA_DEVELOPMENT_CHECKS std::string username_after = std::string(get_username()); ADA_ASSERT_EQUAL( username_expected, username_after, "append_base_username problem after inserting " + std::string(input)); #endif // ADA_DEVELOPMENT_CHECKS ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::clear_password() { ada_log("url_aggregator::clear_password ", to_string(), "\n", to_diagram()); ADA_ASSERT_TRUE(validate()); if (!has_password()) { return; } uint32_t diff = components.host_start - components.username_end; buffer.erase(components.username_end, diff); components.host_start -= diff; components.host_end -= diff; components.pathname_start -= diff; if (components.search_start != url_components::omitted) { components.search_start -= diff; } if (components.hash_start != url_components::omitted) { components.hash_start -= diff; } } inline void url_aggregator::update_base_password(const std::string_view input) { ada_log("url_aggregator::update_base_password ", input); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); add_authority_slashes_if_needed(); // TODO: Optimization opportunity. Merge the following removal functions. if (input.empty()) { clear_password(); // Remove username too, if it is empty. if (!has_non_empty_username()) { update_base_username(""); } return; } bool password_exists = has_password(); uint32_t difference = uint32_t(input.size()); if (password_exists) { uint32_t current_length = components.host_start - components.username_end - 1; buffer.erase(components.username_end + 1, current_length); difference -= current_length; } else { buffer.insert(components.username_end, ":"); difference++; } buffer.insert(components.username_end + 1, input); components.host_start += difference; // The following line is required to add "@" to hostname. When updating // password if hostname does not start with "@", it is "update_base_password"s // responsibility to set it. if (buffer[components.host_start] != '@') { buffer.insert(components.host_start, "@"); difference++; } components.host_end += difference; components.pathname_start += difference; if (components.search_start != url_components::omitted) { components.search_start += difference; } if (components.hash_start != url_components::omitted) { components.hash_start += difference; } ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::append_base_password(const std::string_view input) { ada_log("url_aggregator::append_base_password ", input, " ", to_string(), "\n", to_diagram()); ADA_ASSERT_TRUE(validate()); ADA_ASSERT_TRUE(!helpers::overlaps(input, buffer)); #if ADA_DEVELOPMENT_CHECKS // computing the expected password. std::string password_expected = std::string(get_password()); password_expected.append(input); #endif // ADA_DEVELOPMENT_CHECKS add_authority_slashes_if_needed(); // If input is empty, do nothing. if (input.empty()) { return; } uint32_t difference = uint32_t(input.size()); if (has_password()) { buffer.insert(components.host_start, input); } else { difference++; // Increment for ":" buffer.insert(components.username_end, ":"); buffer.insert(components.username_end + 1, input); } components.host_start += difference; // The following line is required to add "@" to hostname. When updating // password if hostname does not start with "@", it is "append_base_password"s // responsibility to set it. if (buffer[components.host_start] != '@') { buffer.insert(components.host_start, "@"); difference++; } components.host_end += difference; components.pathname_start += difference; if (components.search_start != url_components::omitted) { components.search_start += difference; } if (components.hash_start != url_components::omitted) { components.hash_start += difference; } #if ADA_DEVELOPMENT_CHECKS std::string password_after = std::string(get_password()); ADA_ASSERT_EQUAL( password_expected, password_after, "append_base_password problem after inserting " + std::string(input)); #endif // ADA_DEVELOPMENT_CHECKS ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::update_base_port(uint32_t input) { ada_log("url_aggregator::update_base_port"); ADA_ASSERT_TRUE(validate()); if (input == url_components::omitted) { clear_port(); return; } // calling std::to_string(input.value()) is unfortunate given that the port // value is probably already available as a string. std::string value = helpers::concat(":", std::to_string(input)); uint32_t difference = uint32_t(value.size()); if (components.port != url_components::omitted) { difference -= components.pathname_start - components.host_end; buffer.erase(components.host_end, components.pathname_start - components.host_end); } buffer.insert(components.host_end, value); components.pathname_start += difference; if (components.search_start != url_components::omitted) { components.search_start += difference; } if (components.hash_start != url_components::omitted) { components.hash_start += difference; } components.port = input; ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::clear_port() { ada_log("url_aggregator::clear_port"); ADA_ASSERT_TRUE(validate()); if (components.port == url_components::omitted) { return; } uint32_t length = components.pathname_start - components.host_end; buffer.erase(components.host_end, length); components.pathname_start -= length; if (components.search_start != url_components::omitted) { components.search_start -= length; } if (components.hash_start != url_components::omitted) { components.hash_start -= length; } components.port = url_components::omitted; ADA_ASSERT_TRUE(validate()); } inline uint32_t url_aggregator::retrieve_base_port() const { ada_log("url_aggregator::retrieve_base_port"); return components.port; } inline void url_aggregator::clear_search() { ada_log("url_aggregator::clear_search"); ADA_ASSERT_TRUE(validate()); if (components.search_start == url_components::omitted) { return; } if (components.hash_start == url_components::omitted) { buffer.resize(components.search_start); } else { buffer.erase(components.search_start, components.hash_start - components.search_start); components.hash_start = components.search_start; } components.search_start = url_components::omitted; #if ADA_DEVELOPMENT_CHECKS ADA_ASSERT_EQUAL(get_search(), "", "search should have been cleared on buffer=" + buffer + " with " + components.to_string() + "\n" + to_diagram()); #endif ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::clear_hash() { ada_log("url_aggregator::clear_hash"); ADA_ASSERT_TRUE(validate()); if (components.hash_start == url_components::omitted) { return; } buffer.resize(components.hash_start); components.hash_start = url_components::omitted; #if ADA_DEVELOPMENT_CHECKS ADA_ASSERT_EQUAL(get_hash(), "", "hash should have been cleared on buffer=" + buffer + " with " + components.to_string() + "\n" + to_diagram()); #endif ADA_ASSERT_TRUE(validate()); } inline void url_aggregator::clear_pathname() { ada_log("url_aggregator::clear_pathname"); ADA_ASSERT_TRUE(validate()); uint32_t ending_index = uint32_t(buffer.size()); if (components.search_start != url_components::omitted) { ending_index = components.search_start; } else if (components.hash_start != url_components::omitted) { ending_index = components.hash_start; } uint32_t pathname_length = ending_index - components.pathname_start; buffer.erase(components.pathname_start, pathname_length); uint32_t difference = pathname_length; if (components.pathname_start == components.host_end + 2 && buffer[components.host_end] == '/' && buffer[components.host_end + 1] == '.') { components.pathname_start -= 2; buffer.erase(components.host_end, 2); difference += 2; } if (components.search_start != url_components::omitted) { components.search_start -= difference; } if (components.hash_start != url_components::omitted) { components.hash_start -= difference; } ada_log("url_aggregator::clear_pathname completed, running checks..."); #if ADA_DEVELOPMENT_CHECKS ADA_ASSERT_EQUAL(get_pathname(), "", "pathname should have been cleared on buffer=" + buffer + " with " + components.to_string() + "\n" + to_diagram()); #endif ADA_ASSERT_TRUE(validate()); ada_log("url_aggregator::clear_pathname completed, running checks... ok"); } inline void url_aggregator::clear_hostname() { ada_log("url_aggregator::clear_hostname"); ADA_ASSERT_TRUE(validate()); if (!has_authority()) { return; } ADA_ASSERT_TRUE(has_authority()); uint32_t hostname_length = components.host_end - components.host_start; uint32_t start = components.host_start; // If hostname starts with "@", we should not remove that character. if (hostname_length > 0 && buffer[start] == '@') { start++; hostname_length--; } buffer.erase(start, hostname_length); components.host_end = start; components.pathname_start -= hostname_length; if (components.search_start != url_components::omitted) { components.search_start -= hostname_length; } if (components.hash_start != url_components::omitted) { components.hash_start -= hostname_length; } #if ADA_DEVELOPMENT_CHECKS ADA_ASSERT_EQUAL(get_hostname(), "", "hostname should have been cleared on buffer=" + buffer + " with " + components.to_string() + "\n" + to_diagram()); #endif ADA_ASSERT_TRUE(has_authority()); ADA_ASSERT_TRUE(has_empty_hostname()); ADA_ASSERT_TRUE(validate()); } [[nodiscard]] inline bool url_aggregator::has_hash() const noexcept { ada_log("url_aggregator::has_hash"); return components.hash_start != url_components::omitted; } [[nodiscard]] inline bool url_aggregator::has_search() const noexcept { ada_log("url_aggregator::has_search"); return components.search_start != url_components::omitted; } ada_really_inline bool url_aggregator::has_credentials() const noexcept { ada_log("url_aggregator::has_credentials"); return has_non_empty_username() || has_non_empty_password(); } inline bool url_aggregator::cannot_have_credentials_or_port() const { ada_log("url_aggregator::cannot_have_credentials_or_port"); return type == ada::scheme::type::FILE || components.host_start == components.host_end; } [[nodiscard]] ada_really_inline const ada::url_components & url_aggregator::get_components() const noexcept { return components; } [[nodiscard]] inline bool ada::url_aggregator::has_authority() const noexcept { ada_log("url_aggregator::has_authority"); // Performance: instead of doing this potentially expensive check, we could // have a boolean in the struct. return components.protocol_end + 2 <= components.host_start && helpers::substring(buffer, components.protocol_end, components.protocol_end + 2) == "//"; } inline void ada::url_aggregator::add_authority_slashes_if_needed() noexcept { ada_log("url_aggregator::add_authority_slashes_if_needed"); ADA_ASSERT_TRUE(validate()); // Protocol setter will insert `http:` to the URL. It is up to hostname setter // to insert // `//` initially to the buffer, since it depends on the hostname existence. if (has_authority()) { return; } // Performance: the common case is components.protocol_end == buffer.size() // Optimization opportunity: in many cases, the "//" is part of the input and // the insert could be fused with another insert. buffer.insert(components.protocol_end, "//"); components.username_end += 2; components.host_start += 2; components.host_end += 2; components.pathname_start += 2; if (components.search_start != url_components::omitted) { components.search_start += 2; } if (components.hash_start != url_components::omitted) { components.hash_start += 2; } ADA_ASSERT_TRUE(validate()); } inline void ada::url_aggregator::reserve(uint32_t capacity) { buffer.reserve(capacity); } inline bool url_aggregator::has_non_empty_username() const noexcept { ada_log("url_aggregator::has_non_empty_username"); return components.protocol_end + 2 < components.username_end; } inline bool url_aggregator::has_non_empty_password() const noexcept { ada_log("url_aggregator::has_non_empty_password"); return components.host_start - components.username_end > 0; } inline bool url_aggregator::has_password() const noexcept { ada_log("url_aggregator::has_password"); // This function does not care about the length of the password return components.host_start > components.username_end && buffer[components.username_end] == ':'; } inline bool url_aggregator::has_empty_hostname() const noexcept { if (!has_hostname()) { return false; } if (components.host_start == components.host_end) { return true; } if (components.host_end > components.host_start + 1) { return false; } return components.username_end != components.host_start; } inline bool url_aggregator::has_hostname() const noexcept { return has_authority(); } inline bool url_aggregator::has_port() const noexcept { ada_log("url_aggregator::has_port"); return components.pathname_start != components.host_end; } inline bool url_aggregator::has_dash_dot() const noexcept { // If url's host is null, url does not have an opaque path, url's path's size // is greater than 1, and url's path[0] is the empty string, then append // U+002F (/) followed by U+002E (.) to output. ada_log("url_aggregator::has_dash_dot"); // Performance: instead of doing this potentially expensive check, we could // just have a boolean value in the structure. #if ADA_DEVELOPMENT_CHECKS if (components.pathname_start + 1 < buffer.size() && components.pathname_start == components.host_end + 2) { ADA_ASSERT_TRUE(buffer[components.host_end] == '/'); ADA_ASSERT_TRUE(buffer[components.host_end + 1] == '.'); ADA_ASSERT_TRUE(buffer[components.pathname_start] == '/'); ADA_ASSERT_TRUE(buffer[components.pathname_start + 1] == '/'); } #endif return !has_opaque_path && components.pathname_start == components.host_end + 2 && components.pathname_start + 1 < buffer.size(); } inline std::string_view url_aggregator::get_href() const noexcept { ada_log("url_aggregator::get_href"); return buffer; } ada_really_inline size_t url_aggregator::parse_port( std::string_view view, bool check_trailing_content) noexcept { ada_log("url_aggregator::parse_port('", view, "') ", view.size()); uint16_t parsed_port{}; auto r = std::from_chars(view.data(), view.data() + view.size(), parsed_port); if (r.ec == std::errc::result_out_of_range) { ada_log("parse_port: std::errc::result_out_of_range"); is_valid = false; return 0; } ada_log("parse_port: ", parsed_port); const size_t consumed = size_t(r.ptr - view.data()); ada_log("parse_port: consumed ", consumed); if (check_trailing_content) { is_valid &= (consumed == view.size() || view[consumed] == '/' || view[consumed] == '?' || (is_special() && view[consumed] == '\\')); } ada_log("parse_port: is_valid = ", is_valid); if (is_valid) { ada_log("parse_port", r.ec == std::errc()); // scheme_default_port can return 0, and we should allow 0 as a base port. auto default_port = scheme_default_port(); bool is_port_valid = (default_port == 0 && parsed_port == 0) || (default_port != parsed_port); if (r.ec == std::errc() && is_port_valid) { update_base_port(parsed_port); } else { clear_port(); } } return consumed; } inline void url_aggregator::set_protocol_as_file() { ada_log("url_aggregator::set_protocol_as_file "); ADA_ASSERT_TRUE(validate()); type = ada::scheme::type::FILE; // next line could overflow but unsigned arithmetic has well-defined // overflows. uint32_t new_difference = 5 - components.protocol_end; if (buffer.empty()) { buffer.append("file:"); } else { buffer.erase(0, components.protocol_end); buffer.insert(0, "file:"); } components.protocol_end = 5; // Update the rest of the components. components.username_end += new_difference; components.host_start += new_difference; components.host_end += new_difference; components.pathname_start += new_difference; if (components.search_start != url_components::omitted) { components.search_start += new_difference; } if (components.hash_start != url_components::omitted) { components.hash_start += new_difference; } ADA_ASSERT_TRUE(validate()); } inline std::ostream &operator<<(std::ostream &out, const ada::url_aggregator &u) { return out << u.to_string(); } } // namespace ada #endif // ADA_URL_AGGREGATOR_INL_H /* end file include/ada/url_aggregator-inl.h */ /* begin file include/ada/url_search_params.h */ /** * @file url_search_params.h * @brief Declaration for the URL Search Params */ #ifndef ADA_URL_SEARCH_PARAMS_H #define ADA_URL_SEARCH_PARAMS_H #include #include #include #include namespace ada { /** * @see https://url.spec.whatwg.org/#interface-urlsearchparams */ struct url_search_params { url_search_params() = default; /** * @see * https://github.com/web-platform-tests/wpt/blob/master/url/urlsearchparams-constructor.any.js */ url_search_params(const std::string_view input) { initialize(input); } url_search_params(const url_search_params &u) = default; url_search_params(url_search_params &&u) noexcept = default; url_search_params &operator=(url_search_params &&u) noexcept = default; url_search_params &operator=(const url_search_params &u) = default; ~url_search_params() = default; [[nodiscard]] inline size_t size() const noexcept; /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-append */ inline void append(std::string_view key, std::string_view value); /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-delete */ inline void remove(std::string_view key); inline void remove(std::string_view key, std::string_view value); /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-get */ inline std::optional get(std::string_view key); /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-getall */ inline std::vector get_all(std::string_view key); /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-has */ inline bool has(std::string_view key) noexcept; /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-set */ inline void set(std::string_view key, std::string_view value); /** * @see https://url.spec.whatwg.org/#dom-urlsearchparams-sort */ inline void sort(); /** * @see https://url.spec.whatwg.org/#urlsearchparams-stringification-behavior */ inline std::string to_string(); private: typedef std::pair key_value_pair; std::vector params{}; /** * @see https://url.spec.whatwg.org/#concept-urlencoded-parser */ void initialize(std::string_view init); }; // url_search_params } // namespace ada #endif /* end file include/ada/url_search_params.h */ /* begin file include/ada/url_search_params-inl.h */ /** * @file url_search_params-inl.h * @brief Inline declarations for the URL Search Params */ #ifndef ADA_URL_SEARCH_PARAMS_INL_H #define ADA_URL_SEARCH_PARAMS_INL_H #include #include #include #include #include namespace ada { inline void url_search_params::initialize(std::string_view input) { if (!input.empty() && input.front() == '?') { input.remove_prefix(1); } auto process_key_value = [&](const std::string_view current) { auto equal = current.find('='); if (equal == std::string_view::npos) { auto name = std::string(current); std::replace(name.begin(), name.end(), '+', ' '); params.emplace_back(unicode::percent_decode(name, name.find('%')), ""); } else { auto name = std::string(current.substr(0, equal)); auto value = std::string(current.substr(equal + 1)); std::replace(name.begin(), name.end(), '+', ' '); std::replace(value.begin(), value.end(), '+', ' '); params.emplace_back(unicode::percent_decode(name, name.find('%')), unicode::percent_decode(value, value.find('%'))); } }; while (!input.empty()) { auto ampersand_index = input.find('&'); if (ampersand_index == std::string_view::npos) { if (!input.empty()) { process_key_value(input); } break; } else if (ampersand_index != 0) { process_key_value(input.substr(0, ampersand_index)); } input.remove_prefix(ampersand_index + 1); } } inline void url_search_params::append(const std::string_view key, const std::string_view value) { params.emplace_back(key, value); } inline size_t url_search_params::size() const noexcept { return params.size(); } inline std::optional url_search_params::get( const std::string_view key) { auto entry = std::find_if(params.begin(), params.end(), [&key](auto ¶m) { return param.first == key; }); if (entry == params.end()) { return std::nullopt; } return entry->second; } inline std::vector url_search_params::get_all( const std::string_view key) { std::vector out{}; for (auto ¶m : params) { if (param.first == key) { out.emplace_back(param.second); } } return out; } inline bool url_search_params::has(const std::string_view key) noexcept { auto entry = std::find_if(params.begin(), params.end(), [&key](auto ¶m) { return param.first == key; }); return entry != params.end(); } inline std::string url_search_params::to_string() { auto character_set = ada::character_sets::WWW_FORM_URLENCODED_PERCENT_ENCODE; std::string out{}; for (size_t i = 0; i < params.size(); i++) { auto key = ada::unicode::percent_encode(params[i].first, character_set); auto value = ada::unicode::percent_encode(params[i].second, character_set); // Performance optimization: Move this inside percent_encode. std::replace(key.begin(), key.end(), ' ', '+'); std::replace(value.begin(), value.end(), ' ', '+'); if (i != 0) { out += "&"; } out.append(key); out += "="; out.append(value); } return out; } inline void url_search_params::set(const std::string_view key, const std::string_view value) { const auto find = [&key](auto ¶m) { return param.first == key; }; auto it = std::find_if(params.begin(), params.end(), find); if (it == params.end()) { params.emplace_back(key, value); } else { it->second = value; params.erase(std::remove_if(std::next(it), params.end(), find), params.end()); } } inline void url_search_params::remove(const std::string_view key) { params.erase( std::remove_if(params.begin(), params.end(), [&key](auto ¶m) { return param.first == key; }), params.end()); } inline void url_search_params::remove(const std::string_view key, const std::string_view value) { params.erase(std::remove_if(params.begin(), params.end(), [&key, &value](auto ¶m) { return param.first == key && param.second == value; }), params.end()); } inline void url_search_params::sort() { std::stable_sort(params.begin(), params.end(), [](const key_value_pair &lhs, const key_value_pair &rhs) { return lhs.first < rhs.first; }); } } // namespace ada #endif // ADA_URL_SEARCH_PARAMS_INL_H /* end file include/ada/url_search_params-inl.h */ // Public API /* begin file include/ada/ada_version.h */ /** * @file ada_version.h * @brief Definitions for Ada's version number. */ #ifndef ADA_ADA_VERSION_H #define ADA_ADA_VERSION_H #define ADA_VERSION "2.6.0" namespace ada { enum { ADA_VERSION_MAJOR = 2, ADA_VERSION_MINOR = 6, ADA_VERSION_REVISION = 0, }; } // namespace ada #endif // ADA_ADA_VERSION_H /* end file include/ada/ada_version.h */ /* begin file include/ada/implementation.h */ /** * @file implementation.h * @brief Definitions for user facing functions for parsing URL and it's * components. */ #ifndef ADA_IMPLEMENTATION_H #define ADA_IMPLEMENTATION_H #include #include namespace ada { enum class errors { generic_error }; template using result = tl::expected; /** * The URL parser takes a scalar value string input, with an optional null or * base URL base (default null). The parser assumes the input is a valid ASCII * or UTF-8 string. * * @param input the string input to analyze (must be valid ASCII or UTF-8) * @param base_url the optional URL input to use as a base url. * @return a parsed URL. */ template ada_warn_unused ada::result parse( std::string_view input, const result_type* base_url = nullptr); extern template ada::result parse(std::string_view input, const url* base_url); extern template ada::result parse( std::string_view input, const url_aggregator* base_url); /** * Verifies whether the URL strings can be parsed. The function assumes * that the inputs are valid ASCII or UTF-8 strings. * @see https://url.spec.whatwg.org/#dom-url-canparse * @return If URL can be parsed or not. */ bool can_parse(std::string_view input, const std::string_view* base_input = nullptr); /** * Computes a href string from a file path. The function assumes * that the input is a valid ASCII or UTF-8 string. * @return a href string (starts with file:://) */ std::string href_from_file(std::string_view path); } // namespace ada #endif // ADA_IMPLEMENTATION_H /* end file include/ada/implementation.h */ #endif // ADA_H /* end file include/ada.h */