stdex/include/stdex/unicode.hpp

/*
	SPDX-License-Identifier: MIT
	Copyright © 2023-2025 Amebis
*/

#pragma once

#include "assert.hpp"
#include "compat.hpp"
#include "endian.hpp"
#include "math.hpp"
#include "string.hpp"
#include <stdint.h>
#ifndef _WIN32
#include <iconv.h>
#include <langinfo.h>
#endif
#include <map>
#include <memory>
#include <string>

#if defined(__GNUC__)
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wdeprecated-declarations"
#pragma GCC diagnostic ignored "-Wexit-time-destructors"
#endif

namespace stdex
{
	///
	/// Charset identifiers
	///
	/// On Windows the enumerators carry code page numbers; `charset_encoder` casts them to a
	/// `UINT` code page (resolving `system` and `oem` through GetACP() and GetOEMCP()).
	/// Elsewhere the enumerators are sequential values that `charset_encoder` uses to index
	/// its table of iconv encoding names.
	///
	enum class charset_id : uint16_t {
#ifdef _WIN32
		system = CP_ACP,
		oem = CP_OEMCP,
		ascii = 20127,
		utf7 = CP_UTF7,
		utf8 = CP_UTF8,
		utf16 = 1200 /*CP_WINUNICODE*/,
		utf32 = 12000,
		windows1250 = 1250,
		windows1251 = 1251,
		windows1252 = 1252,
#else
		system = 0,
		ascii,
		utf7,
		utf8,
		utf16,
		utf32,
		windows1250,
		windows1251,
		windows1252,

		// Number of charsets above. Used as the size of the encoding name table in charset_encoder.
		_max
#endif
	};

#ifdef _WIN32
	// Charset of wchar_t strings: UTF-16 on Windows.
	constexpr charset_id wchar_t_charset = charset_id::utf16;
	// Charset selected by the build configuration: UTF-16 when _UNICODE is defined,
	// charset_id::system otherwise.
#ifdef _UNICODE
	constexpr charset_id system_charset = charset_id::utf16;
#else
	constexpr charset_id system_charset = charset_id::system;
#endif
#else
	// Charset of wchar_t strings: UTF-32 on non-Windows builds.
	constexpr charset_id wchar_t_charset = charset_id::utf32;
	// Non-Windows builds always use charset_id::system here.
	constexpr charset_id system_charset = charset_id::system;
#endif

	///
	/// Looks up a charset code by charset name
	///
	/// Names are matched against a fixed table of known aliases using stricmp().
	///
	/// \param[in] name  Zero-terminated charset name
	///
	/// \returns Matching charset code, or `charset_id::system` when the name is not in the table
	///
	inline charset_id charset_from_name(_In_z_ const char* name)
	{
		struct alias_t {
			const char* label;
			charset_id id;
		};
		static const alias_t aliases[] = {
			{ "ANSI_X3.4-1968", charset_id::ascii },
			{ "ANSI_X3.4-1986", charset_id::ascii },
			{ "ASCII", charset_id::ascii },
			{ "CP367", charset_id::ascii },
			{ "IBM367", charset_id::ascii },
			{ "ISO-IR-6", charset_id::ascii },
			{ "ISO646-US", charset_id::ascii },
			{ "ISO_646.IRV:1991", charset_id::ascii },
			{ "US", charset_id::ascii },
			{ "US-ASCII", charset_id::ascii },
			{ "CSASCII", charset_id::ascii },

			{ "UNICODE-1-1-UTF-7", charset_id::utf7 },
			{ "UTF-7", charset_id::utf7 },
			{ "CSUNICODE11UTF7", charset_id::utf7 },

			{ "UTF-8", charset_id::utf8 },
			{ "UTF8", charset_id::utf8 },

			// Only the byte order matching the platform maps to the native UTF-16/UTF-32 codes.
			{ "UTF-16", charset_id::utf16 },
#if BYTE_ORDER == BIG_ENDIAN
			{ "UTF-16BE", charset_id::utf16 },
#else
			{ "UTF-16LE", charset_id::utf16 },
#endif

			{ "UTF-32", charset_id::utf32 },
#if BYTE_ORDER == BIG_ENDIAN
			{ "UTF-32BE", charset_id::utf32 },
#else
			{ "UTF-32LE", charset_id::utf32 },
#endif

			{ "CP1250", charset_id::windows1250 },
			{ "MS-EE", charset_id::windows1250 },
			{ "WINDOWS-1250", charset_id::windows1250 },

			{ "CP1251", charset_id::windows1251 },
			{ "MS-CYRL", charset_id::windows1251 },
			{ "WINDOWS-1251", charset_id::windows1251 },

			{ "CP1252", charset_id::windows1252 },
			{ "MS-ANSI", charset_id::windows1252 },
			{ "WINDOWS-1252", charset_id::windows1252 },
		};

		for (const alias_t& alias : aliases) {
			if (stricmp(alias.label, name) == 0)
				return alias.id;
		}
		return charset_id::system;
	}

	///
	/// Parses charset name and returns matching charset code
	///
	/// Forwards `name.c_str()` to the zero-terminated string overload.
	///
	/// \param[in] name  Charset name
	///
	/// \returns Charset code or `charset_id::system` if match not found
	///
	template <class TR = std::char_traits<char>, class AX = std::allocator<char>>
	charset_id charset_from_name(_In_ const std::basic_string<char, TR, AX>& name)
	{
		return charset_from_name(name.c_str());
	}

	///
	/// Encoding converter context
	///
	template <typename T_from, typename T_to>
	class charset_encoder
	{
	protected:
		charset_id m_from, m_to;
		T_to m_invalid;

	public:
		charset_encoder(_In_ charset_id from, _In_ charset_id to, _In_ T_to invalid = '?') :
			m_from(from),
			m_to(to),
			m_invalid(invalid)
		{
#ifdef _WIN32
			m_from_wincp = to_encoding(from);
			m_to_wincp = to_encoding(to);
#else
			m_handle = iconv_open(to_encoding(to), to_encoding(from));
			if (m_handle == (iconv_t)-1)
				throw std::system_error(errno, std::system_category(), "iconv_open failed");
#endif
		}

#ifndef _WIN32
		~charset_encoder()
		{
			iconv_close(m_handle);
		}
#endif

		charset_id from_encoding() const { return m_from; }
		charset_id to_encoding() const { return m_to; }

		///
		/// Convert string and append to string
		///
		/// \param[in,out] dst        String to append converted string to
		/// \param[in]     src        String to convert
		/// \param[in]     count_src  String to convert code unit limit
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		void strcat(
			_Inout_ std::basic_string<T_to, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const T_from* src, _In_ size_t count_src)
		{
			stdex_assert(src || !count_src);
			count_src = strnlen<T_from>(src, count_src);
			if (!count_src) _Unlikely_
				return;

#ifdef _WIN32
			constexpr DWORD dwFlagsWCMB = 0;

			stdex_assert(src);
			if (m_from_wincp == m_to_wincp) _Unlikely_{
				dst.append(reinterpret_cast<const T_to*>(src), count_src);
				return;
			}

#pragma warning(suppress: 4127) // Can't use precompiler #if on template arguments, using "if" makes MSVC warnings.
			if constexpr (sizeof(T_from) == sizeof(char) && sizeof(T_to) == sizeof(wchar_t)) {
				stdex_assert(count_src < INT_MAX || count_src == SIZE_MAX);

				// Try to convert to stack buffer first.
				WCHAR szStackBuffer[1024 / sizeof(WCHAR)];
#pragma warning(suppress: 6387) // Testing indicates src may be NULL when count_src is also 0. Is SAL of the lpMultiByteStr parameter wrong?
				int cch = MultiByteToWideChar(m_from_wincp, 0, reinterpret_cast<LPCCH>(src), static_cast<int>(count_src), szStackBuffer, _countof(szStackBuffer));
				if (cch) {
					// Append from stack.
					dst.append(reinterpret_cast<const T_to*>(szStackBuffer), count_src != SIZE_MAX ? wcsnlen(szStackBuffer, cch) : static_cast<size_t>(cch) - 1);
					return;
				}
				DWORD dwResult = GetLastError();
				if (dwResult == ERROR_INSUFFICIENT_BUFFER) {
					// Query the required output size. Allocate buffer. Then convert again.
					cch = MultiByteToWideChar(m_from_wincp, 0, reinterpret_cast<LPCCH>(src), static_cast<int>(count_src), NULL, 0);
					size_t offset = dst.size();
					dst.resize(offset + static_cast<size_t>(cch));
					cch = MultiByteToWideChar(m_from_wincp, 0, reinterpret_cast<LPCCH>(src), static_cast<int>(count_src), &dst[offset], cch);
					dst.resize(offset + (count_src != SIZE_MAX ? wcsnlen(&dst[offset], cch) : static_cast<size_t>(cch) - 1));
					return;
				}
				throw std::system_error(dwResult, std::system_category(), "MultiByteToWideChar failed");
			}

#pragma warning(suppress: 4127) // Can't use precompiler #if on template arguments, using "if" makes MSVC warnings.
			if constexpr (sizeof(T_from) == sizeof(wchar_t) && sizeof(T_to) == sizeof(char)) {
				stdex_assert(count_src < INT_MAX || count_src == SIZE_MAX);
				LPCCH lpDefaultChar = m_to_wincp == CP_UTF8 || m_to_wincp == CP_UTF7 ? NULL : &m_invalid;

				// Try to convert to stack buffer first.
				CHAR szStackBuffer[1024 / sizeof(CHAR)];
#pragma warning(suppress: 6387) // Testing indicates src may be NULL when count_src is also 0. Is SAL of the lpWideCharStr parameter wrong?
				int cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, reinterpret_cast<LPCWCH>(src), static_cast<int>(count_src), szStackBuffer, _countof(szStackBuffer), lpDefaultChar, NULL);
				if (cch) {
					// Copy from stack. Be careful not to include zero terminator.
					dst.append(reinterpret_cast<const T_to*>(szStackBuffer), count_src != SIZE_MAX ? strnlen(szStackBuffer, cch) : static_cast<size_t>(cch) - 1);
					return;
				}
				DWORD dwResult = GetLastError();
				if (dwResult == ERROR_INSUFFICIENT_BUFFER) {
					// Query the required output size. Allocate buffer. Then convert again.
					cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, reinterpret_cast<LPCWCH>(src), static_cast<int>(count_src), NULL, 0, lpDefaultChar, NULL);
					size_t offset = dst.size();
					dst.resize(offset + static_cast<size_t>(cch));
					cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, reinterpret_cast<LPCWCH>(src), static_cast<int>(count_src), &dst[offset], cch, lpDefaultChar, NULL);
					dst.resize(offset + (count_src != SIZE_MAX ? strnlen(&dst[offset], cch) : static_cast<size_t>(cch) - 1));
					return;
				}
				throw std::system_error(dwResult, std::system_category(), "WideCharToMultiByte failed");
			}

#pragma warning(suppress: 4127) // Can't use precompiler #if on template arguments, using "if" makes MSVC warnings.
			if constexpr (sizeof(T_from) == sizeof(char) && sizeof(T_to) == sizeof(char)) {
				stdex_assert(count_src < INT_MAX || count_src == SIZE_MAX);
				LPCCH lpDefaultChar = m_to_wincp == CP_UTF8 || m_to_wincp == CP_UTF7 ? NULL : &m_invalid;

				// Try to convert to stack buffer first.
				DWORD dwResult;
				WCHAR szStackBufferMBWC[512 / sizeof(WCHAR)];
#pragma warning(suppress: 6387) // Testing indicates src may be NULL when count_src is also 0. Is SAL of the lpMultiByteStr parameter wrong?
				int cch = MultiByteToWideChar(m_from_wincp, 0, reinterpret_cast<LPCCH>(src), static_cast<int>(count_src), szStackBufferMBWC, _countof(szStackBufferMBWC));
				if (cch) {
					// Append from stack.
					size_t count_inter = count_src != SIZE_MAX ? wcsnlen(szStackBufferMBWC, cch) : static_cast<size_t>(cch) - 1;
					stdex_assert(count_inter < INT_MAX);

					// Try to convert to stack buffer first.
					CHAR szStackBufferWCMB[512 / sizeof(CHAR)];
#pragma warning(suppress: 6387) // Testing indicates szStackBufferMBWC may be NULL when count_inter is also 0. Is SAL of the lpWideCharStr parameter wrong?
					cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, szStackBufferMBWC, static_cast<int>(count_inter), szStackBufferWCMB, _countof(szStackBufferWCMB), lpDefaultChar, NULL);
					if (cch) {
						// Copy from stack. Be careful not to include zero terminator.
						dst.append(reinterpret_cast<const T_to*>(szStackBufferWCMB), strnlen(szStackBufferWCMB, cch));
						return;
					}
					dwResult = GetLastError();
					if (dwResult == ERROR_INSUFFICIENT_BUFFER) {
						// Query the required output size. Allocate buffer. Then convert again.
						cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, szStackBufferMBWC, static_cast<int>(count_inter), NULL, 0, lpDefaultChar, NULL);
						size_t offset = dst.size();
						dst.resize(offset + cch);
						cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, szStackBufferMBWC, static_cast<int>(count_inter), &dst[offset], cch, lpDefaultChar, NULL);
						dst.resize(offset + strnlen(&dst[offset], cch));
						return;
					}
					throw std::system_error(dwResult, std::system_category(), "WideCharToMultiByte failed");
				}
				dwResult = GetLastError();
				if (dwResult == ERROR_INSUFFICIENT_BUFFER) {
					// Query the required output size. Allocate buffer. Then convert again.
					cch = MultiByteToWideChar(m_from_wincp, 0, reinterpret_cast<LPCCH>(src), static_cast<int>(count_src), NULL, 0);
					std::unique_ptr<WCHAR[]> szBufferMBWC(new WCHAR[cch]);
					cch = MultiByteToWideChar(m_from_wincp, 0, reinterpret_cast<LPCCH>(src), static_cast<int>(count_src), szBufferMBWC.get(), cch);
					size_t count_inter = count_src != SIZE_MAX ? wcsnlen(szBufferMBWC.get(), cch) : static_cast<size_t>(cch) - 1;

					// Query the required output size. Allocate buffer. Then convert again.
					cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, szBufferMBWC.get(), static_cast<int>(count_inter), NULL, 0, lpDefaultChar, NULL);
					size_t offset = dst.size();
					dst.resize(offset + cch);
					cch = WideCharToMultiByte(m_to_wincp, dwFlagsWCMB, szBufferMBWC.get(), static_cast<int>(count_inter), &dst[offset], cch, lpDefaultChar, NULL);
					dst.resize(offset + strnlen(&dst[offset], cch));
					return;
				}
				throw std::system_error(dwResult, std::system_category(), "MultiByteToWideChar failed");
			}
#else
			dst.reserve(dst.size() + count_src);
			T_to buf[1024 / sizeof(T_to)];
			size_t src_size = stdex::mul(sizeof(T_from), count_src);
			for (;;) {
				T_to* output = &buf[0];
				size_t output_size = sizeof(buf);
				errno = 0;
				iconv(m_handle, const_cast<char**>(reinterpret_cast<const char**>(&src)), &src_size, reinterpret_cast<char**>(&output), &output_size);
				dst.append(buf, reinterpret_cast<T_to*>(reinterpret_cast<char*>(buf) + sizeof(buf) - output_size));
				if (!errno)
					break;
				if (errno == E2BIG)
					continue;
				if (errno == EILSEQ) {
					dst.append(1, m_invalid);
					++src; src_size -= sizeof(T_from);
					continue;
				}
				throw std::system_error(errno, std::system_category(), "iconv failed");
			}
#endif
		}

		///
		/// Convert string and append to string
		///
		/// \param[in,out] dst        String to append converted string to
		/// \param[in]     src        Zero-terminated string to convert
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		void strcat(
			_Inout_ std::basic_string<T_to, TR_to, AX_to>& dst,
			_In_z_ const T_from* src)
		{
			strcat(dst, src, SIZE_MAX);
		}

		///
		/// Convert string and append to string
		///
		/// \param[in,out] dst        String to append converted string to
		/// \param[in]     src        String to convert
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		void strcat(
			_Inout_ std::basic_string<T_to, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<T_from, std::char_traits<T_from>> src)
		{
			strcat(dst, src.data(), src.size());
		}

		///
		/// Convert string
		///
		/// \param[in,out] dst        String to write converted string to
		/// \param[in]     src        String to convert
		/// \param[in]     count_src  String to convert code unit limit
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		void strcpy(
			_Inout_ std::basic_string<T_to, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const T_from* src, _In_ size_t count_src)
		{
			dst.clear();
			strcat(dst, src, count_src);
		}

		///
		/// Convert string
		///
		/// \param[in,out] dst        String to write converted string to
		/// \param[in]     src        Zero-terminated string to convert
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		void strcpy(
			_Inout_ std::basic_string<T_to, TR_to, AX_to>& dst,
			_In_z_ const T_from* src)
		{
			strcpy(dst, src, SIZE_MAX);
		}

		///
		/// Convert string
		///
		/// \param[in,out] dst        String to write converted string to
		/// \param[in]     src        String to convert
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		void strcpy(
			_Inout_ std::basic_string<T_to, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<T_from, std::char_traits<T_from>> src)
		{
			strcpy(dst, src.data(), src.size());
		}

		///
		/// Return converted string
		///
		/// \param[in]     src        String to convert
		/// \param[in]     count_src  String to convert code unit limit
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		std::basic_string<T_to, TR_to, AX_to> convert(_In_reads_or_z_opt_(count_src) const T_from* src, _In_ size_t count_src)
		{
			std::basic_string<T_to, TR_to, AX_to> dst;
			strcat(dst, src, count_src);
			return dst;
		}

		///
		/// Return converted string
		///
		/// \param[in]     src        Zero-terminated string to convert
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		std::basic_string<T_to, TR_to, AX_to> convert(_In_z_ const T_from* src)
		{
			return convert(src, SIZE_MAX);
		}

		///
		/// Return converted string
		///
		/// \param[in]     src        String to convert
		///
		template <class TR_to = std::char_traits<T_to>, class AX_to = std::allocator<T_to>>
		std::basic_string<T_to, TR_to, AX_to> convert(_In_ const std::basic_string_view<T_from, std::char_traits<T_from>> src)
		{
			return convert(src.data(), src.size());
		}

		void clear()
		{
#ifndef _WIN32
			iconv(m_handle, NULL, NULL, NULL, NULL);
#endif
		}

		static charset_id system_charset()
		{
#ifdef _WIN32
			return static_cast<charset_id>(GetACP());
#else
			return charset_from_name(nl_langinfo(CODESET));
#endif
		}

#ifdef _WIN32
	protected:
		static UINT to_encoding(_In_ charset_id charset)
		{
			return
				charset == charset_id::system ? GetACP() :
				charset == charset_id::oem ? GetOEMCP() :
				static_cast<UINT>(charset);
		}

	protected:
		UINT m_from_wincp, m_to_wincp;
#else
	protected:
		static const char* to_encoding(_In_ charset_id charset)
		{
			static const char* const encodings[static_cast<std::underlying_type_t<charset_id>>(charset_id::_max)] = {
				"",         // system
				"ASCII",    // ascii
				"UTF-7",    // utf7
				"UTF-8",    // utf8
#if BYTE_ORDER == BIG_ENDIAN
				"UTF-16BE", // utf16
				"UTF-32BE", // utf32
#else
				"UTF-16LE", // utf16
				"UTF-32LE", // utf32
#endif
				"CP1250",   // windows1250
				"CP1251",   // windows1251
				"CP1252",   // windows1252
			};
			return
				charset == charset_id::system ? nl_langinfo(CODESET) :
				encodings[static_cast<std::underlying_type_t<charset_id>>(charset)];
		}

	protected:
		iconv_t m_handle;
#endif
	};

	///
	/// Convert string to Unicode (UTF-16 on Windows, UTF-32 elsewhere) and append to string
	///
	/// \note A temporary charset_encoder is constructed on every call. For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to append Unicode to
	/// \param[in]     src        String
	/// \param[in]     count_src  String code unit limit
	/// \param[in]     charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<wchar_t>, class AX_to = std::allocator<wchar_t>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcat(
			_Inout_ std::basic_string<wchar_t, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const char* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		charset_encoder<char, wchar_t>(charset, wchar_t_charset).strcat(dst, src, count_src);
	}

	///
	/// Convert string to Unicode (UTF-16 on Windows, UTF-32 elsewhere) and append to string
	///
	/// Deprecated name; forwards to stdex::strcat with the same arguments.
	///
	/// \param[in,out] dst        String to append Unicode to
	/// \param[in]     src        String
	/// \param[in]     count_src  String code unit limit
	/// \param[in]     charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<wchar_t>, class AX_to = std::allocator<wchar_t>>
	_Deprecated_("Use stdex::strcat")
		inline void str2wstr(
			_Inout_ std::basic_string<wchar_t, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const char* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		strcat(dst, src, count_src, charset);
	}

	///
	/// Convert string to Unicode (UTF-16 on Windows, UTF-32 elsewhere) and append to string
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to append Unicode to
	/// \param[in]     src        String
	/// \param[in]     charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<wchar_t>, class AX_to = std::allocator<wchar_t>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcat(
			_Inout_ std::basic_string<wchar_t, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<char, std::char_traits<char>> src,
			_In_ charset_id charset = charset_id::system)
	{
		strcat(dst, src.data(), src.size(), charset);
	}

	///
	/// Convert string to Unicode (UTF-16 on Windows, UTF-32 elsewhere) and append to string
	///
	/// Deprecated name; forwards to stdex::strcat with the same arguments.
	///
	/// \param[in,out] dst        String to append Unicode to
	/// \param[in]     src        String
	/// \param[in]     charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<wchar_t>, class AX_to = std::allocator<wchar_t>>
	_Deprecated_("Use stdex::strcat")
		inline void str2wstr(
			_Inout_ std::basic_string<wchar_t, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<char, std::char_traits<char>> src,
			_In_ charset_id charset = charset_id::system)
	{
		strcat(dst, src, charset);
	}

	///
	/// Convert string to Unicode (UTF-16 on Windows, UTF-32 elsewhere)
	///
	/// Clears `dst` first, then appends the converted string.
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to write Unicode to
	/// \param[in]     src        String
	/// \param[in]     count_src  String code unit limit
	/// \param[in]     charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<wchar_t>, class AX_to = std::allocator<wchar_t>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcpy(
			_Inout_ std::basic_string<wchar_t, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const char* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		dst.clear();
		strcat(dst, src, count_src, charset);
	}

	///
	/// Convert string to Unicode (UTF-16 on Windows, UTF-32 elsewhere)
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to write Unicode to
	/// \param[in]     src        String
	/// \param[in]     charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<wchar_t>, class AX_to = std::allocator<wchar_t>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcpy(
			_Inout_ std::basic_string<wchar_t, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<char, std::char_traits<char>> src,
			_In_ charset_id charset = charset_id::system)
	{
		strcpy(dst, src.data(), src.size(), charset);
	}

	///
	/// Convert string to Unicode string (UTF-16 on Windows, UTF-32 elsewhere)
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in]  src        String. Must be zero-terminated.
	/// \param[in]  charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	/// \return Unicode string
	///
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline std::wstring str2wstr(
			_In_z_ const char* src,
			_In_ charset_id charset = charset_id::system)
	{
		std::wstring dst;
		// SIZE_MAX as the limit: convert up to the zero terminator.
		strcat(dst, src, SIZE_MAX, charset);
		return dst;
	}

	///
	/// Convert string to Unicode string (UTF-16 on Windows, UTF-32 elsewhere)
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in]  src        String
	/// \param[in]  count_src  String code unit limit
	/// \param[in]  charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	/// \return Unicode string
	///
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline std::wstring str2wstr(
			_In_reads_or_z_opt_(count_src) const char* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		std::wstring dst;
		strcat(dst, src, count_src, charset);
		return dst;
	}

	///
	/// Convert string to Unicode string (UTF-16 on Windows, UTF-32 elsewhere)
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in]  src        String
	/// \param[in]  charset    Charset of `src` (stdex::charset_id::system - system default)
	///
	/// \return Unicode string
	///
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline std::wstring str2wstr(
			_In_ const std::basic_string_view<char, std::char_traits<char>> src,
			_In_ charset_id charset = charset_id::system)
	{
		return str2wstr(src.data(), src.size(), charset);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to the given charset and append to string
	///
	/// \note A temporary charset_encoder is constructed on every call. For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to append converted string to
	/// \param[in]     src        Unicode string
	/// \param[in]     count_src  Unicode string code unit limit
	/// \param[in]     charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<char>, class AX_to = std::allocator<char>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcat(
			_Inout_ std::basic_string<char, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		charset_encoder<wchar_t, char>(wchar_t_charset, charset).strcat(dst, src, count_src);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to the given charset and append to string
	///
	/// Deprecated name; forwards to stdex::strcat with the same arguments.
	///
	/// \param[in,out] dst        String to append converted string to
	/// \param[in]     src        Unicode string
	/// \param[in]     count_src  Unicode string code unit limit
	/// \param[in]     charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<char>, class AX_to = std::allocator<char>>
	_Deprecated_("Use stdex::strcat")
		inline void wstr2str(
			_Inout_ std::basic_string<char, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		strcat(dst, src, count_src, charset);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to the given charset and append to string
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to append converted string to
	/// \param[in]     src        Unicode string
	/// \param[in]     charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<char>, class AX_to = std::allocator<char>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcat(
			_Inout_ std::basic_string<char, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src,
			_In_ charset_id charset = charset_id::system)
	{
		strcat(dst, src.data(), src.size(), charset);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to the given charset and append to string
	///
	/// Deprecated name; forwards to stdex::strcat with the same arguments.
	///
	/// \param[in,out] dst        String to append converted string to
	/// \param[in]     src        Unicode string
	/// \param[in]     charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<char>, class AX_to = std::allocator<char>>
	_Deprecated_("Use stdex::strcat")
		inline void wstr2str(
			_Inout_ std::basic_string<char, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src,
			_In_ charset_id charset = charset_id::system)
	{
		strcat(dst, src, charset);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to the given charset
	///
	/// Clears `dst` first, then appends the converted string.
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to write converted string to
	/// \param[in]     src        Unicode string
	/// \param[in]     count_src  Unicode string code unit limit
	/// \param[in]     charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<char>, class AX_to = std::allocator<char>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcpy(
			_Inout_ std::basic_string<char, TR_to, AX_to>& dst,
			_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		dst.clear();
		strcat(dst, src, count_src, charset);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to the given charset
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in,out] dst        String to write converted string to
	/// \param[in]     src        Unicode string
	/// \param[in]     charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	template <class TR_to = std::char_traits<char>, class AX_to = std::allocator<char>>
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline void strcpy(
			_Inout_ std::basic_string<char, TR_to, AX_to>& dst,
			_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src,
			_In_ charset_id charset = charset_id::system)
	{
		strcpy(dst, src.data(), src.size(), charset);
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to string
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in]  src        Unicode string. Must be zero-terminated.
	/// \param[in]  charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	/// \return String
	///
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline std::string wstr2str(
			_In_z_ const wchar_t* src,
			_In_ charset_id charset = charset_id::system)
	{
		std::string dst;
		// SIZE_MAX as the limit: convert up to the zero terminator.
		strcat(dst, src, SIZE_MAX, charset);
		return dst;
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to string
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in]  src        Unicode string
	/// \param[in]  count_src  Unicode string code unit limit
	/// \param[in]  charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	/// \return String
	///
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline std::string wstr2str(
			_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src,
			_In_ charset_id charset = charset_id::system)
	{
		std::string dst;
		strcat(dst, src, count_src, charset);
		return dst;
	}

	///
	/// Convert Unicode string (UTF-16 on Windows, UTF-32 elsewhere) to string
	///
	/// \note For better performance, consider a reusable charset_encoder.
	///
	/// \param[in]  src        Unicode string
	/// \param[in]  charset    Charset to convert to (stdex::charset_id::system - system default)
	///
	/// \return String
	///
#ifndef _WIN32
	_Deprecated_("For better performance, consider a reusable charset_encoder")
#endif
		inline std::string wstr2str(
			_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src,
			_In_ charset_id charset = charset_id::system)
	{
		return wstr2str(src.data(), src.size(), charset);
	}

#ifdef _WIN32
	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15 and append to string
	///
	/// The string is normalized to form C with NormalizeString(). When normalization fails
	/// (for example on invalid Unicode in `src`), `src` is appended to `dst` unchanged.
	///
	/// \param[in,out] dst        String to append normalized string to
	/// \param[in]     src        String to normalize
	/// \param[in]     count_src  String to normalize code unit limit
	///
	/// \return Number of code units excluding zero terminator in the dst string after the operation.
	///
	template <class TR = std::char_traits<wchar_t>, class AX = std::allocator<wchar_t>>
	size_t normalizecat(
		_Inout_ std::basic_string<wchar_t, TR, AX>& dst,
		_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src)
	{
		count_src = strnlen(src, count_src);
		if (!count_src)
			return dst.size(); // Nothing to append. Also keeps a NULL src away from NormalizeString().
		stdex_assert(count_src + 1 < INT_MAX);
		const size_t count_dst = dst.size();

		// Start with room for the source length plus one code unit. The whole output area is
		// made part of the string, so NormalizeString() never writes into the string's zero
		// terminator slot.
		size_t capacity = count_src + 1;
		for (int attempt = 0; attempt < 10 && capacity < static_cast<size_t>(INT_MAX); ++attempt) {
			dst.resize(count_dst + capacity);
			int r = NormalizeString(NormalizationC, src, static_cast<int>(count_src), &dst[count_dst], static_cast<int>(capacity));
			if (r > 0) {
				dst.resize(count_dst + static_cast<size_t>(r));
				return dst.size();
			}
			// Zero is a failure too: it is what invalid input at index 0 returns.
			if (r == 0 || GetLastError() != ERROR_INSUFFICIENT_BUFFER)
				break;
			// The buffer was too small: the negated return value is the new size estimate.
			const size_t suggested = static_cast<size_t>(-static_cast<long long>(r));
			capacity = suggested > capacity ? suggested : capacity * 2;
		}

		// Best effort: append the source as it is.
		dst.resize(count_dst);
		dst.append(src, count_src);
		return dst.size();
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15 and append to string
	///
	/// The array length `N` is passed on as the code unit limit.
	///
	/// \param[in,out] dst  String to append normalized string to
	/// \param[in]     src  String to normalize
	///
	/// \return Number of code units excluding zero terminator in the dst string after the operation.
	///
	template <size_t N, class TR = std::char_traits<wchar_t>, class AX = std::allocator<wchar_t>>
	size_t normalizecat(
		_Inout_ std::basic_string<wchar_t, TR, AX>& dst,
		_In_ const wchar_t (&src)[N])
	{
		return normalizecat(dst, src, N);
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15 and append to string
	///
	/// Forwards the view's data pointer and size to the pointer-and-limit overload.
	///
	/// \param[in,out] dst  String to append normalized string to
	/// \param[in]     src  String to normalize
	///
	/// \return Number of code units excluding zero terminator in the dst string after the operation.
	///
	template <class TR_dst = std::char_traits<wchar_t>, class AX_dst = std::allocator<wchar_t>>
	size_t normalizecat(
		_Inout_ std::basic_string<wchar_t, TR_dst, AX_dst>& dst,
		_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src)
	{
		return normalizecat(dst, src.data(), src.size());
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15 and assign to string
	///
	/// Clears `dst` first, then appends the normalized string with normalizecat().
	///
	/// \param[in,out] dst        String to assign normalized string to
	/// \param[in]     src        String to normalize
	/// \param[in]     count_src  String to normalize code unit limit
	///
	/// \return Number of code units excluding zero terminator in the dst string after the operation.
	///
	template <class TR = std::char_traits<wchar_t>, class AX = std::allocator<wchar_t>>
	size_t normalize(
		_Inout_ std::basic_string<wchar_t, TR, AX>& dst,
		_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src)
	{
		dst.clear();
		return normalizecat(dst, src, count_src);
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15 and assign to string
	///
	/// The array length `N` is passed on as the code unit limit.
	///
	/// \param[in,out] dst  String to assign normalized string to
	/// \param[in]     src  String to normalize
	///
	/// \return Number of code units excluding zero terminator in the dst string after the operation.
	///
	template <size_t N, class TR = std::char_traits<wchar_t>, class AX = std::allocator<wchar_t>>
	size_t normalize(
		_Inout_ std::basic_string<wchar_t, TR, AX>& dst,
		_In_ const wchar_t(&src)[N])
	{
		return normalize(dst, src, N);
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15 and assign to string
	///
	/// Forwards the view's data pointer and size to the pointer-and-limit overload.
	///
	/// \param[in,out] dst  String to assign normalized string to
	/// \param[in]     src  String to normalize
	///
	/// \return Number of code units excluding zero terminator in the dst string after the operation.
	///
	template <class TR_dst = std::char_traits<wchar_t>, class AX_dst = std::allocator<wchar_t>>
	size_t normalize(
		_Inout_ std::basic_string<wchar_t, TR_dst, AX_dst>& dst,
		_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src)
	{
		return normalize(dst, src.data(), src.size());
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15
	///
	/// Builds the result by appending to an empty string with normalizecat().
	///
	/// \param[in] src        String to normalize
	/// \param[in] count_src  String to normalize code unit limit
	///
	/// \return Normalized string
	///
	inline std::wstring normalize(_In_reads_or_z_opt_(count_src) const wchar_t* src, _In_ size_t count_src)
	{
		std::wstring dst;
		normalizecat(dst, src, count_src);
		return dst;
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15
	///
	/// The array length `N` is passed on as the code unit limit.
	///
	/// \param[in] src  String to normalize
	///
	/// \return Normalized string
	///
	template <size_t N>
	std::wstring normalize(_In_ const wchar_t(&src)[N])
	{
		std::wstring dst;
		normalizecat(dst, src, N);
		return dst;
	}

	///
	/// Normalize characters of a text string according to Unicode 4.0 TR#15
	///
	/// Forwards the view's data pointer and size to normalizecat().
	///
	/// \param[in] src  String to normalize
	///
	/// \return Normalized string
	///
	inline std::wstring normalize(_In_ const std::basic_string_view<wchar_t, std::char_traits<wchar_t>> src)
	{
		std::wstring dst;
		normalizecat(dst, src.data(), src.size());
		return dst;
	}
#endif
}

#if defined(__GNUC__)
#pragma GCC diagnostic pop
#endif