class.path/path.member/path.charconv.pass.cpp

0b71bf79SMartin Storsjö//===----------------------------------------------------------------------===//
0b71bf79SMartin Storsjö//
0b71bf79SMartin Storsjö// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
0b71bf79SMartin Storsjö// See https://llvm.org/LICENSE.txt for license information.
0b71bf79SMartin Storsjö// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
0b71bf79SMartin Storsjö//
0b71bf79SMartin Storsjö//===----------------------------------------------------------------------===//
0b71bf79SMartin Storsjö
a7f9895cSLouis Dionne// UNSUPPORTED: no-localization
*ac8c9f1eSLouis Dionne// UNSUPPORTED: c++03, c++11, c++14
c352fa74SLouis Dionne// UNSUPPORTED: availability-filesystem-missing
0b71bf79SMartin Storsjö// ADDITIONAL_COMPILE_FLAGS: -D_LIBCPP_DISABLE_DEPRECATION_WARNINGS
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö// <filesystem>
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö// class path
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö// Test constructors, accessors and modifiers that convert from/to various
0b71bf79SMartin Storsjö// character encodings. Constructors and modifiers (append, concat,
0b71bf79SMartin Storsjö// operator/=, operator+=) accept inputs with various character encodings,
0b71bf79SMartin Storsjö// and accessors (*string(), string<>(), u8string()) export the string with
0b71bf79SMartin Storsjö// various encodings.
0b71bf79SMartin Storsjö//
0b71bf79SMartin Storsjö// Some encodings are standardized; char16_t, char32_t and the u8string
0b71bf79SMartin Storsjö// accessor and u8path constructor (and normal functions taking char8_t in
0b71bf79SMartin Storsjö// C++20) convert from/to UTF-16, UTF-32 and UTF-8. wchar_t can be either
0b71bf79SMartin Storsjö// UTF-16 or UTF-32 depending on the size of the wchar_t type, or can be
0b71bf79SMartin Storsjö// left unimplemented.
0b71bf79SMartin Storsjö//
// Plain char is implicitly UTF-8 on POSIX systems. On Windows, plain char
// is supposed to be in the same encoding that the platform's native file
// system APIs consume in the functions that take narrow strings as path
// names.
0b71bf79SMartin Storsjö
*ac8c9f1eSLouis Dionne#include <filesystem>
0b71bf79SMartin Storsjö#include <type_traits>
0b71bf79SMartin Storsjö#include <cassert>
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö#include "test_macros.h"
c352fa74SLouis Dionne
c352fa74SLouis Dionne#ifdef _WIN32
c352fa74SLouis Dionne#  include <windows.h> // SetFileApisToANSI & friends
c352fa74SLouis Dionne#endif
*ac8c9f1eSLouis Dionnenamespace fs = std::filesystem;
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö// Test conversion with strings that fit within the latin1 charset, that fit
0b71bf79SMartin Storsjö// within one code point in UTF-16, and that can be expressible in certain
0b71bf79SMartin Storsjö// one-byte code pages.
0b71bf79SMartin Storsjöstatic void test_latin_unicode()
0b71bf79SMartin Storsjö{
0b71bf79SMartin Storsjö  const char16_t u16str[] = { 0xe5, 0xe4, 0xf6, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32str[] = { 0xe5, 0xe4, 0xf6, 0x00 };
0b71bf79SMartin Storsjö  const char str[] = { char(0xc3), char(0xa5), char(0xc3), char(0xa4), char(0xc3), char(0xb6), 0x00 }; // UTF8, in a regular char string
0b71bf79SMartin Storsjö#if TEST_STD_VER > 17 && defined(__cpp_lib_char8_t)
0b71bf79SMartin Storsjö  const char8_t u8str[] = { 0xc3, 0xa5, 0xc3, 0xa4, 0xc3, 0xb6, 0x00 };
0b71bf79SMartin Storsjö#else
0b71bf79SMartin Storsjö  const char u8str[] = { char(0xc3), char(0xa5), char(0xc3), char(0xa4), char(0xc3), char(0xb6), 0x00 };
0b71bf79SMartin Storsjö#endif
f4c1258dSLouis Dionne#ifndef TEST_HAS_NO_WIDE_CHARACTERS
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0xe5, 0xe4, 0xf6, 0x00 };
0b71bf79SMartin Storsjö#endif
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö  // Test well-defined conversion between UTF-8, UTF-16 and UTF-32
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u16str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö    assert(p.string<char16_t>() == u16str);
0b71bf79SMartin Storsjö    assert(p.string<char32_t>() == u32str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u32str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö    assert(p.string<char16_t>() == u16str);
0b71bf79SMartin Storsjö    assert(p.string<char32_t>() == u32str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p = fs::u8path(str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö    assert(p.string<char16_t>() == u16str);
0b71bf79SMartin Storsjö    assert(p.string<char32_t>() == u32str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#if TEST_STD_VER > 17 && defined(__cpp_lib_char8_t)
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    // In C++20, the path constructor can unambiguously handle UTF-8 input,
0b71bf79SMartin Storsjö    // even if the plain char constructor would treat it as something else.
0b71bf79SMartin Storsjö    const fs::path p(u8str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö    assert(p.string<char8_t>() == u8str);
0b71bf79SMartin Storsjö    assert(p.string<char16_t>() == u16str);
0b71bf79SMartin Storsjö    assert(p.string<char32_t>() == u32str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  // Check reading various inputs with string<char8_t>()
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u16str);
0b71bf79SMartin Storsjö    assert(p.string<char8_t>() == u8str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u32str);
0b71bf79SMartin Storsjö    assert(p.string<char8_t>() == u8str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p = fs::u8path(str);
0b71bf79SMartin Storsjö    assert(p.string<char8_t>() == u8str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#endif
f4c1258dSLouis Dionne#ifndef TEST_HAS_NO_WIDE_CHARACTERS
0b71bf79SMartin Storsjö  // Test conversion to/from wchar_t.
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u16str);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö    assert(p.string<wchar_t>() == wstr);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p = fs::u8path(str);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö    assert(p.string<wchar_t>() == wstr);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(wstr);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö    assert(p.string<wchar_t>() == wstr);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#endif // TEST_HAS_NO_WIDE_CHARACTERS
0b71bf79SMartin Storsjö#ifndef _WIN32
0b71bf79SMartin Storsjö  // Test conversion to/from regular char-based string. On POSIX, this
0b71bf79SMartin Storsjö  // is implied to convert to/from UTF-8.
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(str);
0b71bf79SMartin Storsjö    assert(p.string() == str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.string<char>() == str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u16str);
0b71bf79SMartin Storsjö    assert(p.string() == str);
0b71bf79SMartin Storsjö    assert(p.string<char>() == str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#else
0b71bf79SMartin Storsjö  // On windows, the narrow char-based input/output is supposed to be
0b71bf79SMartin Storsjö  // in the charset that narrow file IO APIs use. This can either be the
0b71bf79SMartin Storsjö  // current active code page (ACP) or the OEM code page, exposed by
0b71bf79SMartin Storsjö  // the AreFileApisANSI() function, and settable with SetFileApisToANSI() and
0b71bf79SMartin Storsjö  // SetFileApisToOEM(). We can't set which codepage is active within
0b71bf79SMartin Storsjö  // the process, but for some specific known ones, we can check if they
0b71bf79SMartin Storsjö  // behave as expected.
0b71bf79SMartin Storsjö  SetFileApisToANSI();
0b71bf79SMartin Storsjö  if (GetACP() == 1252) {
0b71bf79SMartin Storsjö    const char latin1[] = { char(0xe5), char(0xe4), char(0xf6), 0x00 };
0b71bf79SMartin Storsjö    {
0b71bf79SMartin Storsjö      const fs::path p(wstr);
0b71bf79SMartin Storsjö      assert(p.string() == latin1);
0b71bf79SMartin Storsjö      assert(p.string<char>() == latin1);
0b71bf79SMartin Storsjö    }
0b71bf79SMartin Storsjö    {
0b71bf79SMartin Storsjö      const fs::path p(latin1);
0b71bf79SMartin Storsjö      assert(p.string() == latin1);
0b71bf79SMartin Storsjö      assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö      assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö      assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö      assert(p.string<char>() == latin1);
0b71bf79SMartin Storsjö      assert(p.string<wchar_t>() == wstr);
0b71bf79SMartin Storsjö    }
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  SetFileApisToOEM();
0b71bf79SMartin Storsjö  if (GetOEMCP() == 850 || GetOEMCP() == 437) {
0b71bf79SMartin Storsjö    // These chars are identical in both CP 850 and 437
0b71bf79SMartin Storsjö    const char cp850[] = { char(0x86), char(0x84), char(0x94), 0x00 };
0b71bf79SMartin Storsjö    {
0b71bf79SMartin Storsjö      const fs::path p(wstr);
0b71bf79SMartin Storsjö      assert(p.string() == cp850);
0b71bf79SMartin Storsjö      assert(p.string<char>() == cp850);
0b71bf79SMartin Storsjö    }
0b71bf79SMartin Storsjö    {
0b71bf79SMartin Storsjö      const fs::path p(cp850);
0b71bf79SMartin Storsjö      assert(p.string() == cp850);
0b71bf79SMartin Storsjö      assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö      assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö      assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö      assert(p.string<char>() == cp850);
0b71bf79SMartin Storsjö      assert(p.string<wchar_t>() == wstr);
0b71bf79SMartin Storsjö    }
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#endif
0b71bf79SMartin Storsjö}
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö// Test conversion with strings that don't fit within one UTF-16 code point.
0b71bf79SMartin Storsjö// Here, wchar_t can be either UTF-16 or UTF-32 depending on the size on the
0b71bf79SMartin Storsjö// particular platform.
0b71bf79SMartin Storsjöstatic void test_wide_unicode()
0b71bf79SMartin Storsjö{
0b71bf79SMartin Storsjö  const char16_t u16str[] = { 0xd801, 0xdc37, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32str[] = { 0x10437, 0x00 };
0b71bf79SMartin Storsjö#if TEST_STD_VER > 17 && defined(__cpp_lib_char8_t)
0b71bf79SMartin Storsjö  const char8_t u8str[] = { 0xf0, 0x90, 0x90, 0xb7, 0x00 };
0b71bf79SMartin Storsjö#else
0b71bf79SMartin Storsjö  const char u8str[] = { char(0xf0), char(0x90), char(0x90), char(0xb7), 0x00 };
0b71bf79SMartin Storsjö#endif
0b71bf79SMartin Storsjö  const char str[] = { char(0xf0), char(0x90), char(0x90), char(0xb7), 0x00 };
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p = fs::u8path(str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u16str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u32str);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#if !defined(TEST_HAS_NO_WIDE_CHARACTERS) && defined(__SIZEOF_WCHAR_T__)
0b71bf79SMartin Storsjö# if __SIZEOF_WCHAR_T__ == 2
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0xd801, 0xdc37, 0x00 };
0b71bf79SMartin Storsjö# else
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0x10437, 0x00 };
0b71bf79SMartin Storsjö# endif
0b71bf79SMartin Storsjö  // Test conversion to/from wchar_t.
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p = fs::u8path(str);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u16str);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(u32str);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const fs::path p(wstr);
0b71bf79SMartin Storsjö    assert(p.u8string() == u8str);
0b71bf79SMartin Storsjö    assert(p.u16string() == u16str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32str);
0b71bf79SMartin Storsjö    assert(p.wstring() == wstr);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#endif // !defined(TEST_HAS_NO_WIDE_CHARACTERS) && defined(__SIZEOF_WCHAR_T__)
0b71bf79SMartin Storsjö}
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö// Test appending paths in different encodings.
0b71bf79SMartin Storsjöstatic void test_append()
0b71bf79SMartin Storsjö{
0b71bf79SMartin Storsjö  const char16_t u16str[] = { 0xd801, 0xdc37, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32str[] = { 0x10437, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32ref[] = { 0x10437, fs::path::preferred_separator, 0x10437, fs::path::preferred_separator, 0x10437, 0x00 };
0b71bf79SMartin Storsjö  const char str[] = { char(0xf0), char(0x90), char(0x90), char(0xb7), 0x00 };
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    fs::path p = fs::u8path(str) / u16str / u32str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö    p = fs::u8path(str).append(u16str).append(u32str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö    p = fs::u8path(str);
0b71bf79SMartin Storsjö    p /= u16str;
0b71bf79SMartin Storsjö    p /= u32str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#if !defined(TEST_HAS_NO_WIDE_CHARACTERS) && defined(__SIZEOF_WCHAR_T__)
0b71bf79SMartin Storsjö# if __SIZEOF_WCHAR_T__ == 2
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0xd801, 0xdc37, 0x00 };
0b71bf79SMartin Storsjö# else
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0x10437, 0x00 };
0b71bf79SMartin Storsjö# endif
0b71bf79SMartin Storsjö  // Test conversion from wchar_t.
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    fs::path p = fs::path(u16str) / wstr / u32str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö    p = fs::path(u16str).append(wstr).append(u32str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p /= wstr;
0b71bf79SMartin Storsjö    p /= u32str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#endif // !defined(TEST_HAS_NO_WIDE_CHARACTERS) && defined(__SIZEOF_WCHAR_T__)
0b71bf79SMartin Storsjö}
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjöstatic void test_concat()
0b71bf79SMartin Storsjö{
0b71bf79SMartin Storsjö  const char16_t u16str[] = { 0xd801, 0xdc37, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32str[] = { 0x10437, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32ref[] = { 0x10437, 0x10437, 0x10437, 0x00 };
0b71bf79SMartin Storsjö  const char str[] = { char(0xf0), char(0x90), char(0x90), char(0xb7), 0x00 };
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    fs::path p = fs::u8path(str);
0b71bf79SMartin Storsjö    p += u16str;
0b71bf79SMartin Storsjö    p += u32str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö    p = fs::u8path(str).concat(u16str).concat(u32str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#if !defined(TEST_HAS_NO_WIDE_CHARACTERS) && defined(__SIZEOF_WCHAR_T__)
0b71bf79SMartin Storsjö# if __SIZEOF_WCHAR_T__ == 2
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0xd801, 0xdc37, 0x00 };
0b71bf79SMartin Storsjö# else
0b71bf79SMartin Storsjö  const wchar_t wstr[] = { 0x10437, 0x00 };
0b71bf79SMartin Storsjö# endif
0b71bf79SMartin Storsjö  // Test conversion from wchar_t.
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    fs::path p = fs::path(u16str);
0b71bf79SMartin Storsjö    p += wstr;
0b71bf79SMartin Storsjö    p += u32str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö    p = fs::path(u16str).concat(wstr).concat(u32str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref);
0b71bf79SMartin Storsjö  }
f4c1258dSLouis Dionne#endif // !defined(TEST_HAS_NO_WIDE_CHARACTERS) && defined(__SIZEOF_WCHAR_T__)
0b71bf79SMartin Storsjö}
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjöstatic void test_append_concat_narrow()
0b71bf79SMartin Storsjö{
0b71bf79SMartin Storsjö  const char16_t u16str[] = { 0xe5, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32ref_append[] = { 0xe5, fs::path::preferred_separator, 0xe5, 0x00 };
0b71bf79SMartin Storsjö  const char32_t u32ref_concat[] = { 0xe5, 0xe5, 0x00 };
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö#if TEST_STD_VER > 17 && defined(__cpp_lib_char8_t)
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const char8_t u8str[] = { 0xc3, 0xa5, 0x00 };
0b71bf79SMartin Storsjö    // In C++20, appends of a char8_t string is unambiguously treated as
0b71bf79SMartin Storsjö    // UTF-8.
0b71bf79SMartin Storsjö    fs::path p = fs::path(u16str) / u8str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).append(u8str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p /= u8str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).concat(u8str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p += u8str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#endif
0b71bf79SMartin Storsjö#ifndef _WIN32
0b71bf79SMartin Storsjö  // Test appending a regular char-based string. On POSIX, this
0b71bf79SMartin Storsjö  // is implied to convert to/from UTF-8.
0b71bf79SMartin Storsjö  {
0b71bf79SMartin Storsjö    const char str[] = { char(0xc3), char(0xa5), 0x00 }; // UTF8, in a regular char string
0b71bf79SMartin Storsjö    fs::path p = fs::path(u16str) / str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).append(str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p /= str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).concat(str);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p += str;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#else
0b71bf79SMartin Storsjö  SetFileApisToANSI();
0b71bf79SMartin Storsjö  if (GetACP() == 1252) {
0b71bf79SMartin Storsjö    const char latin1[] = { char(0xe5), 0x00 };
0b71bf79SMartin Storsjö    fs::path p = fs::path(u16str) / latin1;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).append(latin1);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p /= latin1;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).concat(latin1);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p += latin1;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö  SetFileApisToOEM();
0b71bf79SMartin Storsjö  if (GetOEMCP() == 850 || GetOEMCP() == 437) {
0b71bf79SMartin Storsjö    // This chars is identical in both CP 850 and 437
0b71bf79SMartin Storsjö    const char cp850[] = { char(0x86), 0x00 };
0b71bf79SMartin Storsjö    fs::path p = fs::path(u16str) / cp850;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).append(cp850);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p /= cp850;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_append);
0b71bf79SMartin Storsjö    p = fs::path(u16str).concat(cp850);
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö    p = fs::path(u16str);
0b71bf79SMartin Storsjö    p += cp850;
0b71bf79SMartin Storsjö    assert(p.u32string() == u32ref_concat);
0b71bf79SMartin Storsjö  }
0b71bf79SMartin Storsjö#endif
0b71bf79SMartin Storsjö}
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjöint main(int, char**)
0b71bf79SMartin Storsjö{
0b71bf79SMartin Storsjö  test_latin_unicode();
0b71bf79SMartin Storsjö  test_wide_unicode();
0b71bf79SMartin Storsjö  test_append();
0b71bf79SMartin Storsjö  test_concat();
0b71bf79SMartin Storsjö  test_append_concat_narrow();
0b71bf79SMartin Storsjö
0b71bf79SMartin Storsjö  return 0;
0b71bf79SMartin Storsjö}