first commit

This commit is contained in:
Jose Caban
2025-06-07 11:34:38 -04:00
commit 0eb2d7c07d
4708 changed files with 1500614 additions and 0 deletions

86
extern/ustl/1.5/bvt/bvt16.cc vendored Normal file
View File

@@ -0,0 +1,86 @@
// This file is part of the uSTL library, an STL implementation.
//
// Copyright (c) 2005 by Mike Sharov <msharov@users.sourceforge.net>
// This file is free software, distributed under the MIT License.
#include "stdtest.h"
static void Widen (const string& str, vector<wchar_t>& result)
{
result.clear();
result.resize (str.length());
copy (str.utf8_begin(), str.utf8_end(), result.begin());
}
static void DumpWchars (const vector<wchar_t>& v)
{
foreach (vector<wchar_t>::const_iterator, i, v)
cout.format (" %u", uint32_t(*i));
}
void TestUTF8 (void)
{
cout << "Generating Unicode characters ";
vector<wchar_t> srcChars;
srcChars.resize (0xFFFF);
iota (srcChars.begin(), srcChars.end(), 0);
cout.format ("%zu - %zu\n", size_t(srcChars[0]), size_t(srcChars.back()));
cout << "Encoding to utf8.\n";
string encoded;
encoded.reserve (srcChars.size() * 4);
copy (srcChars, utf8out (back_inserter(encoded)));
static const char c_ProperEncoding[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10 };
if (encoded.compare (encoded.begin(), encoded.begin() + VectorSize(c_ProperEncoding), VectorRange(c_ProperEncoding))) {
cout << "Encoding failed: ";
for (string::const_iterator i = encoded.begin(); i != encoded.begin() + VectorSize(c_ProperEncoding); ++ i)
cout << uint32_t(*i);
cout << endl;
}
cout << "Decoding back.\n";
vector<wchar_t> decChars;
Widen (encoded, decChars);
cout.format ("Comparing.\nsrc = %zu chars, encoded = %zu chars, decoded = %zu\n", srcChars.size(), encoded.size(), decChars.size());
size_t nDiffs = 0;
for (uoff_t i = 0; i < min (srcChars.size(), decChars.size()); ++ i) {
if (srcChars[i] != decChars[i]) {
cout.format ("%u != %u\n", uint32_t(srcChars[i]), uint32_t(decChars[i]));
++ nDiffs;
}
}
cout.format ("%zu differences between src and decoded.\n", nDiffs);
cout << "Testing wide character string::insert\n";
string ws ("1234567890", 10);
ws.insert (ws.find('1'), wchar_t(1234));
static const wchar_t c_WChars[2] = { 3456, 4567 };
ws.insert (ws.find('3'), VectorRange(c_WChars), 2);
ws.insert (ws.find('3'), wchar_t(2345));
ws.insert (ws.size(), wchar_t(5678));
cout.format ("Values[%zu]:", ws.length());
for (string::utf8_iterator j = ws.utf8_begin(); j < ws.utf8_end(); ++ j)
cout.format (" %u", uint32_t(*j));
cout << endl;
cout << "Character offsets:";
for (string::utf8_iterator k = ws.utf8_begin(); k < ws.utf8_end(); ++ k)
cout.format (" %zu", distance (ws.begin(), k.base()));
cout << endl;
cout.format ("Erasing character %zu: ", ws.length() - 1);
ws.erase (ws.wiat(ws.length() - 1), ws.end());
Widen (ws, decChars);
DumpWchars (decChars);
cout << endl;
cout << "Erasing 2 characters after '2': ";
ws.erase (ws.find('2')+1, Utf8Bytes(VectorRange(c_WChars)));
Widen (ws, decChars);
DumpWchars (decChars);
cout << endl;
}
StdBvtMain (TestUTF8)