summary | refs | log | tree | commit | diff
path: root/lib/utfcpp/v3/samples/docsample.cpp
diff options
context:
space:
mode:
author Alexis Hildebrandt <afh@surryhill.net> 2023-12-07 16:43:46 +0100
committer Alexis Hildebrandt <afh@surryhill.net> 2023-12-10 19:01:27 +0100
commit f017686dd4720bac373e8fcd5b779777a83162ec (patch)
tree 408f1a27aa999bce0646f21c76330e3f252e1c76 /lib/utfcpp/v3/samples/docsample.cpp
parent 3cfad2570d7fe8aa5d88de3797797d695d4fbe06 (diff)
download fork-ledger-f017686dd4720bac373e8fcd5b779777a83162ec.tar.gz
fork-ledger-f017686dd4720bac373e8fcd5b779777a83162ec.tar.bz2
fork-ledger-f017686dd4720bac373e8fcd5b779777a83162ec.zip
utfcpp: Update to 4.0.4
Diffstat (limited to 'lib/utfcpp/v3/samples/docsample.cpp')
-rw-r--r-- lib/utfcpp/v3/samples/docsample.cpp 64
1 files changed, 0 insertions, 64 deletions
diff --git a/lib/utfcpp/v3/samples/docsample.cpp b/lib/utfcpp/v3/samples/docsample.cpp
deleted file mode 100644
index 65338872..00000000
--- a/lib/utfcpp/v3/samples/docsample.cpp
+++ /dev/null
@@ -1,64 +0,0 @@
-#include "../source/utf8.h"
-#include <iostream>
-#include <fstream>
-#include <string>
-#include <vector>
-
-
-using namespace std;
-
-// Sample: for each line of the UTF-8 file argv[1], report invalid encoding, print the
-// length of the valid prefix, and round-trip that prefix through UTF-16. Always returns 0.
-int main(int argc, char** argv)
-{
-    if (argc != 2) {
-        cout << "\nUsage: docsample filename\n";
-        return 0;
-    }
-    const char* test_file_path = argv[1];
-    // Open the test file (must be UTF-8 encoded)
-    ifstream fs8(test_file_path);
-    if (!fs8.is_open()) {
-        cout << "Could not open " << test_file_path << endl;
-        return 0;
-    }
-    unsigned line_count = 1;
-    string line;
-    // Play with all the lines in the file
-    while (getline(fs8, line)) {
-        // check for invalid utf-8 (for a simple yes/no check, there is also utf8::is_valid function)
-#if __cplusplus >= 201103L // C++ 11 or later
-        auto end_it = utf8::find_invalid(line.begin(), line.end());
-#else
-        string::iterator end_it = utf8::find_invalid(line.begin(), line.end());
-#endif // C++ 11
-        const string valid_part(line.begin(), end_it); // well-formed prefix; all that is used below
-        if (end_it != line.end()) {
-            cout << "Invalid UTF-8 encoding detected at line " << line_count << "\n";
-            cout << "This part is fine: " << valid_part << "\n";
-        }
-        // Get the line length (at least for the valid part)
-        ptrdiff_t length = utf8::distance(line.begin(), end_it);
-        cout << "Length of line " << line_count << " is " << length << "\n";
-        // Convert it to utf-16. Pass valid_part, not line: the checked utf8to16 throws on
-        // malformed input, which would abort the program on a line just reported as invalid.
-#if __cplusplus >= 201103L // C++ 11 or later
-        u16string utf16line = utf8::utf8to16(valid_part);
-#else
-        vector<unsigned short> utf16line;
-        utf8::utf8to16(line.begin(), end_it, back_inserter(utf16line));
-#endif // C++ 11
-        // And back to utf-8;
-#if __cplusplus >= 201103L // C++ 11 or later
-        string utf8line = utf8::utf16to8(utf16line);
-#else
-        string utf8line;
-        utf8::utf16to8(utf16line.begin(), utf16line.end(), back_inserter(utf8line));
-#endif // C++ 11
-        // Confirm that the conversion went OK:
-        if (utf8line != valid_part)
-            cout << "Error in UTF-16 conversion at line: " << line_count << "\n";
-        line_count++;
-    }
-    return 0;
-}