summaryrefslogtreecommitdiffstats
path: root/src/boost/libs/locale/examples/wboundary.cpp
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-27 18:24:20 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-27 18:24:20 +0000
commit483eb2f56657e8e7f419ab1a4fab8dce9ade8609 (patch)
treee5d88d25d870d5dedacb6bbdbe2a966086a0a5cf /src/boost/libs/locale/examples/wboundary.cpp
parentInitial commit. (diff)
downloadceph-483eb2f56657e8e7f419ab1a4fab8dce9ade8609.tar.xz
ceph-483eb2f56657e8e7f419ab1a4fab8dce9ade8609.zip
Adding upstream version 14.2.21.upstream/14.2.21upstream
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/boost/libs/locale/examples/wboundary.cpp')
-rw-r--r--src/boost/libs/locale/examples/wboundary.cpp104
1 files changed, 104 insertions, 0 deletions
diff --git a/src/boost/libs/locale/examples/wboundary.cpp b/src/boost/libs/locale/examples/wboundary.cpp
new file mode 100644
index 00000000..a14325fa
--- /dev/null
+++ b/src/boost/libs/locale/examples/wboundary.cpp
@@ -0,0 +1,104 @@
+//
+// Copyright (c) 2009-2011 Artyom Beilis (Tonkikh)
+//
+// Distributed under the Boost Software License, Version 1.0. (See
+// accompanying file LICENSE_1_0.txt or copy at
+// http://www.boost.org/LICENSE_1_0.txt)
+//
+
+//
+// ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! !
+//
+// BIG FAT WARNING FOR Microsoft Visual Studio Users
+//
+// YOU NEED TO CONVERT THIS SOURCE FILE ENCODING TO UTF-8 WITH BOM ENCODING.
+//
+// Unfortunately MSVC understands that the source code is encoded as
+// UTF-8 only if you add useless BOM in the beginning.
+//
+// So, before you compile "wide" examples with MSVC, please convert them to text
+// files with BOM. There are two very simple ways to do it:
+//
+// 1. Open file with Notepad and save it from there. It would convert
+// it to file with BOM.
+// 2. In Visual Studio go File->Advances Save Options... and select
+// Unicode (UTF-8 with signature) Codepage 65001
+//
+// Note: once converted to UTF-8 with BOM, this source code would not
+// compile with other compilers, because no-one uses BOM with UTF-8 today
+// because it is absolutely meaningless in context of UTF-8.
+//
+// ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! !
+//
+#include <boost/locale.hpp>
+#include <iostream>
+#include <cassert>
+#include <ctime>
+
+int main()
+{
+ using namespace boost::locale;
+ using namespace std;
+
+ // Create system default locale
+ generator gen;
+ locale loc=gen("");
+ locale::global(loc);
+ wcout.imbue(loc);
+
+ // This is needed to prevent C library to
+ // convert strings to narrow
+ // instead of C++ on some platforms
+ std::ios_base::sync_with_stdio(false);
+
+
+ wstring text=L"Hello World! あにま! Linux2.6 and Windows7 is word and number. שָלוֹם עוֹלָם!";
+
+ wcout<<text<<endl;
+
+ boundary::wssegment_index index(boundary::word,text.begin(),text.end());
+ boundary::wssegment_index::iterator p,e;
+
+ for(p=index.begin(),e=index.end();p!=e;++p) {
+ wcout<<L"Part ["<<*p<<L"] has ";
+ if(p->rule() & boundary::word_number)
+ wcout<<L"number(s) ";
+ if(p->rule() & boundary::word_letter)
+ wcout<<L"letter(s) ";
+ if(p->rule() & boundary::word_kana)
+ wcout<<L"kana character(s) ";
+ if(p->rule() & boundary::word_ideo)
+ wcout<<L"ideographic character(s) ";
+ if(p->rule() & boundary::word_none)
+ wcout<<L"no word characters";
+ wcout<<endl;
+ }
+
+ index.map(boundary::character,text.begin(),text.end());
+
+ for(p=index.begin(),e=index.end();p!=e;++p) {
+ wcout<<L"|" <<*p ;
+ }
+ wcout<<L"|\n\n";
+
+ index.map(boundary::line,text.begin(),text.end());
+
+ for(p=index.begin(),e=index.end();p!=e;++p) {
+ wcout<<L"|" <<*p ;
+ }
+ wcout<<L"|\n\n";
+
+ index.map(boundary::sentence,text.begin(),text.end());
+
+ for(p=index.begin(),e=index.end();p!=e;++p) {
+ wcout<<L"|" <<*p ;
+ }
+ wcout<<"|\n\n";
+
+}
+
+
+// vim: tabstop=4 expandtab shiftwidth=4 softtabstop=4
+
+// boostinspect:noascii
+