summaryrefslogtreecommitdiffstats
path: root/intl/icu/source/data/xml/brkitr
diff options
context:
space:
mode:
Diffstat (limited to 'intl/icu/source/data/xml/brkitr')
-rw-r--r--intl/icu/source/data/xml/brkitr/de.xml20
-rw-r--r--intl/icu/source/data/xml/brkitr/el.xml26
-rw-r--r--intl/icu/source/data/xml/brkitr/en.xml19
-rw-r--r--intl/icu/source/data/xml/brkitr/en_US.xml20
-rw-r--r--intl/icu/source/data/xml/brkitr/en_US_POSIX.xml28
-rw-r--r--intl/icu/source/data/xml/brkitr/es.xml21
-rw-r--r--intl/icu/source/data/xml/brkitr/fi.xml26
-rw-r--r--intl/icu/source/data/xml/brkitr/fr.xml21
-rw-r--r--intl/icu/source/data/xml/brkitr/it.xml21
-rw-r--r--intl/icu/source/data/xml/brkitr/ja.xml278
-rw-r--r--intl/icu/source/data/xml/brkitr/ko.xml42
-rw-r--r--intl/icu/source/data/xml/brkitr/pt.xml21
-rw-r--r--intl/icu/source/data/xml/brkitr/root.xml48
-rw-r--r--intl/icu/source/data/xml/brkitr/ru.xml21
-rw-r--r--intl/icu/source/data/xml/brkitr/sv.xml26
-rw-r--r--intl/icu/source/data/xml/brkitr/zh.xml30
-rw-r--r--intl/icu/source/data/xml/brkitr/zh_Hant.xml30
17 files changed, 698 insertions, 0 deletions
diff --git a/intl/icu/source/data/xml/brkitr/de.xml b/intl/icu/source/data/xml/brkitr/de.xml
new file mode 100644
index 0000000000..581c6a49a2
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/de.xml
@@ -0,0 +1,20 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+
+ See comments on https://unicode-org.atlassian.net/browse/ICU-10750 - this file is needed to emit break iterator rules properly.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="de"/>
+ </identity>
+</ldml>
diff --git a/intl/icu/source/data/xml/brkitr/el.xml b/intl/icu/source/data/xml/brkitr/el.xml
new file mode 100644
index 0000000000..6101bffa3c
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/el.xml
@@ -0,0 +1,26 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="el"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:sentence icu:dependency="sent_el.brk"/>
+ </icu:boundaries>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/en.xml b/intl/icu/source/data/xml/brkitr/en.xml
new file mode 100644
index 0000000000..c10869f186
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/en.xml
@@ -0,0 +1,19 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="en"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/en_US.xml b/intl/icu/source/data/xml/brkitr/en_US.xml
new file mode 100644
index 0000000000..dafa29408f
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/en_US.xml
@@ -0,0 +1,20 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="en"/>
+ <territory type="US"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/en_US_POSIX.xml b/intl/icu/source/data/xml/brkitr/en_US_POSIX.xml
new file mode 100644
index 0000000000..6722b3b761
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/en_US_POSIX.xml
@@ -0,0 +1,28 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="en"/>
+ <territory type="US"/>
+ <variant type="POSIX"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:word icu:dependency="word_POSIX.brk"/>
+ </icu:boundaries>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/es.xml b/intl/icu/source/data/xml/brkitr/es.xml
new file mode 100644
index 0000000000..3ac3031f99
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/es.xml
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+
+ See comments on https://unicode-org.atlassian.net/browse/ICU-10750 - this file is needed to emit break iterator rules properly.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="es"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/fi.xml b/intl/icu/source/data/xml/brkitr/fi.xml
new file mode 100644
index 0000000000..5081e7cd4e
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/fi.xml
@@ -0,0 +1,26 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="fi"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:word icu:dependency="word_fi_sv.brk"/>
+ </icu:boundaries>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/fr.xml b/intl/icu/source/data/xml/brkitr/fr.xml
new file mode 100644
index 0000000000..fea05ffb29
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/fr.xml
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+
+ See comments on https://unicode-org.atlassian.net/browse/ICU-10750 - this file is needed to emit break iterator rules properly.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="fr"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/it.xml b/intl/icu/source/data/xml/brkitr/it.xml
new file mode 100644
index 0000000000..568b4624c7
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/it.xml
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+
+ See comments on https://unicode-org.atlassian.net/browse/ICU-10750 - this file is needed to emit break iterator rules properly.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="it"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/ja.xml b/intl/icu/source/data/xml/brkitr/ja.xml
new file mode 100644
index 0000000000..2e4ffeafd0
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/ja.xml
@@ -0,0 +1,278 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2006-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="ja"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:line icu:dependency="line_normal.brk"/>
+ <icu:line alt="loose" icu:dependency="line_loose_cj.brk"/>
+ <icu:line alt="normal" icu:dependency="line_normal_cj.brk"/>
+ <icu:line alt="strict" icu:dependency="line_cj.brk"/>
+ <icu:line alt="loose_phrase" icu:dependency="line_loose_phrase_cj.brk"/>
+ <icu:line alt="normal_phrase" icu:dependency="line_normal_phrase_cj.brk"/>
+ <icu:line alt="strict_phrase" icu:dependency="line_phrase_cj.brk"/>
+ <icu:line alt="phrase" icu:dependency="line_phrase_cj.brk"/>
+ </icu:boundaries>
+ <icu:extensions>
+ <!--
+ Entries in cjdict.txt categorized as particles (助詞), auxiliary verbs (助動詞),
+ conjugations (活用) and prefixes of them.
+ These entries are connected to the previous words for phrase based line breaking.
+ https://ja.wikipedia.org/wiki/助詞
+ https://ja.wikipedia.org/wiki/助動詞_(国文法)
+ https://ja.wikipedia.org/wiki/活用
+ -->
+ <icu:extension>かい</icu:extension>
+ <icu:extension>かしら</icu:extension>
+ <icu:extension>から</icu:extension>
+ <icu:extension>かれい</icu:extension>
+ <icu:extension>かれつ</icu:extension>
+ <icu:extension>かれる</icu:extension>
+ <icu:extension>かれん</icu:extension>
+ <icu:extension>きり</icu:extension>
+ <icu:extension>くらい</icu:extension>
+ <icu:extension>ぐらい</icu:extension>
+ <icu:extension>けれど</icu:extension>
+ <icu:extension>けれども</icu:extension>
+ <icu:extension>こそ</icu:extension>
+ <icu:extension>さえ</icu:extension>
+ <icu:extension>しか</icu:extension>
+ <icu:extension>した</icu:extension>
+ <icu:extension>ずつ</icu:extension>
+ <icu:extension>せる</icu:extension>
+ <icu:extension>せん</icu:extension>
+ <icu:extension>たい</icu:extension>
+ <icu:extension>たがる</icu:extension>
+ <icu:extension>たく</icu:extension>
+ <icu:extension>たら</icu:extension>
+ <icu:extension>たり</icu:extension>
+ <icu:extension>たれ</icu:extension>
+ <icu:extension>たれる</icu:extension>
+ <icu:extension>だけ</icu:extension>
+ <icu:extension>だに</icu:extension>
+ <icu:extension>だの</icu:extension>
+ <icu:extension>だり</icu:extension>
+ <icu:extension>つつ</icu:extension>
+ <icu:extension>てる</icu:extension>
+ <icu:extension>です</icu:extension>
+ <icu:extension>でも</icu:extension>
+ <icu:extension>ところが</icu:extension>
+ <icu:extension>ところで</icu:extension>
+ <icu:extension>とも</icu:extension>
+ <icu:extension>ない</icu:extension>
+ <icu:extension>なか</icu:extension>
+ <icu:extension>ながら</icu:extension>
+ <icu:extension>なく</icu:extension>
+ <icu:extension>なし</icu:extension>
+ <icu:extension>なぞ</icu:extension>
+ <icu:extension>など</icu:extension>
+ <icu:extension>なら</icu:extension>
+ <icu:extension>なり</icu:extension>
+ <icu:extension>なれる</icu:extension>
+ <icu:extension>なんぞ</icu:extension>
+ <icu:extension>ねる</icu:extension>
+ <icu:extension>ので</icu:extension>
+ <icu:extension>のに</icu:extension>
+ <icu:extension>のみ</icu:extension>
+ <icu:extension>はれる</icu:extension>
+ <icu:extension>ばかり</icu:extension>
+ <icu:extension>へる</icu:extension>
+ <icu:extension>ほど</icu:extension>
+ <icu:extension>まい</icu:extension>
+ <icu:extension>まう</icu:extension>
+ <icu:extension>まし</icu:extension>
+ <icu:extension>ます</icu:extension>
+ <icu:extension>まっ</icu:extension>
+ <icu:extension>まで</icu:extension>
+ <icu:extension>まま</icu:extension>
+ <icu:extension>まれ</icu:extension>
+ <icu:extension>もん</icu:extension>
+ <icu:extension>やら</icu:extension>
+ <icu:extension>やれる</icu:extension>
+ <icu:extension>よう</icu:extension>
+ <icu:extension>より</icu:extension>
+ <icu:extension>らしい</icu:extension>
+ <icu:extension>られる</icu:extension>
+ <icu:extension>れる</icu:extension>
+ <icu:extension>ろう</icu:extension>
+ <icu:extension>わっ</icu:extension>
+ <icu:extension>わな</icu:extension>
+ <icu:extension>わら</icu:extension>
+ <icu:extension>わり</icu:extension>
+ <icu:extension>わる</icu:extension>
+ <icu:extension>われ</icu:extension>
+ <icu:extension>われと</icu:extension>
+ <icu:extension>われる</icu:extension>
+ <icu:extension>わん</icu:extension>
+ <!--
+ Entries added for technical reasons (particle + others).
+ Entries in cjdict.txt, which are compound words starting with the above categories
+ (i.e. particles, auxiliary verbs and conjugations).
+ These entries are connected to the previous words for phrase based line breaking.
+ -->
+ <icu:extension>えたい</icu:extension>
+ <icu:extension>えて</icu:extension>
+ <icu:extension>える</icu:extension>
+ <icu:extension>けた</icu:extension>
+ <icu:extension>けたい</icu:extension>
+ <icu:extension>ける</icu:extension>
+ <icu:extension>させる</icu:extension>
+ <icu:extension>そうだ</icu:extension>
+ <icu:extension>っきゃ</icu:extension>
+ <icu:extension>っきり</icu:extension>
+ <icu:extension>っけ</icu:extension>
+ <icu:extension>っす</icu:extension>
+ <icu:extension>ったらしい</icu:extension>
+ <icu:extension>っちゅう</icu:extension>
+ <icu:extension>って</icu:extension>
+ <icu:extension>っていう</icu:extension>
+ <icu:extension>ってか</icu:extension>
+ <icu:extension>ってな</icu:extension>
+ <icu:extension>っと</icu:extension>
+ <icu:extension>っぱなし</icu:extension>
+ <icu:extension>っぷり</icu:extension>
+ <icu:extension>っぽい</icu:extension>
+ <icu:extension>にあう</icu:extension>
+ <icu:extension>にあがる</icu:extension>
+ <icu:extension>にあたって</icu:extension>
+ <icu:extension>にあたり</icu:extension>
+ <icu:extension>にあたりまして</icu:extension>
+ <icu:extension>にあたります</icu:extension>
+ <icu:extension>にあたる</icu:extension>
+ <icu:extension>において</icu:extension>
+ <icu:extension>におきまして</icu:extension>
+ <icu:extension>における</icu:extension>
+ <icu:extension>にかけ</icu:extension>
+ <icu:extension>にかけて</icu:extension>
+ <icu:extension>にかけまして</icu:extension>
+ <icu:extension>にたいして</icu:extension>
+ <icu:extension>にたいしまして</icu:extension>
+ <icu:extension>にたいします</icu:extension>
+ <icu:extension>にたいする</icu:extension>
+ <icu:extension>について</icu:extension>
+ <icu:extension>につき</icu:extension>
+ <icu:extension>につきまして</icu:extension>
+ <icu:extension>につけ</icu:extension>
+ <icu:extension>につれ</icu:extension>
+ <icu:extension>につれて</icu:extension>
+ <icu:extension>にて</icu:extension>
+ <icu:extension>にとって</icu:extension>
+ <icu:extension>にとり</icu:extension>
+ <icu:extension>にとりまして</icu:extension>
+ <icu:extension>にまつわります</icu:extension>
+ <icu:extension>にまつわる</icu:extension>
+ <icu:extension>にもかかわらず</icu:extension>
+ <icu:extension>にゃ</icu:extension>
+ <icu:extension>によって</icu:extension>
+ <icu:extension>により</icu:extension>
+ <icu:extension>によりまして</icu:extension>
+ <icu:extension>によります</icu:extension>
+ <icu:extension>による</icu:extension>
+ <icu:extension>にわたって</icu:extension>
+ <icu:extension>にわたり</icu:extension>
+ <icu:extension>にわたりまして</icu:extension>
+ <icu:extension>にわたります</icu:extension>
+ <icu:extension>にわたる</icu:extension>
+ <icu:extension>に対し</icu:extension>
+ <icu:extension>に対して</icu:extension>
+ <icu:extension>に対しまして</icu:extension>
+ <icu:extension>に対します</icu:extension>
+ <icu:extension>に対する</icu:extension>
+ <icu:extension>に当たって</icu:extension>
+ <icu:extension>に当たり</icu:extension>
+ <icu:extension>に当たりまして</icu:extension>
+ <icu:extension>に当たります</icu:extension>
+ <icu:extension>に当たる</icu:extension>
+ <icu:extension>に従い</icu:extension>
+ <icu:extension>に従いまして</icu:extension>
+ <icu:extension>に従います</icu:extension>
+ <icu:extension>に従う</icu:extension>
+ <icu:extension>に従って</icu:extension>
+ <icu:extension>に関し</icu:extension>
+ <icu:extension>に関して</icu:extension>
+ <icu:extension>に関しまして</icu:extension>
+ <icu:extension>に関します</icu:extension>
+ <icu:extension>に関する</icu:extension>
+ <icu:extension>に際し</icu:extension>
+ <icu:extension>に際して</icu:extension>
+ <icu:extension>ものの</icu:extension>
+ <icu:extension>ろうし</icu:extension>
+ <icu:extension>ろうと</icu:extension>
+ <icu:extension>われと</icu:extension>
+ <icu:extension>をの</icu:extension>
+ <icu:extension>をめぐって</icu:extension>
+ <icu:extension>をめぐりまして</icu:extension>
+ <icu:extension>をめぐります</icu:extension>
+ <icu:extension>をめぐる</icu:extension>
+ <icu:extension>をもちまして</icu:extension>
+ <icu:extension>をもって</icu:extension>
+ <icu:extension>を以て</icu:extension>
+ <icu:extension>を通して</icu:extension>
+ <icu:extension>を通しまして</icu:extension>
+ <icu:extension>を通じ</icu:extension>
+ <icu:extension>を通じて</icu:extension>
+ <icu:extension>を通じまして</icu:extension>
+ <icu:extension>んじゃ</icu:extension>
+ <icu:extension>んで</icu:extension>
+ <!--
+ Entries added for technical reasons (noun suffix).
+ Entries in cjdict.txt, which are suffixes of nouns.
+ These entries should be connected to the previous (noun) words.
+ -->
+ <icu:extension>々宮</icu:extension>
+ <icu:extension>々家</icu:extension>
+ <icu:extension>え目</icu:extension>
+ <icu:extension>が丘</icu:extension>
+ <icu:extension>が台</icu:extension>
+ <icu:extension>が床</icu:extension>
+ <icu:extension>が浜</icu:extension>
+ <icu:extension>の内</icu:extension>
+ <icu:extension>の山公園</icu:extension>
+ <icu:extension>の峰</icu:extension>
+ <icu:extension>の森</icu:extension>
+ <icu:extension>の沢</icu:extension>
+ <icu:extension>の通り</icu:extension>
+ <icu:extension>の里</icu:extension>
+ <icu:extension>ヵ国</icu:extension>
+ <icu:extension>ヵ年</icu:extension>
+ <icu:extension>ヵ所</icu:extension>
+ <icu:extension>ヵ月</icu:extension>
+ <icu:extension>ヵ村</icu:extension>
+ <icu:extension>ヵ条</icu:extension>
+ <icu:extension>ヶ丘</icu:extension>
+ <icu:extension>ヶ国</icu:extension>
+ <icu:extension>ヶ島</icu:extension>
+ <icu:extension>ヶ年</icu:extension>
+ <icu:extension>ヶ所</icu:extension>
+ <icu:extension>ヶ月</icu:extension>
+ <icu:extension>ヶ村</icu:extension>
+ <icu:extension>ヶ条</icu:extension>
+ <icu:extension>ージ</icu:extension>
+ <icu:extension>ーズ</icu:extension>
+ <icu:extension>ータ</icu:extension>
+ <icu:extension>ード</icu:extension>
+ <icu:extension>ーニャ</icu:extension>
+ <icu:extension>ープランス</icu:extension>
+ <icu:extension>ーユ</icu:extension>
+ <icu:extension>ーランド</icu:extension>
+ <icu:extension>ーリンズ</icu:extension>
+ <icu:extension>ーン</icu:extension>
+ </icu:extensions>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/ko.xml b/intl/icu/source/data/xml/brkitr/ko.xml
new file mode 100644
index 0000000000..5ba204b4f4
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/ko.xml
@@ -0,0 +1,42 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2006-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="ko"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:line icu:dependency="line_normal.brk"/>
+ <icu:line alt="loose" icu:dependency="line_loose_cj.brk"/>
+ <icu:line alt="normal" icu:dependency="line_normal_cj.brk"/>
+ <icu:line alt="strict" icu:dependency="line_cj.brk"/>
+ <icu:line alt="loose_phrase" icu:dependency="line_loose_phrase_cj.brk"/>
+ <icu:line alt="normal_phrase" icu:dependency="line_normal_phrase_cj.brk"/>
+ <icu:line alt="strict_phrase" icu:dependency="line_phrase_cj.brk"/>
+ <icu:line alt="phrase" icu:dependency="line_phrase_cj.brk"/>
+ </icu:boundaries>
+ <!--
+ <icu:extensions>
+ Korean particles should be added here and dictbe.cpp needs to be adjusted
+ once a Korean dictionary is added. Even without a Korean dictionary,
+ a Korean particle list can be used when a Korean word written in CJK ideographs
+ or a Korean word in Hangul and a closing punctuation mark is followed by a Korean
+ particle. Examples include: "大韓民國은 民主共和國이다", "『님의 침묵』이".
+ </icu:extensions>
+ -->
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/pt.xml b/intl/icu/source/data/xml/brkitr/pt.xml
new file mode 100644
index 0000000000..8ff12bf014
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/pt.xml
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2014-2015 International Business Machines Corporation and others. All rights reserved.
+
+ See comments on https://unicode-org.atlassian.net/browse/ICU-10750 - this file is needed to emit break iterator rules properly.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="pt"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/root.xml b/intl/icu/source/data/xml/brkitr/root.xml
new file mode 100644
index 0000000000..0d3e667ae1
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/root.xml
@@ -0,0 +1,48 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="root"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:grapheme icu:dependency="char.brk"/>
+ <icu:word icu:dependency="word.brk"/>
+ <icu:line icu:dependency="line.brk"/>
+ <icu:line alt="loose" icu:dependency="line_loose.brk"/>
+ <icu:line alt="normal" icu:dependency="line_normal.brk"/>
+ <icu:line alt="strict" icu:dependency="line.brk"/>
+ <icu:sentence icu:dependency="sent.brk"/>
+ <icu:title icu:dependency="title.brk"/>
+ </icu:boundaries>
+ <icu:dictionaries>
+ <icu:dictionary type="Hani" icu:dependency="cjdict.dict"/>
+ <icu:dictionary type="Hira" icu:dependency="cjdict.dict"/>
+ <icu:dictionary type="Kana" icu:dependency="cjdict.dict"/>
+ <icu:dictionary type="Khmr" icu:dependency="khmerdict.dict"/>
+ <icu:dictionary type="Laoo" icu:dependency="laodict.dict"/>
+ <icu:dictionary type="Mymr" icu:dependency="burmesedict.dict"/>
+ <icu:dictionary type="Thai" icu:dependency="thaidict.dict"/>
+ </icu:dictionaries>
+ <!--
+ <icu:lstm>
+ <icu:lstmdata type="Thai" icu:dependency="Thai_graphclust_model4_heavy.res"/>
+ <icu:lstmdata type="Mymr" icu:dependency="Burmese_graphclust_model5_heavy.res"/>
+ </icu:lstm>
+ -->
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/ru.xml b/intl/icu/source/data/xml/brkitr/ru.xml
new file mode 100644
index 0000000000..5a7ae84964
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/ru.xml
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+
+ See comments on https://unicode-org.atlassian.net/browse/ICU-10750 - this file is needed to emit break iterator rules properly.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="ru"/>
+ </identity>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/sv.xml b/intl/icu/source/data/xml/brkitr/sv.xml
new file mode 100644
index 0000000000..5f1566942d
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/sv.xml
@@ -0,0 +1,26 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2010-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$Revision$"/>
+ <language type="sv"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:word icu:dependency="word_fi_sv.brk"/>
+ </icu:boundaries>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/zh.xml b/intl/icu/source/data/xml/brkitr/zh.xml
new file mode 100644
index 0000000000..48d0d68110
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/zh.xml
@@ -0,0 +1,30 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2006-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$ $"/>
+ <generation date="$ $"/>
+ <language type="zh"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:line icu:dependency="line_cj.brk"/>
+ <icu:line alt="loose" icu:dependency="line_loose_cj.brk"/>
+ <icu:line alt="normal" icu:dependency="line_normal_cj.brk"/>
+ <icu:line alt="strict" icu:dependency="line_cj.brk"/>
+ </icu:boundaries>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+
diff --git a/intl/icu/source/data/xml/brkitr/zh_Hant.xml b/intl/icu/source/data/xml/brkitr/zh_Hant.xml
new file mode 100644
index 0000000000..287b9a5639
--- /dev/null
+++ b/intl/icu/source/data/xml/brkitr/zh_Hant.xml
@@ -0,0 +1,30 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Copyright (C) 2016 and later: Unicode, Inc. and others.
+ License & terms of use: http://www.unicode.org/copyright.html
+ Copyright (c) 2006-2015 International Business Machines Corporation and others. All rights reserved.
+-->
+<!DOCTYPE ldml SYSTEM "../../dtd/cldr/common/dtd/ldml.dtd"
+[
+ <!ENTITY % icu SYSTEM "../../dtd/cldr/common/dtd/ldmlICU.dtd">
+ %icu;
+]
+>
+<ldml>
+ <identity>
+ <version number="$ $"/>
+ <generation date="$ $"/>
+ <language type="zh_Hant"/>
+ </identity>
+ <special xmlns:icu="http://www.icu-project.org/">
+ <icu:breakIteratorData>
+ <icu:boundaries>
+ <icu:line icu:dependency="line_cj.brk"/>
+ <icu:line alt="loose" icu:dependency="line_loose_cj.brk"/>
+ <icu:line alt="normal" icu:dependency="line_normal_cj.brk"/>
+ <icu:line alt="strict" icu:dependency="line_cj.brk"/>
+ </icu:boundaries>
+ </icu:breakIteratorData>
+ </special>
+</ldml>
+