summaryrefslogtreecommitdiff
path: root/i18npool
diff options
context:
space:
mode:
authorVladimir Glazounov <vg@openoffice.org>2008-10-01 07:16:40 +0000
committerVladimir Glazounov <vg@openoffice.org>2008-10-01 07:16:40 +0000
commit17236a45c1368b8e9be8dae0f2b6918a88e7f4f4 (patch)
tree90569747d57f84437e79f4ab3ab7a92a0a6b4273 /i18npool
parent53414cda09bf3d5ff63e9b984ab4e932a5b12878 (diff)
CWS-TOOLING: integrate CWS i18n45
Diffstat (limited to 'i18npool')
-rw-r--r--i18npool/inc/breakiterator_cjk.hxx4
-rw-r--r--i18npool/inc/breakiterator_hi.hxx37
-rw-r--r--i18npool/inc/localedata.hxx3
-rw-r--r--i18npool/source/breakiterator/breakiteratorImpl.cxx4
-rw-r--r--i18npool/source/breakiterator/breakiterator_cjk.cxx25
-rw-r--r--i18npool/source/breakiterator/breakiterator_hi.cxx191
-rw-r--r--i18npool/source/breakiterator/breakiterator_unicode.cxx10
-rw-r--r--i18npool/source/breakiterator/data/char_in.txt48
-rw-r--r--i18npool/source/breakiterator/data/char_ta.txt46
-rw-r--r--i18npool/source/breakiterator/makefile.mk3
-rw-r--r--i18npool/source/localedata/LocaleNode.cxx9
-rw-r--r--i18npool/source/localedata/data/bn_BD.xml7
-rw-r--r--i18npool/source/localedata/data/bn_IN.xml7
-rw-r--r--i18npool/source/localedata/data/gu_IN.xml7
-rw-r--r--i18npool/source/localedata/data/hi_IN.xml7
-rw-r--r--i18npool/source/localedata/data/ja_JP.xml1
-rw-r--r--i18npool/source/localedata/data/kn_IN.xml7
-rw-r--r--i18npool/source/localedata/data/ko_KR.xml1
-rw-r--r--i18npool/source/localedata/data/locale.dtd2
-rw-r--r--i18npool/source/localedata/data/ml_IN.xml7
-rw-r--r--i18npool/source/localedata/data/or_IN.xml7
-rw-r--r--i18npool/source/localedata/data/pa_IN.xml7
-rw-r--r--i18npool/source/localedata/data/ta_IN.xml7
-rw-r--r--i18npool/source/localedata/data/te_IN.xml7
-rw-r--r--i18npool/source/localedata/data/zh_CN.xml1
-rw-r--r--i18npool/source/localedata/data/zh_TW.xml1
-rw-r--r--i18npool/source/localedata/localedata.cxx17
-rw-r--r--i18npool/source/registerservices/registerservices.cxx11
28 files changed, 190 insertions, 294 deletions
diff --git a/i18npool/inc/breakiterator_cjk.hxx b/i18npool/inc/breakiterator_cjk.hxx
index f01351103b54..8a1ec419324c 100644
--- a/i18npool/inc/breakiterator_cjk.hxx
+++ b/i18npool/inc/breakiterator_cjk.hxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: breakiterator_cjk.hxx,v $
- * $Revision: 1.6 $
+ * $Revision: 1.6.16.1 $
*
* This file is part of OpenOffice.org.
*
@@ -58,6 +58,7 @@ public:
protected:
xdictionary *dict;
+ rtl::OUString hangingCharacters;
};
#define BREAKITERATOR_CJK( lang ) \
@@ -69,6 +70,7 @@ public:\
#ifdef BREAKITERATOR_ALL
BREAKITERATOR_CJK( zh )
+BREAKITERATOR_CJK( zh_TW )
BREAKITERATOR_CJK( ja )
BREAKITERATOR_CJK( ko )
#endif
diff --git a/i18npool/inc/breakiterator_hi.hxx b/i18npool/inc/breakiterator_hi.hxx
index 76fa22c354f1..e69de29bb2d1 100644
--- a/i18npool/inc/breakiterator_hi.hxx
+++ b/i18npool/inc/breakiterator_hi.hxx
@@ -1,37 +0,0 @@
-/*************************************************************************
-#*
-#* Copyright (c) 2002 Sun Microsystems Inc.
-#*
-#* Bugs! - Contact Prabhat.Hegde@sun.com
-#*************************************************************************/
-
-#ifndef _I18N_BREAKITERATOR_HI_HXX_
-#define _I18N_BREAKITERATOR_HI_HXX_
-
-#include <breakiterator_ctl.hxx>
-
-namespace com {
-namespace sun {
-namespace star {
-namespace i18n {
-
-// ----------------------------------------------------
-// class BreakIterator_hi
-// ----------------------------------------------------
-class BreakIterator_hi : public BreakIterator_CTL
-{
-public:
- BreakIterator_hi();
- ~BreakIterator_hi();
-
-protected:
- void SAL_CALL makeIndex(const rtl::OUString& text, sal_Int32 pos)
- throw(com::sun::star::uno::RuntimeException);
-};
-
-}
-}
-}
-}
-
-#endif
diff --git a/i18npool/inc/localedata.hxx b/i18npool/inc/localedata.hxx
index 41ec2bd12410..37a643cac392 100644
--- a/i18npool/inc/localedata.hxx
+++ b/i18npool/inc/localedata.hxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: localedata.hxx,v $
- * $Revision: 1.20 $
+ * $Revision: 1.20.16.1 $
*
* This file is part of OpenOffice.org.
*
@@ -112,6 +112,7 @@ public:
virtual com::sun::star::uno::Sequence< rtl::OUString > SAL_CALL getFollowPageWords( const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
virtual sal_Bool SAL_CALL hasPhonetic( const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
virtual sal_Bool SAL_CALL isPhonetic( const com::sun::star::lang::Locale& rLocale, const rtl::OUString& algorithm ) throw(com::sun::star::uno::RuntimeException);
+ virtual rtl::OUString SAL_CALL getHangingCharacters( const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
//XServiceInfo
virtual rtl::OUString SAL_CALL getImplementationName() throw( com::sun::star::uno::RuntimeException );
diff --git a/i18npool/source/breakiterator/breakiteratorImpl.cxx b/i18npool/source/breakiterator/breakiteratorImpl.cxx
index 122d8835df70..bb08d9e4e6c3 100644
--- a/i18npool/source/breakiterator/breakiteratorImpl.cxx
+++ b/i18npool/source/breakiterator/breakiteratorImpl.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: breakiteratorImpl.cxx,v $
- * $Revision: 1.28 $
+ * $Revision: 1.27.4.2 $
*
* This file is part of OpenOffice.org.
*
@@ -234,6 +234,7 @@ sal_Int32 SAL_CALL BreakIteratorImpl::beginOfSentence( const OUString& Text, sal
{
if (nStartPos < 0 || nStartPos > Text.getLength())
return -1;
+ if (Text.getLength() == 0) return 0;
return LBI->beginOfSentence(Text, nStartPos, rLocale);
}
@@ -242,6 +243,7 @@ sal_Int32 SAL_CALL BreakIteratorImpl::endOfSentence( const OUString& Text, sal_I
{
if (nStartPos < 0 || nStartPos > Text.getLength())
return -1;
+ if (Text.getLength() == 0) return 0;
return LBI->endOfSentence(Text, nStartPos, rLocale);
}
diff --git a/i18npool/source/breakiterator/breakiterator_cjk.cxx b/i18npool/source/breakiterator/breakiterator_cjk.cxx
index d2b15d0be742..3d684b8788df 100644
--- a/i18npool/source/breakiterator/breakiterator_cjk.cxx
+++ b/i18npool/source/breakiterator/breakiterator_cjk.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: breakiterator_cjk.cxx,v $
- * $Revision: 1.17 $
+ * $Revision: 1.17.16.1 $
*
* This file is part of OpenOffice.org.
*
@@ -33,6 +33,7 @@
#define BREAKITERATOR_ALL
#include <breakiterator_cjk.hxx>
+#include <localedata.hxx>
#include <i18nutil/unicode.hxx>
using namespace ::com::sun::star::uno;
@@ -108,7 +109,7 @@ LineBreakResults SAL_CALL BreakIterator_CJK::getLineBreak(
LineBreakResults lbr;
if (bOptions.allowPunctuationOutsideMargin &&
- bOptions.forbiddenBeginCharacters.indexOf(Text[nStartPos]) != -1 &&
+ hangingCharacters.indexOf(Text[nStartPos]) != -1 &&
++nStartPos == Text.getLength()) {
; // do nothing
} else if (bOptions.applyForbiddenRules && 0 < nStartPos && nStartPos < Text.getLength()) {
@@ -122,12 +123,15 @@ LineBreakResults SAL_CALL BreakIterator_CJK::getLineBreak(
lbr.breakType = BreakType::WORDBOUNDARY;
return lbr;
}
+
+#define LOCALE(language, country) lang::Locale(OUString::createFromAscii(language), OUString::createFromAscii(country), OUString())
// ----------------------------------------------------
// class BreakIterator_zh
// ----------------------------------------------------;
BreakIterator_zh::BreakIterator_zh()
{
dict = new xdictionary("zh");
+ hangingCharacters = LocaleData().getHangingCharacters(LOCALE("zh", "CN"));
cBreakIterator = "com.sun.star.i18n.BreakIterator_zh";
}
@@ -137,12 +141,28 @@ BreakIterator_zh::~BreakIterator_zh()
}
// ----------------------------------------------------
+// class BreakIterator_zh_TW
+// ----------------------------------------------------;
+BreakIterator_zh_TW::BreakIterator_zh_TW()
+{
+ dict = new xdictionary("zh");
+ hangingCharacters = LocaleData().getHangingCharacters(LOCALE("zh", "TW"));
+ cBreakIterator = "com.sun.star.i18n.BreakIterator_zh_TW";
+}
+
+BreakIterator_zh_TW::~BreakIterator_zh_TW()
+{
+ delete dict;
+}
+
+// ----------------------------------------------------
// class BreakIterator_ja
// ----------------------------------------------------;
BreakIterator_ja::BreakIterator_ja()
{
dict = new xdictionary("ja");
dict->setJapaneseWordBreak();
+ hangingCharacters = LocaleData().getHangingCharacters(LOCALE("ja", "JP"));
cBreakIterator = "com.sun.star.i18n.BreakIterator_ja";
}
@@ -156,6 +176,7 @@ BreakIterator_ja::~BreakIterator_ja()
// ----------------------------------------------------;
BreakIterator_ko::BreakIterator_ko()
{
+ hangingCharacters = LocaleData().getHangingCharacters(LOCALE("ko", "KR"));
cBreakIterator = "com.sun.star.i18n.BreakIterator_ko";
}
diff --git a/i18npool/source/breakiterator/breakiterator_hi.cxx b/i18npool/source/breakiterator/breakiterator_hi.cxx
index d3002a6f3d80..e69de29bb2d1 100644
--- a/i18npool/source/breakiterator/breakiterator_hi.cxx
+++ b/i18npool/source/breakiterator/breakiterator_hi.cxx
@@ -1,191 +0,0 @@
-/*************************************************************************
-#*
-#* Copyright (c) 2002 Sun Microsystems Inc.
-#*
-#* Bugs! - Contact Prabhat.Hegde@sun.com
-#************************************************************************/
-
-// MARKER(update_precomp.py): autogen include statement, do not remove
-#include "precompiled_i18npool.hxx"
-
-#include <breakiterator_hi.hxx>
-
-#include <string.h> // for memset
-
-using namespace ::com::sun::star::uno;
-using namespace ::com::sun::star::lang;
-using namespace ::rtl;
-
-namespace com { namespace sun { namespace star { namespace i18n {
-
-// ----------------------------------------------------
-// class Breakiterator_hi
-// ----------------------------------------------------;
-BreakIterator_hi::BreakIterator_hi()
-{
- cBreakIterator = "com.sun.star.i18n.BreakIterator_hi";
-}
-
-BreakIterator_hi::~BreakIterator_hi()
-{
-}
-
-/*
- * Devanagari character class Definitions
- */
-#define _NP 1L
-#define _UP (1L<<1)
-#define _IV (1L<<2)
-#define _CN (1L<<3)
-#define _CK (1L<<4)
-#define _RC (1L<<5)
-#define _NM (1L<<6)
-#define _IM (1L<<7)
-#define _HL (1L<<8)
-#define _NK (1L<<9)
-#define _VD (1L<<10)
-#define _HD (1L<<11)
-#define _II_M (1L<<12)
-#define _EY_M (1L<<13)
-#define _AI_M (1L<<14)
-#define _OW1_M (1L<<15)
-#define _OW2_M (1L<<16)
-#define _MS (1L<<17)
-#define _AYE_M (1L<<18)
-#define _EE_M (1L<<19)
-#define _AWE_M (1L<<20)
-#define _O_M (1L<<21)
-#define _RM (_II_M|_EY_M|_AI_M|_OW1_M|_OW2_M|_AYE_M|_EE_M|_AWE_M|_O_M)
-
-/* Non-Defined Class type */
-#define __ND 0
-
-/*
- * Devanagari character type definitions
- */
-#define __UP 1 // ChandraBindu & Anuswar
-#define __NP 2 // Visarg
-#define __IV 3 // Independant Vowels
-#define __CN 4 // Consonants except _CK & _RC
-#define __CK 5 // Consonants that can be followed by Nukta
-#define __RC 6 // Ra
-#define __NM 7 // Matra
-#define __RM 8 // Ra + HAL
-#define __IM 9 // Choti I Matra
-#define __HL 10 // HAL
-#define __NK 11 // Nukta
-#define __VD 12 // Vedic
-#define __HD 13 // Hindu Numerals
-
-/*
- * Devanagari character type table
- */
-static const sal_uInt16 devaCT[128] = {
-/* 0, 1, 2, 3, 4, 5, 6, 7,
- 8, 9, A, B, C, D, E, F, */
-/* 0900 */ __ND, __UP, __UP, __NP, __ND, __IV, __IV, __IV,
- __IV, __IV, __IV, __IV, __IV, __IV, __IV, __IV,
-/* 0910 */ __IV, __IV, __IV, __IV, __IV, __CK, __CK, __CK,
- __CN, __CN, __CN, __CN, __CK, __CN, __CN, __CN,
-/* 0920 */ __CN, __CK, __CK, __CN, __CN, __CN, __CN, __CN,
- __CN, __CN, __CN, __CK, __CN, __CN, __CN, __CN,
-/* 0930 */ __RC, __CN, __CN, __CN, __CN, __CN, __CN, __CN,
- __CN, __CN, __ND, __ND, __NK, __VD, __NM, __IM,
-/* 0940 */ __RM, __NM, __NM, __NM, __NM, __RM, __RM, __RM,
- __RM, __RM, __RM, __RM, __RM, __HL, __ND, __ND,
-/* 0950 */ __ND, __VD, __VD, __VD, __VD, __ND, __ND, __ND,
- __CN, __CN, __CN, __CN, __CN, __CN, __CN, __CN,
-/* 0960 */ __IV, __IV, __NM, __NM, __ND, __ND, __HD, __HD,
- __HD, __HD, __HD, __HD, __HD, __HD, __HD, __HD,
-/* 0970 */ __ND, __ND, __ND, __ND, __ND, __ND, __ND, __ND,
- __ND, __ND, __ND, __ND, __ND, __ND, __ND, __ND,
-};
-
-
-#define getCharType(x) \
- ((x >= 0x0900 && x < 0x097f) ? devaCT[x - 0x0900] : __ND)
-
-/*
- * Devanagari character composition table
- */
-static const sal_uInt16 devaCompRel[14][14] = {
- /* ND, UP, NP, IV, CN, CK, RC, NM, RM, IM, HL, NK, VD, HD, */
- /* 0 */ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* ND */
- /* 1 */ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* UP */
- /* 2 */ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* NP */
- /* 3 */ { 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* IV */
- /* 4 */ { 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0 }, /* CN */
- /* 5 */ { 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0 }, /* CK */
- /* 6 */ { 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0 }, /* RC */
- /* 7 */ { 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* NM */
- /* 8 */ { 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* RM */
- /* 9 */ { 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* IM */
- /* 10 */ { 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0 }, /* HL */
- /* 11 */ { 0, 1, 1, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0 }, /* NK */
- /* 12 */ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, /* VD */
- /* 13 */ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } /* HD */
-};
-
-static sal_uInt16 SAL_CALL
-getCombState(const sal_Unicode *text, sal_Int32 pos)
-{
- sal_uInt16 ch1 = getCharType(text[pos]);
- sal_uInt16 ch2 = getCharType(text[pos+1]);
-
- return devaCompRel[ch1][ch2];
-}
-
-static sal_uInt32 SAL_CALL
-getACell(const sal_Unicode *text, sal_Int32 pos, sal_Int32 len)
-{
- sal_uInt32 curr = 1;
- for (; pos + 1 < len && getCombState(text, pos) == 1; curr++, pos++) {}
- return curr;
-}
-
-#define is_Hindi(x) ((x >= 0x0900 && x < 0x097f) || (x >= 0x0905 && x < 0x0940) || \
- (x >= 0x093c && x < 0x094e) || (x >= 0x0950 && x < 0x0954) || \
- (x >= 0x0958 && x < 0x0971))
-
-void SAL_CALL
-i18n::BreakIterator_hi::makeIndex(const OUString& Text, sal_Int32 nStartPos)
- throw(uno::RuntimeException)
-{
- if (Text != cachedText) {
- cachedText = Text;
- if (cellIndexSize < cachedText.getLength()) {
- cellIndexSize = cachedText.getLength();
- free(nextCellIndex);
- free(previousCellIndex);
- nextCellIndex = (sal_Int32*) calloc(cellIndexSize, sizeof(sal_Int32));
- previousCellIndex = (sal_Int32*) calloc(cellIndexSize, sizeof(sal_Int32));
- }
- // reset nextCell for new Text
- memset(nextCellIndex, 0, cellIndexSize * sizeof(sal_Int32));
- }
- else if (nextCellIndex[nStartPos] > 0 || ! is_Hindi(Text[nStartPos]))
- return;
-
- const sal_Unicode* str = cachedText.getStr();
- sal_Int32 len = cachedText.getLength(), startPos, endPos;
-
- startPos = nStartPos;
- while (startPos > 0 && is_Hindi(str[startPos-1])) startPos--;
- endPos = nStartPos+1;
- while (endPos < len && is_Hindi(str[endPos])) endPos++;
-
- sal_Int32 start, end, pos;
- pos = start = end = startPos;
-
- while (pos < endPos) {
- end += getACell(str, start, endPos);
- while (pos < end) {
- nextCellIndex[pos] = end;
- previousCellIndex[pos] = start;
- pos++;
- }
- start = end;
- }
-}
-
-} } } }
diff --git a/i18npool/source/breakiterator/breakiterator_unicode.cxx b/i18npool/source/breakiterator/breakiterator_unicode.cxx
index 33244844f1c6..9dbecd813b49 100644
--- a/i18npool/source/breakiterator/breakiterator_unicode.cxx
+++ b/i18npool/source/breakiterator/breakiterator_unicode.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: breakiterator_unicode.cxx,v $
- * $Revision: 1.36 $
+ * $Revision: 1.36.2.1 $
*
* This file is part of OpenOffice.org.
*
@@ -363,11 +363,17 @@ LineBreakResults SAL_CALL BreakIterator_Unicode::getLineBreak(
{
LineBreakResults lbr;
+ if (nStartPos >= Text.getLength()) {
+ lbr.breakIndex = Text.getLength();
+ lbr.breakType = BreakType::WORDBOUNDARY;
+ return lbr;
+ }
+
loadICUBreakIterator(rLocale, LOAD_LINE_BREAKITERATOR, 0, lineRule, Text);
sal_Bool GlueSpace=sal_True;
while (GlueSpace) {
- if (line.aBreakIterator->isBoundary(nStartPos)) { //Line boundary break
+ if (line.aBreakIterator->preceding(nStartPos + 1) == nStartPos) { //Line boundary break
lbr.breakIndex = nStartPos;
lbr.breakType = BreakType::WORDBOUNDARY;
} else if (hOptions.rHyphenator.is()) { //Hyphenation break
diff --git a/i18npool/source/breakiterator/data/char_in.txt b/i18npool/source/breakiterator/data/char_in.txt
new file mode 100644
index 000000000000..72c4a44720cd
--- /dev/null
+++ b/i18npool/source/breakiterator/data/char_in.txt
@@ -0,0 +1,48 @@
+#
+# Copyright (C) 2002-2003, International Business Machines Corporation and others.
+# All Rights Reserved.
+#
+# file: char.txt
+#
+# ICU Character Break Rules, also known as Grapheme Cluster Boundaries
+# See Unicode Standard Annex #29.
+# These rules are based on TR29 Version 4.0.0
+#
+
+#
+# Character Class Definitions.
+# The names are those from TR29.
+#
+$CR = \r;
+$LF = \n;
+$Control = [[:Zl:] [:Zp:] [:Cc:] [:Cf:]];
+
+# add Japanese Half Width voicing marks to $Extend
+$VoiceMarks = [\uff9e\uff9f];
+$cmcextend = [ \u0903 \u093e-\u0940 \u0949-\u094C \u09bf-\u09c0 \u09c7-\u09c8 \u09cb-\u09cc \u0bc1-\u0bc2 \u0bc6-\u0bc8 \u0bca-\u0bcc \u0c01-\u0c03 \u0c41-\u0c44];
+$Extend = [[:Grapheme_Extend = TRUE:] $VoiceMarks $cmcextend];
+
+#
+# Korean Syllable Definitions
+#
+$L = [:Hangul_Syllable_Type = L:];
+$V = [:Hangul_Syllable_Type = V:];
+$T = [:Hangul_Syllable_Type = T:];
+
+$LV = [:Hangul_Syllable_Type = LV:];
+$LVT = [:Hangul_Syllable_Type = LVT:];
+
+$HangulSyllable = $L+ | ($L* ($LV? $V+ | $LV | $LVT) $T*) | $T+;
+
+#
+# Forward Break Rules
+#
+$CR $LF;
+([^$Control] | $HangulSyllable) $Extend*;
+.;
+
+
+#
+# Reverse Rule, back up to the beginning of some preceding grapheme cluster.
+#
+! ($Extend | $V | $T )* ($LF $CR | ($LV | $LVT)?$L* | .);
diff --git a/i18npool/source/breakiterator/data/char_ta.txt b/i18npool/source/breakiterator/data/char_ta.txt
index 5c9c702356a6..e69de29bb2d1 100644
--- a/i18npool/source/breakiterator/data/char_ta.txt
+++ b/i18npool/source/breakiterator/data/char_ta.txt
@@ -1,46 +0,0 @@
-#
-# Copyright (C) 2002-2003, International Business Machines Corporation and others.
-# All Rights Reserved.
-#
-# file: char.txt
-#
-# ICU Character Break Rules, also known as Grapheme Cluster Boundaries
-# See Unicode Standard Annex #29.
-# These rules are based on TR29 Version 4.0.0
-#
-
-#
-# Character Class Definitions.
-# The names are those from TR29.
-#
-$CR = \r;
-$LF = \n;
-$Control = [[:Zl:] [:Zp:] [:Cc:] [:Cf:]];
-
-$TAMIL = [ \u0bc1-\u0bc2 \u0bc6-\u0bc8 \u0bca-\u0bcc ];
-$Extend = [[:Grapheme_Extend = TRUE:] $TAMIL];
-
-#
-# Korean Syllable Definitions
-#
-$L = [:Hangul_Syllable_Type = L:];
-$V = [:Hangul_Syllable_Type = V:];
-$T = [:Hangul_Syllable_Type = T:];
-
-$LV = [:Hangul_Syllable_Type = LV:];
-$LVT = [:Hangul_Syllable_Type = LVT:];
-
-$HangulSyllable = $L+ | ($L* ($LV? $V+ | $LV | $LVT) $T*) | $T+;
-
-#
-# Forward Break Rules
-#
-$CR $LF;
-([^$Control] | $HangulSyllable) $Extend*;
-.;
-
-
-#
-# Reverse Rule, back up to the beginning of some preceding grapheme cluster.
-#
-! ($Extend | $V | $T )* ($LF $CR | ($LV | $LVT)?$L* | .);
diff --git a/i18npool/source/breakiterator/makefile.mk b/i18npool/source/breakiterator/makefile.mk
index 425806f6134e..2db7d3c7d73b 100644
--- a/i18npool/source/breakiterator/makefile.mk
+++ b/i18npool/source/breakiterator/makefile.mk
@@ -8,7 +8,7 @@
#
# $RCSfile: makefile.mk,v $
#
-# $Revision: 1.17 $
+# $Revision: 1.17.16.1 $
#
# This file is part of OpenOffice.org.
#
@@ -57,7 +57,6 @@ SLOFILES= \
$(SLO)$/breakiterator_cjk.obj \
$(SLO)$/breakiterator_ctl.obj \
$(SLO)$/breakiterator_th.obj \
- $(SLO)$/breakiterator_hi.obj \
$(SLO)$/breakiterator_unicode.obj \
$(SLO)$/xdictionary.obj \
$(subst,$(MISC)$/,$(SLO)$/ $(MY_MISC_CXXFILES:s/.c/.obj/))
diff --git a/i18npool/source/localedata/LocaleNode.cxx b/i18npool/source/localedata/LocaleNode.cxx
index 725033b929f8..0835746ba55c 100644
--- a/i18npool/source/localedata/LocaleNode.cxx
+++ b/i18npool/source/localedata/LocaleNode.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: LocaleNode.cxx,v $
- * $Revision: 1.29 $
+ * $Revision: 1.29.16.1 $
*
* This file is part of OpenOffice.org.
*
@@ -1449,15 +1449,18 @@ void LCMiscNode::generateCode (const OFileWriter &of) const
if (forbidNode) {
of.writeParameter( "forbiddenBegin", forbidNode -> getChildAt(0)->getValue());
of.writeParameter( "forbiddenEnd", forbidNode -> getChildAt(1)->getValue());
+ of.writeParameter( "hangingChars", forbidNode -> getChildAt(2)->getValue());
} else {
of.writeParameter( "forbiddenBegin", ::rtl::OUString());
of.writeParameter( "forbiddenEnd", ::rtl::OUString());
+ of.writeParameter( "hangingChars", ::rtl::OUString());
}
of.writeAsciiString("\nstatic const sal_Unicode* LCForbiddenCharactersArray[] = {\n");
of.writeAsciiString("\tforbiddenBegin,\n");
- of.writeAsciiString("\tforbiddenEnd\n");
+ of.writeAsciiString("\tforbiddenEnd,\n");
+ of.writeAsciiString("\thangingChars\n");
of.writeAsciiString("};\n\n");
- of.writeFunction("getForbiddenCharacters_", "2", "LCForbiddenCharactersArray");
+ of.writeFunction("getForbiddenCharacters_", "3", "LCForbiddenCharactersArray");
if (breakNode) {
of.writeParameter( "EditMode", breakNode -> getChildAt(0)->getValue());
diff --git a/i18npool/source/localedata/data/bn_BD.xml b/i18npool/source/localedata/data/bn_BD.xml
index 95f54ecadf08..a89bb1b6a1c2 100644
--- a/i18npool/source/localedata/data/bn_BD.xml
+++ b/i18npool/source/localedata/data/bn_BD.xml
@@ -151,6 +151,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+ <BreakIteratorRules>
+ <EditMode/>
+ <DictionaryMode/>
+ <WordCountMode/>
+ <CharacterMode>char_in</CharacterMode>
+ <LineMode/>
+ </BreakIteratorRules>
<ReservedWords>
<trueWord>সত্য</trueWord>
<falseWord>মিথ্যা</falseWord>
diff --git a/i18npool/source/localedata/data/bn_IN.xml b/i18npool/source/localedata/data/bn_IN.xml
index d28990dd8df2..1dc7992f9ffd 100644
--- a/i18npool/source/localedata/data/bn_IN.xml
+++ b/i18npool/source/localedata/data/bn_IN.xml
@@ -316,6 +316,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+ <BreakIteratorRules>
+ <EditMode/>
+ <DictionaryMode/>
+ <WordCountMode/>
+ <CharacterMode>char_in</CharacterMode>
+ <LineMode/>
+ </BreakIteratorRules>
<ReservedWords>
<trueWord>সত্য</trueWord>
<falseWord>মিথ্যা</falseWord>
diff --git a/i18npool/source/localedata/data/gu_IN.xml b/i18npool/source/localedata/data/gu_IN.xml
index 70842a35f94c..f5923a70f9a9 100644
--- a/i18npool/source/localedata/data/gu_IN.xml
+++ b/i18npool/source/localedata/data/gu_IN.xml
@@ -146,6 +146,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+<BreakIteratorRules>
+<EditMode/>
+<DictionaryMode/>
+<WordCountMode/>
+<CharacterMode>char_in</CharacterMode>
+<LineMode/>
+</BreakIteratorRules>
<ReservedWords>
<trueWord>સહી</trueWord>
<falseWord>ગલત</falseWord>
diff --git a/i18npool/source/localedata/data/hi_IN.xml b/i18npool/source/localedata/data/hi_IN.xml
index 80a0da791cac..cfca665ad46c 100644
--- a/i18npool/source/localedata/data/hi_IN.xml
+++ b/i18npool/source/localedata/data/hi_IN.xml
@@ -358,6 +358,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+<BreakIteratorRules>
+<EditMode/>
+<DictionaryMode/>
+<WordCountMode/>
+<CharacterMode>char_in</CharacterMode>
+<LineMode/>
+</BreakIteratorRules>
<ReservedWords>
<trueWord>सही</trueWord>
<falseWord>गलत</falseWord>
diff --git a/i18npool/source/localedata/data/ja_JP.xml b/i18npool/source/localedata/data/ja_JP.xml
index f0e9dad78e75..d09dd5302749 100644
--- a/i18npool/source/localedata/data/ja_JP.xml
+++ b/i18npool/source/localedata/data/ja_JP.xml
@@ -503,6 +503,7 @@
<ForbiddenCharacters>
<ForbiddenLineBeginCharacters>!%),.:;?]}¢°’”‰′″℃、。々〉》」』】〕ぁぃぅぇぉっゃゅょゎ゛゜ゝゞァィゥェォッャュョヮヵヶ・ーヽヾ!%),.:;?]}。」、・ァィゥェォャュョッー゙゚¢</ForbiddenLineBeginCharacters>
<ForbiddenLineEndCharacters>$([¥{£¥‘“〈《「『【〔$([{「£¥</ForbiddenLineEndCharacters>
+ <LineBreakHangingCharacters>、。,.</LineBreakHangingCharacters>
</ForbiddenCharacters>
<ReservedWords>
<trueWord>true</trueWord>
diff --git a/i18npool/source/localedata/data/kn_IN.xml b/i18npool/source/localedata/data/kn_IN.xml
index 60ad028677d1..00d5dcff7639 100644
--- a/i18npool/source/localedata/data/kn_IN.xml
+++ b/i18npool/source/localedata/data/kn_IN.xml
@@ -146,6 +146,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+<BreakIteratorRules>
+<EditMode/>
+<DictionaryMode/>
+<WordCountMode/>
+<CharacterMode>char_in</CharacterMode>
+<LineMode/>
+</BreakIteratorRules>
<ReservedWords>
<trueWord>ಸಹೀ</trueWord>
<falseWord>ಗಲತ್</falseWord>
diff --git a/i18npool/source/localedata/data/ko_KR.xml b/i18npool/source/localedata/data/ko_KR.xml
index 4a5f4f63d7bb..bbd5b0ded2be 100644
--- a/i18npool/source/localedata/data/ko_KR.xml
+++ b/i18npool/source/localedata/data/ko_KR.xml
@@ -580,6 +580,7 @@
<ForbiddenCharacters>
<ForbiddenLineBeginCharacters>!%),.:;?]}¢¢?&apos;&quot;′″℃&gt;〉>》」』】〕!%),.:;?]}。」、・ ゙゚</ForbiddenLineBeginCharacters>
<ForbiddenLineEndCharacters>$(¥£[\{£¥&apos;&quot;&lt;<《「『【〔$([{₩「</ForbiddenLineEndCharacters>
+ <LineBreakHangingCharacters>!,.:;?、。!,.:;?</LineBreakHangingCharacters>
</ForbiddenCharacters>
<ReservedWords>
<trueWord>참</trueWord>
diff --git a/i18npool/source/localedata/data/locale.dtd b/i18npool/source/localedata/data/locale.dtd
index fb2cc54c7260..5e9f82dc36d2 100644
--- a/i18npool/source/localedata/data/locale.dtd
+++ b/i18npool/source/localedata/data/locale.dtd
@@ -403,7 +403,7 @@
<!ELEMENT LC_MISC (ForbiddenCharacters?, BreakIteratorRules?, ReservedWords?)>
<!ATTLIST LC_MISC %RefLocale;>
-<!ELEMENT ForbiddenCharacters (ForbiddenLineBeginCharacters, ForbiddenLineEndCharacters)>
+<!ELEMENT ForbiddenCharacters (ForbiddenLineBeginCharacters, ForbiddenLineEndCharacters, LineBreakHangingCharacters)>
<!ELEMENT ForbiddenLineBeginCharacters (#PCDATA)>
<!ELEMENT ForbiddenLineEndCharacters (#PCDATA)>
diff --git a/i18npool/source/localedata/data/ml_IN.xml b/i18npool/source/localedata/data/ml_IN.xml
index eb3fc4a342cd..813e523aa9aa 100644
--- a/i18npool/source/localedata/data/ml_IN.xml
+++ b/i18npool/source/localedata/data/ml_IN.xml
@@ -314,6 +314,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+ <BreakIteratorRules>
+ <EditMode/>
+ <DictionaryMode/>
+ <WordCountMode/>
+ <CharacterMode>char_in</CharacterMode>
+ <LineMode/>
+ </BreakIteratorRules>
<ReservedWords>
<trueWord>അതെ</trueWord>
<falseWord>അല്ല</falseWord>
diff --git a/i18npool/source/localedata/data/or_IN.xml b/i18npool/source/localedata/data/or_IN.xml
index c0ea95fefc33..168b542f1894 100644
--- a/i18npool/source/localedata/data/or_IN.xml
+++ b/i18npool/source/localedata/data/or_IN.xml
@@ -327,6 +327,13 @@
<Transliteration unoid="IGNORE_CASE"/>
</LC_TRANSLITERATION>
<LC_MISC>
+ <BreakIteratorRules>
+ <EditMode/>
+ <DictionaryMode/>
+ <WordCountMode/>
+ <CharacterMode>char_in</CharacterMode>
+ <LineMode/>
+ </BreakIteratorRules>
<ReservedWords>
<trueWord>ସତ</trueWord>
<falseWord>ମିଛ</falseWord>
diff --git a/i18npool/source/localedata/data/pa_IN.xml b/i18npool/source/localedata/data/pa_IN.xml
index e411eeb9ae77..8ca94443e161 100644
--- a/i18npool/source/localedata/data/pa_IN.xml
+++ b/i18npool/source/localedata/data/pa_IN.xml
@@ -168,6 +168,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+ <BreakIteratorRules>
+ <EditMode/>
+ <DictionaryMode/>
+ <WordCountMode/>
+ <CharacterMode>char_in</CharacterMode>
+ <LineMode/>
+ </BreakIteratorRules>
<ReservedWords>
<trueWord>ਸਹੀ</trueWord>
<falseWord>ਗਲਤ</falseWord>
diff --git a/i18npool/source/localedata/data/ta_IN.xml b/i18npool/source/localedata/data/ta_IN.xml
index 298cb218b46d..a06e3743f06e 100644
--- a/i18npool/source/localedata/data/ta_IN.xml
+++ b/i18npool/source/localedata/data/ta_IN.xml
@@ -146,6 +146,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+<BreakIteratorRules>
+<EditMode/>
+<DictionaryMode/>
+<WordCountMode/>
+<CharacterMode>char_in</CharacterMode>
+<LineMode/>
+</BreakIteratorRules>
<ReservedWords>
<trueWord>ஸரி</trueWord>
<falseWord>தப்ப</falseWord>
diff --git a/i18npool/source/localedata/data/te_IN.xml b/i18npool/source/localedata/data/te_IN.xml
index 492240ae835f..b753b34ff68c 100644
--- a/i18npool/source/localedata/data/te_IN.xml
+++ b/i18npool/source/localedata/data/te_IN.xml
@@ -145,6 +145,13 @@
</LC_CURRENCY>
<LC_TRANSLITERATION ref="en_US"/>
<LC_MISC>
+<BreakIteratorRules>
+<EditMode/>
+<DictionaryMode/>
+<WordCountMode/>
+<CharacterMode>char_in</CharacterMode>
+<LineMode/>
+</BreakIteratorRules>
<ReservedWords>
<trueWord>నిజము</trueWord>
<falseWord>అపాదము</falseWord>
diff --git a/i18npool/source/localedata/data/zh_CN.xml b/i18npool/source/localedata/data/zh_CN.xml
index 081e0866f39b..3409144ae95a 100644
--- a/i18npool/source/localedata/data/zh_CN.xml
+++ b/i18npool/source/localedata/data/zh_CN.xml
@@ -430,6 +430,7 @@
<ForbiddenCharacters>
<ForbiddenLineBeginCharacters>:!),.:;?]}¢'"、。〉》」』】〕〗〞︰︱︳﹐、﹒﹔﹕﹖﹗﹚﹜﹞!),.:;?|}︴︶︸︺︼︾﹀﹂﹄﹏、~¢々‖•·ˇˉ―--′</ForbiddenLineBeginCharacters>
<ForbiddenLineEndCharacters>([{£¥'"‵〈《「『【〔〖([{£¥〝︵︷︹︻︽︿﹁﹃﹙﹛﹝({</ForbiddenLineEndCharacters>
+<LineBreakHangingCharacters>!,.:;?、。!,.:;?</LineBreakHangingCharacters>
</ForbiddenCharacters>
<ReservedWords>
<trueWord>真</trueWord>
diff --git a/i18npool/source/localedata/data/zh_TW.xml b/i18npool/source/localedata/data/zh_TW.xml
index 57882119ef0c..1d1e476b7771 100644
--- a/i18npool/source/localedata/data/zh_TW.xml
+++ b/i18npool/source/localedata/data/zh_TW.xml
@@ -359,6 +359,7 @@
<ForbiddenCharacters>
<ForbiddenLineBeginCharacters>!),.:;?]}¢·--'"¨•′、。〉》」』】〕〞︰︱︳︴︶︸︺︼︾﹀﹂﹄﹏﹐、﹒﹔﹕﹖﹗﹚﹜﹞!),.:;?|}、</ForbiddenLineBeginCharacters>
<ForbiddenLineEndCharacters>([{£¥'"‵〈《「『【〔〝︵︷︹︻︽︿﹁﹃﹙﹛﹝({</ForbiddenLineEndCharacters>
+<LineBreakHangingCharacters>!,.:;?、。!,.:;?</LineBreakHangingCharacters>
</ForbiddenCharacters>
<ReservedWords>
<trueWord>真</trueWord>
diff --git a/i18npool/source/localedata/localedata.cxx b/i18npool/source/localedata/localedata.cxx
index 1cfdce7b185e..e8001913e048 100644
--- a/i18npool/source/localedata/localedata.cxx
+++ b/i18npool/source/localedata/localedata.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: localedata.cxx,v $
- * $Revision: 1.59 $
+ * $Revision: 1.59.16.1 $
*
* This file is part of OpenOffice.org.
*
@@ -999,6 +999,21 @@ LocaleData::getForbiddenCharacters( const Locale& rLocale ) throw(RuntimeExcepti
}
}
+OUString SAL_CALL
+LocaleData::getHangingCharacters( const Locale& rLocale ) throw(RuntimeException)
+{
+ sal_Int16 LCForbiddenCharactersCount = 0;
+ sal_Unicode **LCForbiddenCharactersArray = NULL;
+
+ MyFunc_Type func = (MyFunc_Type) getFunctionSymbol( rLocale, "getForbiddenCharacters" );
+
+ if ( func ) {
+ LCForbiddenCharactersArray = func(LCForbiddenCharactersCount);
+ return OUString(LCForbiddenCharactersArray[2]);
+ }
+
+ return OUString();
+}
Sequence< OUString > SAL_CALL
LocaleData::getBreakIteratorRules( const Locale& rLocale ) throw(RuntimeException)
diff --git a/i18npool/source/registerservices/registerservices.cxx b/i18npool/source/registerservices/registerservices.cxx
index 54a5ecc67209..870c49939648 100644
--- a/i18npool/source/registerservices/registerservices.cxx
+++ b/i18npool/source/registerservices/registerservices.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: registerservices.cxx,v $
- * $Revision: 1.44 $
+ * $Revision: 1.44.16.2 $
*
* This file is part of OpenOffice.org.
*
@@ -65,7 +65,6 @@
#include <breakiteratorImpl.hxx>
#include <breakiterator_cjk.hxx>
#include <breakiterator_th.hxx>
-#include <breakiterator_hi.hxx>
#include <breakiterator_unicode.hxx>
#include <indexentrysupplier.hxx>
@@ -152,9 +151,9 @@ IMPL_CREATEINSTANCE_MSF( BreakIteratorImpl )
IMPL_CREATEINSTANCE( BreakIterator_Unicode )
IMPL_CREATEINSTANCE( BreakIterator_ja )
IMPL_CREATEINSTANCE( BreakIterator_zh )
+IMPL_CREATEINSTANCE( BreakIterator_zh_TW )
IMPL_CREATEINSTANCE( BreakIterator_ko )
IMPL_CREATEINSTANCE( BreakIterator_th )
-IMPL_CREATEINSTANCE( BreakIterator_hi )
IMPL_CREATEINSTANCE_MSF( ChapterCollator )
IMPL_CREATEINSTANCE_MSF( CollatorImpl )
IMPL_CREATEINSTANCE( Collator_Unicode )
@@ -369,15 +368,15 @@ static const struct InstancesArray {
{ "com.sun.star.i18n.BreakIterator_zh",
"com.sun.star.i18n.BreakIterator_zh",
&BreakIterator_zh_CreateInstance },
+ { "com.sun.star.i18n.BreakIterator_zh_TW",
+ "com.sun.star.i18n.BreakIterator_zh_TW",
+ &BreakIterator_zh_TW_CreateInstance },
{ "com.sun.star.i18n.BreakIterator_ko",
"com.sun.star.i18n.BreakIterator_ko",
&BreakIterator_ko_CreateInstance },
{ "com.sun.star.i18n.BreakIterator_th",
"com.sun.star.i18n.BreakIterator_th",
&BreakIterator_th_CreateInstance },
- { "com.sun.star.i18n.BreakIterator_hi",
- "com.sun.star.i18n.BreakIterator_hi",
- &BreakIterator_hi_CreateInstance },
{ "com.sun.star.i18n.Collator",
"com.sun.star.i18n.Collator",
&CollatorImpl_CreateInstance },