summaryrefslogtreecommitdiff
path: root/linguistic
diff options
context:
space:
mode:
authorOliver Bolte <obo@openoffice.org>2004-04-27 15:06:34 +0000
committerOliver Bolte <obo@openoffice.org>2004-04-27 15:06:34 +0000
commitdca163da5ee9664db914276ecfafb314836cca72 (patch)
treefdc48a01603c9341536c2e25cc2090b3af3f43b0 /linguistic
parentb5633ab341f54718b2e88d167c55bdbd3b783166 (diff)
INTEGRATION: CWS tl01 (1.1.2); FILE ADDED
2004/04/02 10:35:05 tl 1.1.2.6: #110762# change in Hangul/Hanja text conversion API 2004/03/22 16:22:50 tl 1.1.2.5: #110762# Solaris crash fixed by removing exception that was thrown for load performance reasons 2004/03/22 16:11:56 tl 1.1.2.4: #110762# Solaris crash fixed by removing exception that was thrown for load performance reasons 2004/03/20 10:34:00 gt 1.1.2.3: #111170# ConvDicXMLDictionaryContext_Impl::StartElement() missing exception declaration 2003/09/23 12:22:08 tl 1.1.2.2: #110762# prefix now checked for every local name usage 2003/09/12 10:42:39 tl 1.1.2.1: #110762# make textconversion dictionaries read/write XML
Diffstat (limited to 'linguistic')
-rw-r--r--linguistic/source/convdicxml.cxx529
1 files changed, 529 insertions, 0 deletions
diff --git a/linguistic/source/convdicxml.cxx b/linguistic/source/convdicxml.cxx
new file mode 100644
index 000000000000..f28f0c850471
--- /dev/null
+++ b/linguistic/source/convdicxml.cxx
@@ -0,0 +1,529 @@
+/*************************************************************************
+ *
+ * $RCSfile: convdicxml.cxx,v $
+ *
+ * $Revision: 1.2 $
+ *
+ * last change: $Author: obo $ $Date: 2004-04-27 16:06:34 $
+ *
+ * The Contents of this file are made available subject to the terms of
+ * either of the following licenses
+ *
+ * - GNU Lesser General Public License Version 2.1
+ * - Sun Industry Standards Source License Version 1.1
+ *
+ * Sun Microsystems Inc., October, 2000
+ *
+ * GNU Lesser General Public License Version 2.1
+ * =============================================
+ * Copyright 2000 by Sun Microsystems, Inc.
+ * 901 San Antonio Road, Palo Alto, CA 94303, USA
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License version 2.1, as published by the Free Software Foundation.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the Free Software
+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston,
+ * MA 02111-1307 USA
+ *
+ *
+ * Sun Industry Standards Source License Version 1.1
+ * =================================================
+ * The contents of this file are subject to the Sun Industry Standards
+ * Source License Version 1.1 (the "License"); You may not use this file
+ * except in compliance with the License. You may obtain a copy of the
+ * License at http://www.openoffice.org/license.html.
+ *
+ * Software provided under this License is provided on an "AS IS" basis,
+ * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
+ * WITHOUT LIMITATION, WARRANTIES THAT THE SOFTWARE IS FREE OF DEFECTS,
+ * MERCHANTABLE, FIT FOR A PARTICULAR PURPOSE, OR NON-INFRINGING.
+ * See the License for the specific provisions governing your rights and
+ * obligations concerning the Software.
+ *
+ * The Initial Developer of the Original Code is: Sun Microsystems, Inc.
+ *
+ * Copyright: 2000 by Sun Microsystems, Inc.
+ *
+ * All Rights Reserved.
+ *
+ * Contributor(s): _______________________________________
+ *
+ *
+ ************************************************************************/
+
+#ifndef _LANG_HXX //autogen wg. LANGUAGE_ENGLISH_US
+#include <tools/lang.hxx>
+#endif
+#ifndef _URLOBJ_HXX
+#include <tools/urlobj.hxx>
+#endif
+#ifndef _TOOLS_DEBUG_HXX
+#include <tools/debug.hxx>
+#endif
+#ifndef _FSYS_HXX
+#include <tools/fsys.hxx>
+#endif
+#ifndef _STRING_HXX
+#include <tools/string.hxx>
+#endif
+#ifndef _ISOLANG_HXX
+#include <tools/isolang.hxx>
+#endif
+#ifndef _STREAM_HXX
+#include <tools/stream.hxx>
+#endif
+#ifndef _SFXDOCFILE_HXX
+#include <sfx2/docfile.hxx>
+#endif
+#ifndef _OSL_MUTEX_HXX_
+#include <osl/mutex.hxx>
+#endif
+#ifndef _UNOTOOLS_PROCESSFACTORY_HXX_
+#include <unotools/processfactory.hxx>
+#endif
+#ifndef _UCBHELPER_CONTENT_HXX
+#include <ucbhelper/content.hxx>
+#endif
+
+#include <cppuhelper/factory.hxx> // helper for factories
+
+#ifndef _COM_SUN_STAR_LINGUISTIC2_XCONVERSIONDICTIONARY_HPP_
+#include <com/sun/star/linguistic2/XConversionDictionary.hpp>
+#endif
+#ifndef _COM_SUN_STAR_LINGUISTIC2_CONVERSIONDICTIONARYTYPE_HPP_
+#include <com/sun/star/linguistic2/ConversionDictionaryType.hpp>
+#endif
+#ifndef _COM_SUN_STAR_UTIL_XFLUSHABLE_HPP_
+#include <com/sun/star/util/XFlushable.hpp>
+#endif
+#ifndef _COM_SUN_STAR_LANG_LOCALE_HPP_
+#include <com/sun/star/lang/Locale.hpp>
+#endif
+#ifndef _COM_SUN_STAR_LANG_EVENTOBJECT_HPP_
+#include <com/sun/star/lang/EventObject.hpp>
+#endif
+#ifndef _COM_SUN_STAR_UNO_REFERENCE_HPP_
+#include <com/sun/star/uno/Reference.h>
+#endif
+#ifndef _COM_SUN_STAR_REGISTRY_XREGISTRYKEY_HPP_
+#include <com/sun/star/registry/XRegistryKey.hpp>
+#endif
+#ifndef _COM_SUN_STAR_UTIL_XFLUSHLISTENER_HPP_
+#include <com/sun/star/util/XFlushListener.hpp>
+#endif
+#ifndef _COM_SUN_STAR_IO_XACTIVEDATASOURCE_HPP_
+#include <com/sun/star/io/XActiveDataSource.hpp>
+#endif
+#ifndef _COM_SUN_STAR_DOCUMENT_XFILTER_HPP_
+#include <com/sun/star/document/XFilter.hpp>
+#endif
+#ifndef _COM_SUN_STAR_BEANS_PROPERTYVALUE_HPP_
+#include <com/sun/star/beans/PropertyValue.hpp>
+#endif
+
+#ifndef _XMLOFF_NMSPMAP_HXX
+#include <xmloff/nmspmap.hxx>
+#endif
+#ifndef _XMLOFF_XMLNMSPE_HXX
+#include <xmloff/xmlnmspe.hxx>
+#endif
+#ifndef _UTL_STREAM_WRAPPER_HXX_
+#include <unotools/streamwrap.hxx>
+#endif
+
+#include "convdic.hxx"
+#include "convdicxml.hxx"
+#include "misc.hxx"
+#include "defs.hxx"
+
+using namespace std;
+using namespace utl;
+using namespace osl;
+using namespace rtl;
+using namespace com::sun::star;
+using namespace com::sun::star::lang;
+using namespace com::sun::star::uno;
+using namespace com::sun::star::linguistic2;
+using namespace linguistic;
+
+#define XML_NAMESPACE_TCD_STRING "http://openoffice.org/2003/text-conversion-dictionary"
+#define CONV_TYPE_HANGUL_HANJA "Hangul / Hanja"
+//#define CONV_TYPE_SCHINESE_TCHINESE "Chinese simplified / Chinese traditional"
+
+///////////////////////////////////////////////////////////////////////////
+
+static const OUString ConversionTypeToText( sal_Int16 nConversionType )
+{
+ OUString aRes;
+ if (nConversionType == ConversionDictionaryType::HANGUL_HANJA)
+ aRes = A2OU( CONV_TYPE_HANGUL_HANJA );
+// else if (nConversionType == ConversionDictionaryType::SCHINESE_TCHINESE)
+// aRes = A2OU( CONV_TYPE_SCHINESE_TCHINESE );
+ return aRes;
+}
+
+static sal_Int16 GetConversionTypeFromText( const String &rText )
+{
+ sal_Int16 nRes = -1;
+ if (rText.EqualsAscii( CONV_TYPE_HANGUL_HANJA ))
+ nRes = ConversionDictionaryType::HANGUL_HANJA;
+// else if (rText.EqualsAscii( CONV_TYPE_SCHINESE_TCHINESE ))
+// nRes = ConversionDictionaryType::SCHINESE_TCHINESE;
+ return nRes;
+}
+
+///////////////////////////////////////////////////////////////////////////
+
+class ConvDicXMLImportContext :
+ public SvXMLImportContext
+{
+public:
+ ConvDicXMLImportContext(
+ ConvDicXMLImport &rImport,
+ sal_uInt16 nPrfx, const OUString& rLName ) :
+ SvXMLImportContext( rImport, nPrfx, rLName )
+ {
+ }
+
+ const ConvDicXMLImport & GetConvDicImport() const
+ {
+ return (const ConvDicXMLImport &) GetImport();
+ }
+
+ ConvDicXMLImport & GetConvDicImport()
+ {
+ return (ConvDicXMLImport &) GetImport();
+ }
+
+ // SvXMLImportContext
+ virtual void Characters( const OUString &rChars );
+ virtual SvXMLImportContext * CreateChildContext( sal_uInt16 nPrefix, const OUString& rLocalName, const uno::Reference< xml::sax::XAttributeList > &rxAttrList);
+};
+
+
+class ConvDicXMLDictionaryContext_Impl :
+ public ConvDicXMLImportContext
+{
+ INT16 nLanguage;
+ sal_Int16 nConversionType;
+
+public:
+ ConvDicXMLDictionaryContext_Impl( ConvDicXMLImport &rImport,
+ sal_uInt16 nPrefix, const OUString& rLName) :
+ ConvDicXMLImportContext( rImport, nPrefix, rLName )
+ {
+ nLanguage = LANGUAGE_NONE;
+ nConversionType = -1;
+ }
+
+ // SvXMLImportContext
+ virtual void StartElement( const ::com::sun::star::uno::Reference< ::com::sun::star::xml::sax::XAttributeList >& xAttrList );
+ virtual SvXMLImportContext * CreateChildContext( sal_uInt16 nPrefix, const OUString& rLocalName, const uno::Reference< xml::sax::XAttributeList > &rxAttrList );
+
+ INT16 GetLanguage() const { return nLanguage; }
+ sal_Int16 GetConversionType() const { return nConversionType; }
+};
+
+
+class ConvDicXMLEntryTextContext_Impl :
+ public ConvDicXMLImportContext
+{
+ OUString aLeftText;
+ ConvDicXMLDictionaryContext_Impl &rDicContext;
+
+public:
+ ConvDicXMLEntryTextContext_Impl(
+ ConvDicXMLImport &rImport,
+ sal_uInt16 nPrefix, const OUString& rLName,
+ ConvDicXMLDictionaryContext_Impl &rParentContext ) :
+ ConvDicXMLImportContext( rImport, nPrefix, rLName ),
+ rDicContext( rParentContext )
+ {
+ }
+
+ // SvXMLImportContext
+ virtual void StartElement( const ::com::sun::star::uno::Reference< ::com::sun::star::xml::sax::XAttributeList >& xAttrList );
+ virtual SvXMLImportContext * CreateChildContext( sal_uInt16 nPrefix, const OUString& rLocalName, const uno::Reference< xml::sax::XAttributeList > &rxAttrList );
+
+ const OUString & GetLeftText() const { return aLeftText; }
+};
+
+
+class ConvDicXMLRightTextContext_Impl :
+ public ConvDicXMLImportContext
+{
+ OUString aRightText;
+ ConvDicXMLEntryTextContext_Impl &rEntryContext;
+
+public:
+ ConvDicXMLRightTextContext_Impl(
+ ConvDicXMLImport &rImport,
+ sal_uInt16 nPrefix, const OUString& rLName,
+ ConvDicXMLEntryTextContext_Impl &rParentContext ) :
+ ConvDicXMLImportContext( rImport, nPrefix, rLName ),
+ rEntryContext( rParentContext )
+ {
+ }
+
+ // SvXMLImportContext
+ virtual void EndElement();
+ virtual SvXMLImportContext * CreateChildContext( sal_uInt16 nPrefix, const OUString& rLocalName, const uno::Reference< xml::sax::XAttributeList > &rxAttrList );
+ virtual void Characters( const OUString &rChars );
+
+ const OUString & GetRightText() const { return aRightText; }
+ const OUString & GetLeftText() const { return rEntryContext.GetLeftText(); }
+ ConvDic * GetDic() { return GetConvDicImport().GetDic(); }
+};
+
+///////////////////////////////////////////////////////////////////////////
+
+void ConvDicXMLImportContext::Characters(const OUString &rChars)
+{
+ /*
+ Whitespace occurring within the content of token elements is "trimmed"
+ from the ends (i.e. all whitespace at the beginning and end of the
+ content is removed), and "collapsed" internally (i.e. each sequence of
+ 1 or more whitespace characters is replaced with one blank character).
+ */
+ //collapsing not done yet!
+ const OUString &rChars2 = rChars.trim();
+}
+
+SvXMLImportContext * ConvDicXMLImportContext::CreateChildContext(
+ sal_uInt16 nPrefix, const OUString& rLocalName,
+ const uno::Reference< xml::sax::XAttributeList > &rxAttrList )
+{
+ SvXMLImportContext *pContext = 0;
+ if (nPrefix == XML_NAMESPACE_TCD && rLocalName.equalsAscii( "text-conversion-dictionary" ))
+ pContext = new ConvDicXMLDictionaryContext_Impl( GetConvDicImport(), nPrefix, rLocalName );
+ else
+ pContext = new SvXMLImportContext( GetImport(), nPrefix, rLocalName );
+ return pContext;
+}
+
+////////////////////////////////////////
+
+void ConvDicXMLDictionaryContext_Impl::StartElement(
+ const Reference< xml::sax::XAttributeList >& rxAttrList )
+{
+ sal_Int16 nAttrCount = rxAttrList.is() ? rxAttrList->getLength() : 0;
+ for (sal_Int16 i = 0; i < nAttrCount; ++i)
+ {
+ OUString aAttrName = rxAttrList->getNameByIndex(i);
+ OUString aLocalName;
+ sal_uInt16 nPrefix = GetImport().GetNamespaceMap().
+ GetKeyByAttrName( aAttrName, &aLocalName );
+ OUString aValue = rxAttrList->getValueByIndex(i);
+
+ if (nPrefix == XML_NAMESPACE_TCD && aLocalName.equalsAscii( "lang" ))
+ nLanguage = ConvertIsoStringToLanguage( aValue );
+ else if (nPrefix == XML_NAMESPACE_TCD && aLocalName.equalsAscii( "conversion-type" ))
+ nConversionType = GetConversionTypeFromText( aValue );
+ }
+ GetConvDicImport().SetLanguage( nLanguage );
+ GetConvDicImport().SetConversionType( nConversionType );
+
+ //!! hack to stop the parser from reading the rest of the file !!
+ //!! when only the header (language, conversion type) is needed !!
+// if (GetConvDicImport().GetDic() == 0)
+// throw uno::RuntimeException();
+}
+
+SvXMLImportContext * ConvDicXMLDictionaryContext_Impl::CreateChildContext(
+ sal_uInt16 nPrefix, const OUString& rLocalName,
+ const uno::Reference< xml::sax::XAttributeList > &rxAttrList )
+{
+ SvXMLImportContext *pContext = 0;
+ if (nPrefix == XML_NAMESPACE_TCD && rLocalName.equalsAscii( "entry" ))
+ pContext = new ConvDicXMLEntryTextContext_Impl( GetConvDicImport(), nPrefix, rLocalName, *this );
+ else
+ pContext = new SvXMLImportContext( GetImport(), nPrefix, rLocalName );
+ return pContext;
+}
+
+////////////////////////////////////////
+
+SvXMLImportContext * ConvDicXMLEntryTextContext_Impl::CreateChildContext(
+ sal_uInt16 nPrefix, const OUString& rLocalName,
+ const uno::Reference< xml::sax::XAttributeList > &rxAttrList )
+{
+ SvXMLImportContext *pContext = 0;
+ if (nPrefix == XML_NAMESPACE_TCD && rLocalName.equalsAscii( "right-text" ))
+ pContext = new ConvDicXMLRightTextContext_Impl( GetConvDicImport(), nPrefix, rLocalName, *this );
+ else
+ pContext = new SvXMLImportContext( GetImport(), nPrefix, rLocalName );
+ return pContext;
+}
+
+void ConvDicXMLEntryTextContext_Impl::StartElement(
+ const Reference< xml::sax::XAttributeList >& rxAttrList )
+{
+ sal_Int16 nAttrCount = rxAttrList.is() ? rxAttrList->getLength() : 0;
+ for (sal_Int16 i = 0; i < nAttrCount; ++i)
+ {
+ OUString aAttrName = rxAttrList->getNameByIndex(i);
+ OUString aLocalName;
+ sal_uInt16 nPrefix = GetImport().GetNamespaceMap().
+ GetKeyByAttrName( aAttrName, &aLocalName );
+ OUString aValue = rxAttrList->getValueByIndex(i);
+
+ if (nPrefix == XML_NAMESPACE_TCD && aLocalName.equalsAscii( "left-text" ))
+ aLeftText = aValue;
+ }
+}
+
+////////////////////////////////////////
+
+SvXMLImportContext * ConvDicXMLRightTextContext_Impl::CreateChildContext(
+ sal_uInt16 nPrefix, const OUString& rLocalName,
+ const uno::Reference< xml::sax::XAttributeList > &rxAttrList )
+{
+ // leaf: return default (empty) context
+ SvXMLImportContext *pContext = new SvXMLImportContext( GetImport(), nPrefix, rLocalName );
+ return pContext;
+}
+
+void ConvDicXMLRightTextContext_Impl::Characters( const OUString &rChars )
+{
+ aRightText += rChars;
+}
+
+void ConvDicXMLRightTextContext_Impl::EndElement()
+{
+ ConvDic *pDic = GetDic();
+ if (pDic)
+ pDic->AddEntry( GetLeftText(), GetRightText() );
+}
+
+
+///////////////////////////////////////////////////////////////////////////
+
+sal_Bool ConvDicXMLExport::Export( SfxMedium &rMedium )
+{
+ sal_Bool bRet = sal_False;
+
+ Reference< document::XExporter > xExporter( this );
+ Reference< document::XFilter > xFilter( xExporter, UNO_QUERY );
+ uno::Sequence< beans::PropertyValue > aProps(0);
+ xFilter->filter( aProps ); // calls exportDoc implicitly
+
+ return bRet = bSuccess;
+}
+
+
+sal_uInt32 ConvDicXMLExport::exportDoc( enum ::xmloff::token::XMLTokenEnum eClass )
+{
+ _GetNamespaceMap().Add( A2OU( "tcd" ),
+ A2OU( XML_NAMESPACE_TCD_STRING ), XML_NAMESPACE_TCD );
+
+ GetDocHandler()->startDocument();
+
+ // Add xmlns line and some other arguments
+ AddAttribute( _GetNamespaceMap().GetAttrNameByKey( XML_NAMESPACE_TCD ),
+ _GetNamespaceMap().GetNameByKey( XML_NAMESPACE_TCD ) );
+ AddAttributeASCII( XML_NAMESPACE_TCD, "package", "org.openoffice.Office" );
+
+ OUString aIsoLang( ConvertLanguageToIsoString( rDic.nLanguage ) );
+ AddAttribute( XML_NAMESPACE_TCD, "lang", aIsoLang );
+ OUString aConvType( ConversionTypeToText( rDic.nConversionType ) );
+ AddAttribute( XML_NAMESPACE_TCD, "conversion-type", aConvType );
+
+ //!! block necessary in order to have SvXMLElementExport d-tor called
+ //!! before the call to endDocument
+ {
+ SvXMLElementExport aRoot( *this, XML_NAMESPACE_TCD, "text-conversion-dictionary", sal_True, sal_True );
+ _ExportContent();
+ }
+
+ GetDocHandler()->endDocument();
+
+ bSuccess = sal_True;
+ return 0;
+}
+
+
+void ConvDicXMLExport::_ExportContent()
+{
+ // aquire sorted list of all keys
+ ConvMapKeySet aKeySet;
+ ConvMap::iterator aIt;
+ for (aIt = rDic.aFromLeft.begin(); aIt != rDic.aFromLeft.end(); ++aIt)
+ aKeySet.insert( (*aIt).first );
+#ifdef DEBUG
+ size_t nSz = aKeySet.size();
+#endif
+
+ ConvMapKeySet::iterator aKeyIt;
+ for (aKeyIt = aKeySet.begin(); aKeyIt != aKeySet.end(); ++aKeyIt)
+ {
+ OUString aLeftText( *aKeyIt );
+ AddAttribute( XML_NAMESPACE_TCD, "left-text", aLeftText );
+ SvXMLElementExport aEntryMain( *this, XML_NAMESPACE_TCD,
+ "entry" , sal_True, sal_True );
+
+ pair< ConvMap::iterator, ConvMap::iterator > aRange =
+ rDic.aFromLeft.equal_range( *aKeyIt );
+ for (aIt = aRange.first; aIt != aRange.second; ++aIt)
+ {
+ DBG_ASSERT( *aKeyIt == (*aIt).first, "key <-> entry mismatch" );
+ OUString aRightText( (*aIt).second );
+ SvXMLElementExport aEntryRightText( *this, XML_NAMESPACE_TCD,
+ "right-text" , sal_True, sal_False );
+ Characters( aRightText );
+ }
+ }
+}
+
+::rtl::OUString SAL_CALL ConvDicXMLExport::getImplementationName()
+ throw( uno::RuntimeException )
+{
+ return A2OU( "com.sun.star.lingu2.ConvDicXMLExport" );
+}
+
+///////////////////////////////////////////////////////////////////////////
+
+void SAL_CALL ConvDicXMLImport::startDocument(void)
+ throw( xml::sax::SAXException, uno::RuntimeException )
+{
+ // register namespace at first possible opportunity
+ GetNamespaceMap().Add( A2OU( "tcd" ),
+ A2OU( XML_NAMESPACE_TCD_STRING ), XML_NAMESPACE_TCD );
+ SvXMLImport::startDocument();
+}
+
+void SAL_CALL ConvDicXMLImport::endDocument(void)
+ throw( xml::sax::SAXException, uno::RuntimeException )
+{
+ SvXMLImport::endDocument();
+}
+
+SvXMLImportContext * ConvDicXMLImport::CreateContext(
+ sal_uInt16 nPrefix,
+ const rtl::OUString &rLocalName,
+ const com::sun::star::uno::Reference < com::sun::star::xml::sax::XAttributeList > &rxAttrList )
+{
+ SvXMLImportContext *pContext = 0;
+ if (nPrefix == XML_NAMESPACE_TCD && rLocalName.equalsAscii( "text-conversion-dictionary" ))
+ pContext = new ConvDicXMLDictionaryContext_Impl( *this, nPrefix, rLocalName );
+ else
+ pContext = new SvXMLImportContext( *this, nPrefix, rLocalName );
+ return pContext;
+}
+
+
+OUString SAL_CALL ConvDicXMLImport::getImplementationName()
+ throw( uno::RuntimeException )
+{
+ return A2OU( "com.sun.star.lingu2.ConvDicXMLImport" );
+}
+
+///////////////////////////////////////////////////////////////////////////
+