/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
 * This file is part of the LibreOffice project.
 *
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
 *
 * This file incorporates work covered by the following license notice:
 *
 *   Licensed to the Apache Software Foundation (ASF) under one or more
 *   contributor license agreements. See the NOTICE file distributed
 *   with this work for additional information regarding copyright
 *   ownership. The ASF licenses this file to you under the Apache
 *   License, Version 2.0 (the "License"); you may not use this file
 *   except in compliance with the License. You may obtain a copy of
 *   the License at http://www.apache.org/licenses/LICENSE-2.0 .
 */

// NOTE(review): the targets of the angle-bracket includes were not visible in
// the reviewed text (they appeared as bare "#include"). The <...> names below
// are reconstructed; verify them against the repository before merging.
#include "HtmlReader.hxx"
#include <connectivity/dbconversion.hxx>
#include <connectivity/dbtools.hxx>
#include <tools/stream.hxx>
#include <tools/tenccvt.hxx>
#include <comphelper/extract.hxx>
#include <comphelper/string.hxx>
#include "strings.hrc"
#include "stringconstants.hxx"
#include <sfx2/sfxhtml.hxx>
#include <osl/diagnose.h>
#include "core_resource.hxx"
#include <com/sun/star/sdbcx/XDataDescriptorFactory.hpp>
#include <com/sun/star/sdbcx/XColumnsSupplier.hpp>
#include <com/sun/star/sdbcx/XAppend.hpp>
#include <com/sun/star/sdbc/DataType.hpp>
#include <com/sun/star/sdbc/ColumnValue.hpp>
#include <com/sun/star/awt/FontDescriptor.hpp>
#include <com/sun/star/awt/FontWeight.hpp>
#include <com/sun/star/awt/FontStrikeout.hpp>
#include <com/sun/star/awt/FontSlant.hpp>
#include <com/sun/star/awt/FontUnderline.hpp>
#include <com/sun/star/util/NumberFormat.hpp>
#include <com/sun/star/util/XNumberFormatTypes.hpp>
#include <svtools/htmltokn.h>
#include <svtools/htmlkywd.hxx>
#include <tools/color.hxx>
#include "WCopyTable.hxx"
#include "WExtendPages.hxx"
#include "WNameMatch.hxx"
#include "WColumnSelect.hxx"
#include "QEnumTypes.hxx"
#include "WCPage.hxx"
#include <rtl/tencinfo.h>
#include "core_resource.hxx"
#include "UITools.hxx"
#include <vcl/svapp.hxx>
#include <vcl/settings.hxx>

using namespace dbaui;
using namespace ::com::sun::star::uno;
using namespace ::com::sun::star::beans;
using namespace ::com::sun::star::container;
using namespace ::com::sun::star::sdbc;
using namespace ::com::sun::star::sdbcx;
using namespace ::com::sun::star::awt;

#define DBAUI_HTML_FONTSIZES 8      // like export, HTML-Options

// OHTMLReader

/** Constructs a reader that is given a database connection.

    NextToken() takes its table-creating / row-inserting branch whenever
    m_xConnection is set, which is the case for readers built through this
    constructor (assuming the base class stores the connection passed here).
 */
OHTMLReader::OHTMLReader(SvStream& rIn,
                         const SharedConnection& _rxConnection,
                         const Reference< css::util::XNumberFormatter >& _rxNumberF,
                         const css::uno::Reference< css::uno::XComponentContext >& _rxContext)
    : HTMLParser(rIn)
    , ODatabaseExport( _rxConnection, _rxNumberF, _rxContext, rIn )
    , m_nTableCount(0)
    , m_nColumnWidth(87)
{
    SetSrcEncoding( GetExtendedCompatibilityTextEncoding( RTL_TEXTENCODING_ISO_8859_1 ) );
    // If the file starts with a BOM, switch to UCS2.
    SetSwitchToUCS2( true );
}

/** Constructs a reader without a connection.

    Readers built this way use the "type checking" branch of NextToken(),
    which inspects at most nRows rows (m_nRows is counted down there).
 */
OHTMLReader::OHTMLReader(SvStream& rIn,
                         sal_Int32 nRows,
                         const TPositions &_rColumnPositions,
                         const Reference< css::util::XNumberFormatter >& _rxNumberF,
                         const css::uno::Reference< css::uno::XComponentContext >& _rxContext,
                         const TColumnVector* pList,
                         const OTypeInfoMap* _pInfoMap,
                         bool _bAutoIncrementEnabled)
    : HTMLParser(rIn)
    , ODatabaseExport( nRows, _rColumnPositions, _rxNumberF, _rxContext, pList, _pInfoMap, _bAutoIncrementEnabled, rIn )
    , m_nTableCount(0)
    , m_nColumnWidth(87)
{
    SetSrcEncoding( GetExtendedCompatibilityTextEncoding( RTL_TEXTENCODING_ISO_8859_1 ) );
    // If the file starts with a BOM, switch to UCS2.
    SetSwitchToUCS2( true );
}

OHTMLReader::~OHTMLReader()
{
}

/** Rewinds the input stream, runs the HTML parser and applies the column types.

    @return the parser state reported by HTMLParser::CallParser(), or
            SvParserState::Error when no table was found (m_bFoundTable is false).
 */
SvParserState OHTMLReader::CallParser()
{
    rInput.Seek(STREAM_SEEK_TO_BEGIN);
    rInput.ResetError();
    SvParserState eParseState = HTMLParser::CallParser();
    SetColumnTypes(m_pColumnList,m_pInfoMap);
    return m_bFoundTable ? eParseState : SvParserState::Error;
}

/** Processes a single token delivered by the parser.

    With a connection, table tokens create the table (via CreateTable()) and
    cell/row tokens write values through m_pUpdateHelper. Without a connection
    the cell contents are only passed to adjustFormat().

    @param nToken  the token to handle
 */
void OHTMLReader::NextToken( HtmlTokenId nToken )
{
    if(m_bError || !m_nRows) // if there is an error or no more rows to check, return immediately
        return;

    if ( nToken == HtmlTokenId::META )
        setTextEncoding();

    if(m_xConnection.is())    // names, which CTOR was called and hence, if a table should be created
    {
        switch(nToken)
        {
            case HtmlTokenId::TABLE_ON:
                ++m_nTableCount;
                {   // can also be TD or TH, if there was no TABLE before
                    const HTMLOptions& rHtmlOptions = GetOptions();
                    for (const auto & rOption : rHtmlOptions)
                    {
                        if( rOption.GetToken() == HtmlOptionId::WIDTH )
                        {   // percentage: of document width respectively outer cell
                            m_nColumnWidth = GetWidthPixel( rOption );
                        }
                    }
                }
                SAL_FALLTHROUGH;
            case HtmlTokenId::THEAD_ON:
            case HtmlTokenId::TBODY_ON:
                {
                    sal_uInt64 const nTell = rInput.Tell(); // perhaps alters position of the stream
                    if ( !m_xTable.is() )
                    {   // use first line as header
                        m_bError = !CreateTable(nToken);
                        // the first line is data as well: rewind so it gets parsed again
                        if ( m_bAppendFirstLine )
                            rInput.Seek(nTell);
                    }
                }
                break;
            case HtmlTokenId::TABLE_OFF:
                if(!--m_nTableCount)
                {
                    m_xTable = nullptr;
                }
                break;
            case HtmlTokenId::TABLEROW_ON:
                if ( m_pUpdateHelper )
                {
                    try
                    {
                        m_pUpdateHelper->moveToInsertRow(); // otherwise append new line
                    }
                    catch(SQLException& e)
                    // handling update failure
                    {
                        showErrorDialog(e);
                    }
                }
                else
                    m_bError = true;
                break;
            case HtmlTokenId::TEXTTOKEN:
            case HtmlTokenId::SINGLECHAR:
                if ( m_bInTbl ) //&& !m_bSDNum ) // important, as otherwise we also get the names of the fonts
                    m_sTextToken += aToken;
                break;
            case HtmlTokenId::PARABREAK_OFF:
                m_sCurrent += m_sTextToken;
                break;
            case HtmlTokenId::PARABREAK_ON:
                m_sTextToken.clear();
                break;
            case HtmlTokenId::TABLEDATA_ON:
                fetchOptions();
                break;
            case HtmlTokenId::TABLEDATA_OFF:
                {
                    if ( !m_sCurrent.isEmpty() )
                        m_sTextToken = m_sCurrent;
                    try
                    {
                        insertValueIntoColumn();
                    }
                    catch(SQLException& e)
                    // handling update failure
                    {
                        showErrorDialog(e);
                    }
                    m_sCurrent.clear();
                    m_nColumnPos++;
                    eraseTokens();
                    m_bInTbl = false;
                }
                break;
            case HtmlTokenId::TABLEROW_OFF:
                if ( !m_pUpdateHelper )
                {
                    m_bError = true;
                    break;
                }
                try
                {
                    m_nRowCount++;
                    if (m_bIsAutoIncrement) // if bSetAutoIncrement then I have to set the autoincrement
                        m_pUpdateHelper->updateInt(1,m_nRowCount);
                    m_pUpdateHelper->insertRow();
                }
                catch(SQLException& e)
                // handling update failure
                {
                    showErrorDialog(e);
                }
                m_nColumnPos = 0;
                break;
            default: break;
        }
    }
    else // branch only valid for type checking
    {
        switch(nToken)
        {
            case HtmlTokenId::THEAD_ON:
            case HtmlTokenId::TBODY_ON:
                // The head of the column is not included
                if(m_bHead)
                {
                    // Skip everything up to the end of the header row. Also stop
                    // once the parser is no longer working (e.g. end of input),
                    // so that a document without a closing row tag cannot spin
                    // here forever.
                    while ( GetNextToken() != HtmlTokenId::TABLEROW_OFF && IsParserWorking() )
                    {
                    }
                    m_bHead = false;
                }
                break;
            case HtmlTokenId::TABLEDATA_ON:
            case HtmlTokenId::TABLEHEADER_ON:
                fetchOptions();
                break;
            case HtmlTokenId::TEXTTOKEN:
            case HtmlTokenId::SINGLECHAR:
                if ( m_bInTbl ) // && !m_bSDNum ) // important, as otherwise we also get the names of the fonts
                    m_sTextToken += aToken;
                break;
            case HtmlTokenId::PARABREAK_OFF:
                m_sCurrent += m_sTextToken;
                break;
            case HtmlTokenId::PARABREAK_ON:
                m_sTextToken.clear();
                break;
            case HtmlTokenId::TABLEDATA_OFF:
                if ( !m_sCurrent.isEmpty() )
                    m_sTextToken = m_sCurrent;
                adjustFormat();
                m_nColumnPos++;
                m_bInTbl = false;
                m_sCurrent.clear();
                break;
            case HtmlTokenId::TABLEROW_OFF:
                if ( !m_sCurrent.isEmpty() )
                    m_sTextToken = m_sCurrent;
                adjustFormat();
                m_nColumnPos = 0;
                m_nRows--;
                m_sCurrent.clear();
                break;
            default: break;
        }
    }
}

/** Marks the parser as being inside a table cell and stores the SDVAL and
    SDNUM options of the current tag in m_sValToken and m_sNumToken.
 */
void OHTMLReader::fetchOptions()
{
    m_bInTbl = true;
    const HTMLOptions& options = GetOptions();
    for (const auto & rOption : options)
    {
        switch( rOption.GetToken() )
        {
            case HtmlOptionId::SDVAL:
                m_sValToken = rOption.GetString();
                break;
            case HtmlOptionId::SDNUM:
                m_sNumToken = rOption.GetString();
                break;
            default: break;
        }
    }
}

/** Evaluates the ALIGN option of the current tag.

    @param eVal  receives the horizontal justification; it is only written
                 when the tag carries an ALIGN option (unknown values yield
                 SvxCellHorJustify::Standard).
 */
void OHTMLReader::TableDataOn(SvxCellHorJustify& eVal)
{
    const HTMLOptions& rHtmlOptions = GetOptions();
    for (const auto & rOption : rHtmlOptions)
    {
        switch( rOption.GetToken() )
        {
            case HtmlOptionId::ALIGN:
            {
                const OUString& rOptVal = rOption.GetString();
                if (rOptVal.equalsIgnoreAsciiCase( OOO_STRING_SVTOOLS_HTML_AL_right ))
                    eVal = SvxCellHorJustify::Right;
                else if (rOptVal.equalsIgnoreAsciiCase( OOO_STRING_SVTOOLS_HTML_AL_center ))
                    eVal = SvxCellHorJustify::Center;
                else if (rOptVal.equalsIgnoreAsciiCase( OOO_STRING_SVTOOLS_HTML_AL_left ))
                    eVal = SvxCellHorJustify::Left;
                else
                    eVal = SvxCellHorJustify::Standard;
            }
            break;
            default: break;
        }
    }
}

/** Evaluates the COLOR, FACE and SIZE options of the current tag.

    @param _rFont       font descriptor whose Name / Height are updated
    @param _rTextColor  receives the RGB value of a COLOR option
 */
void OHTMLReader::TableFontOn(FontDescriptor& _rFont,sal_Int32 &_rTextColor)
{
    const HTMLOptions& rHtmlOptions = GetOptions();
    for (const auto & rOption : rHtmlOptions)
    {
        switch( rOption.GetToken() )
        {
        case HtmlOptionId::COLOR:
            {
                Color aColor;
                rOption.GetColor( aColor );
                _rTextColor = aColor.GetRGBColor();
            }
            break;
        case HtmlOptionId::FACE :
            {
                const OUString& rFace = rOption.GetString();
                OUString aFontName;
                sal_Int32 nPos = 0;
                while( nPos != -1 )
                {
                    // list of fonts, VCL: semicolon as separator, HTML: comma
                    OUString aFName = rFace.getToken( 0, ',', nPos );
                    aFName = comphelper::string::strip(aFName, ' ');
                    if( !aFontName.isEmpty() )
                        aFontName += ";";
                    aFontName += aFName;
                }
                if ( !aFontName.isEmpty() )
                    _rFont.Name = aFontName;
            }
            break;
        case HtmlOptionId::SIZE :
            {
                sal_Int16 nSize = static_cast<sal_Int16>(rOption.GetNumber());
                // NOTE(review): 0 becomes 1 while every other value below
                // DBAUI_HTML_FONTSIZES is raised to it; an upper clamp ('>')
                // may have been intended - confirm before changing.
                if ( nSize == 0 )
                    nSize = 1;
                else if ( nSize < DBAUI_HTML_FONTSIZES )
                    nSize = DBAUI_HTML_FONTSIZES;

                _rFont.Height = nSize;
            }
            break;
        default: break;
        }
    }
}

/** Converts the value of a WIDTH option.

    @param rOption  the WIDTH option
    @return for a value containing '%', that percentage of m_nColumnWidth;
            for a value containing '*', 0; otherwise the numeric value itself.
 */
sal_Int16 OHTMLReader::GetWidthPixel( const HTMLOption& rOption )
{
    const OUString& rOptVal = rOption.GetString();
    if ( rOptVal.indexOf('%') != -1 )
    {   // percentage
        OSL_ENSURE( m_nColumnWidth, "WIDTH Option: m_nColumnWidth==0 and Width%" );
        return static_cast<sal_Int16>((rOption.GetNumber() * m_nColumnWidth) / 100);
    }
    else
    {
        if ( rOptVal.indexOf('*') != -1 )
        {   // relative to what?!?
            //TODO: collect ColArray of all relevant values and then MakeCol
            return 0;
        }
        else
            return static_cast<sal_Int16>(rOption.GetNumber());  // pixel
    }
}

/** Reads the first table row and creates one default column per cell.

    Tokens are consumed up to the first TABLEROW_OFF (or until the parser
    stops working). Cell texts become the column names unless
    m_bAppendFirstLine is set; a caption/title becomes the basis of the
    proposed table name.

    @param nToken  the token that triggered the call
    @return false when no column was found; true when only checking is
            enabled (isCheckEnabled()); otherwise whether the wizard did not
            report failure and m_xTable is set afterwards.
 */
bool OHTMLReader::CreateTable(HtmlTokenId nToken)
{
    OUString aTempName(DBA_RES(STR_TBL_TITLE));
    aTempName = aTempName.getToken(0,' ');
    aTempName = ::dbtools::createUniqueName(m_xTables, aTempName);

    bool bCaption = false;
    bool bTableHeader = false;
    OUString aColumnName;
    SvxCellHorJustify eVal = SvxCellHorJustify::Standard;

    OUString aTableName;
    FontDescriptor aFont = VCLUnoHelper::CreateFontDescriptor(Application::GetSettings().GetStyleSettings().GetAppFont());
    sal_Int32 nTextColor = 0;
    do
    {
        switch (nToken)
        {
            case HtmlTokenId::TEXTTOKEN:
            case HtmlTokenId::SINGLECHAR:
                if(bTableHeader)
                    aColumnName += aToken;
                if(bCaption)
                    aTableName += aToken;
                break;
            case HtmlTokenId::PARABREAK_OFF:
                m_sCurrent += aColumnName;
                break;
            case HtmlTokenId::PARABREAK_ON:
                m_sTextToken.clear();
                break;
            case HtmlTokenId::TABLEDATA_ON:
            case HtmlTokenId::TABLEHEADER_ON:
                TableDataOn(eVal);
                bTableHeader = true;
                break;
            case HtmlTokenId::TABLEDATA_OFF:
            case HtmlTokenId::TABLEHEADER_OFF:
                {
                    aColumnName = comphelper::string::strip(aColumnName, ' ' );
                    if (aColumnName.isEmpty() || m_bAppendFirstLine )
                        aColumnName = DBA_RES(STR_COLUMN_NAME);
                    else if ( !m_sCurrent.isEmpty() )
                        aColumnName = m_sCurrent;

                    aColumnName = comphelper::string::strip(aColumnName, ' ');
                    CreateDefaultColumn(aColumnName);
                    aColumnName.clear();
                    m_sCurrent.clear();

                    eVal = SvxCellHorJustify::Standard;
                    bTableHeader = false;
                }
                break;

            case HtmlTokenId::TITLE_ON:
            case HtmlTokenId::CAPTION_ON:
                bCaption = true;
                break;
            case HtmlTokenId::TITLE_OFF:
            case HtmlTokenId::CAPTION_OFF:
                aTableName = comphelper::string::strip(aTableName, ' ');
                // Use the caption as base of the table name when there is one;
                // fall back to the generated default name otherwise.
                if(aTableName.isEmpty())
                    aTableName = aTempName;
                else
                    aTableName = ::dbtools::createUniqueName(m_xTables, aTableName);
                bCaption = false;
                break;
            case HtmlTokenId::FONT_ON:
                TableFontOn(aFont,nTextColor);
                break;
            case HtmlTokenId::BOLD_ON:
                aFont.Weight = css::awt::FontWeight::BOLD;
                break;
            case HtmlTokenId::ITALIC_ON:
                aFont.Slant = css::awt::FontSlant_ITALIC;
                break;
            case HtmlTokenId::UNDERLINE_ON:
                aFont.Underline = css::awt::FontUnderline::SINGLE;
                break;
            case HtmlTokenId::STRIKE_ON:
                aFont.Strikeout = css::awt::FontStrikeout::SINGLE;
                break;
            default: break;
        }
        nToken = GetNextToken();
    }
    // Also leave the loop when the parser stopped working (e.g. end of input),
    // so that a row without a closing tag cannot loop endlessly.
    while (nToken != HtmlTokenId::TABLEROW_OFF && IsParserWorking());

    // a pending cell that was not closed before the row ended
    if ( !m_sCurrent.isEmpty() )
        aColumnName = m_sCurrent;
    aColumnName = comphelper::string::strip(aColumnName, ' ');
    if(!aColumnName.isEmpty())
        CreateDefaultColumn(aColumnName);

    if ( m_vDestVector.empty() )
        return false;

    if(aTableName.isEmpty())
        aTableName = aTempName;

    m_bInTbl        = false;
    m_bFoundTable   = true;

    if ( isCheckEnabled() )
        return true;

    return !executeWizard(aTableName,makeAny(nTextColor),aFont) && m_xTable.is();
}

/** Evaluates the options of a META tag via ParseMetaOptions(). */
void OHTMLReader::setTextEncoding()
{
    ParseMetaOptions(nullptr, nullptr);
}

/** Releases one reference on this reader (forwards to ReleaseRef()). */
void OHTMLReader::release()
{
    ReleaseRef();
}

/** Returns the factory used to create the type selection page of the wizard. */
TypeSelectionPageFactory OHTMLReader::getTypeSelectionPageFactory()
{
    return &OWizHTMLExtend::Create;
}

/* vim:set shiftwidth=4 softtabstop=4 expandtab: */