Change-Id: I7ec4c946be52a6b56aee908426f95ecacc7b0746 Reviewed-on: https://gerrit.libreoffice.org/36072 Tested-by: Jenkins <ci@libreoffice.org> Reviewed-by: Noel Grandin <noel.grandin@collabora.co.uk>
528 lines
17 KiB
C++
528 lines
17 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
#include "HtmlReader.hxx"
|
|
#include <connectivity/dbconversion.hxx>
|
|
#include <connectivity/dbtools.hxx>
|
|
#include <toolkit/helper/vclunohelper.hxx>
|
|
#include <tools/stream.hxx>
|
|
#include <tools/tenccvt.hxx>
|
|
#include <comphelper/extract.hxx>
|
|
#include <comphelper/string.hxx>
|
|
#include "dbu_misc.hrc"
|
|
#include "dbustrings.hrc"
|
|
#include <sfx2/sfxhtml.hxx>
|
|
#include <osl/diagnose.h>
|
|
#include "moduledbu.hxx"
|
|
#include <com/sun/star/sdbcx/XDataDescriptorFactory.hpp>
|
|
#include <com/sun/star/sdbcx/XColumnsSupplier.hpp>
|
|
#include <com/sun/star/sdbcx/XAppend.hpp>
|
|
#include <com/sun/star/sdbc/DataType.hpp>
|
|
#include <com/sun/star/sdbc/ColumnValue.hpp>
|
|
#include <com/sun/star/awt/FontDescriptor.hpp>
|
|
#include <com/sun/star/awt/FontWeight.hpp>
|
|
#include <com/sun/star/awt/FontStrikeout.hpp>
|
|
#include <com/sun/star/awt/FontSlant.hpp>
|
|
#include <com/sun/star/awt/FontUnderline.hpp>
|
|
#include <com/sun/star/util/NumberFormat.hpp>
|
|
#include <com/sun/star/util/XNumberFormatTypes.hpp>
|
|
#include <svtools/htmltokn.h>
|
|
#include <svtools/htmlkywd.hxx>
|
|
#include <tools/color.hxx>
|
|
#include "WCopyTable.hxx"
|
|
#include "WExtendPages.hxx"
|
|
#include "WNameMatch.hxx"
|
|
#include "WColumnSelect.hxx"
|
|
#include "QEnumTypes.hxx"
|
|
#include "WCPage.hxx"
|
|
#include <rtl/tencinfo.h>
|
|
#include "UITools.hxx"
|
|
#include <vcl/svapp.hxx>
|
|
#include <vcl/settings.hxx>
|
|
|
|
using namespace dbaui;
|
|
using namespace ::com::sun::star::uno;
|
|
using namespace ::com::sun::star::beans;
|
|
using namespace ::com::sun::star::container;
|
|
using namespace ::com::sun::star::sdbc;
|
|
using namespace ::com::sun::star::sdbcx;
|
|
using namespace ::com::sun::star::awt;
|
|
|
|
// Font size threshold that OHTMLReader::TableFontOn() compares the SIZE option of a FONT tag against.
#define DBAUI_HTML_FONTSIZES 8 // like export, HTML-Options
|
|
|
|
// OHTMLReader
|
|
/** Creates a reader that is bound to a database connection.
 *
 *  NextToken() uses the presence of the connection to decide that a table
 *  has to be created and filled (as opposed to pure type checking).
 *
 *  @param rIn            stream containing the HTML to parse
 *  @param _rxConnection  connection handed on to ODatabaseExport
 *  @param _rxNumberF     number formatter handed on to ODatabaseExport
 *  @param _rxContext     component context handed on to ODatabaseExport
 */
OHTMLReader::OHTMLReader(SvStream& rIn,
                         const SharedConnection& _rxConnection,
                         const Reference< css::util::XNumberFormatter >& _rxNumberF,
                         const css::uno::Reference< css::uno::XComponentContext >& _rxContext)
    : HTMLParser(rIn)
    , ODatabaseExport( _rxConnection, _rxNumberF, _rxContext, rIn )
    , m_nTableCount(0)
    , m_nWidth(0)
    , m_nColumnWidth(87)
    , m_bMetaOptions(false)
    , m_bSDNum(false)
{
    // start out with the extended-compatibility flavour of ISO-8859-1
    const rtl_TextEncoding eInitialEncoding
        = GetExtendedCompatibilityTextEncoding( RTL_TEXTENCODING_ISO_8859_1 );
    SetSrcEncoding( eInitialEncoding );

    // If the file starts with a BOM, switch to UCS2.
    SetSwitchToUCS2( true );
}
|
|
|
|
/** Creates a reader without a database connection.
 *
 *  Without a connection NextToken() runs its "type checking" branch only,
 *  inspecting at most nRows rows.
 *
 *  @param rIn                     stream containing the HTML to parse
 *  @param nRows                   row budget handed on to ODatabaseExport
 *  @param _rColumnPositions       column positions handed on to ODatabaseExport
 *  @param _rxNumberF              number formatter handed on to ODatabaseExport
 *  @param _rxContext              component context handed on to ODatabaseExport
 *  @param pList                   column list handed on to ODatabaseExport
 *  @param _pInfoMap               type info map handed on to ODatabaseExport
 *  @param _bAutoIncrementEnabled  auto-increment flag handed on to ODatabaseExport
 */
OHTMLReader::OHTMLReader(SvStream& rIn,
                         sal_Int32 nRows,
                         const TPositions &_rColumnPositions,
                         const Reference< css::util::XNumberFormatter >& _rxNumberF,
                         const css::uno::Reference< css::uno::XComponentContext >& _rxContext,
                         const TColumnVector* pList,
                         const OTypeInfoMap* _pInfoMap,
                         bool _bAutoIncrementEnabled)
    : HTMLParser(rIn)
    , ODatabaseExport( nRows, _rColumnPositions, _rxNumberF, _rxContext, pList, _pInfoMap, _bAutoIncrementEnabled, rIn )
    , m_nTableCount(0)
    , m_nWidth(0)
    , m_nColumnWidth(87)
    , m_bMetaOptions(false)
    , m_bSDNum(false)
{
    // start out with the extended-compatibility flavour of ISO-8859-1
    const rtl_TextEncoding eInitialEncoding
        = GetExtendedCompatibilityTextEncoding( RTL_TEXTENCODING_ISO_8859_1 );
    SetSrcEncoding( eInitialEncoding );

    // If the file starts with a BOM, switch to UCS2.
    SetSwitchToUCS2( true );
}
|
|
|
|
// Nothing to clean up explicitly; members and base classes take care of themselves.
OHTMLReader::~OHTMLReader() = default;
|
|
|
|
/** Parses the whole input stream from its beginning.
 *
 *  @return the state reported by HTMLParser::CallParser(), or
 *          SvParserState::Error when no table was found during parsing.
 */
SvParserState OHTMLReader::CallParser()
{
    // always start from the first byte with a clean error state
    rInput.Seek(STREAM_SEEK_TO_BEGIN);
    rInput.ResetError();

    const SvParserState eResult = HTMLParser::CallParser();
    SetColumnTypes(m_pColumnList, m_pInfoMap);

    if ( !m_bFoundTable )
        return SvParserState::Error;
    return eResult;
}
|
|
|
|
void OHTMLReader::NextToken( int nToken )
|
|
{
|
|
if(m_bError || !m_nRows) // if there is an error or no more rows to check, return immediately
|
|
return;
|
|
if ( nToken == HTML_META )
|
|
setTextEncoding();
|
|
|
|
if(m_xConnection.is()) // names, which CTOR was called and hence, if a table should be created
|
|
{
|
|
switch(nToken)
|
|
{
|
|
case HTML_TABLE_ON:
|
|
++m_nTableCount;
|
|
{ // can also be TD or TH, if there was no TABLE before
|
|
const HTMLOptions& rHtmlOptions = GetOptions();
|
|
for (const auto & rOption : rHtmlOptions)
|
|
{
|
|
switch( rOption.GetToken() )
|
|
{
|
|
case HTML_O_WIDTH:
|
|
{ // percentage: of document width respectively outer cell
|
|
m_nColumnWidth = GetWidthPixel( rOption );
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
SAL_FALLTHROUGH;
|
|
case HTML_THEAD_ON:
|
|
case HTML_TBODY_ON:
|
|
{
|
|
sal_uInt64 const nTell = rInput.Tell(); // perhaps alters position of the stream
|
|
if ( !m_xTable.is() )
|
|
{// use first line as header
|
|
m_bError = !CreateTable(nToken);
|
|
if ( m_bAppendFirstLine )
|
|
rInput.Seek(nTell);
|
|
}
|
|
}
|
|
break;
|
|
case HTML_TABLE_OFF:
|
|
if(!--m_nTableCount)
|
|
{
|
|
m_xTable = nullptr;
|
|
}
|
|
break;
|
|
case HTML_TABLEROW_ON:
|
|
if ( m_pUpdateHelper.get() )
|
|
{
|
|
try
|
|
{
|
|
m_pUpdateHelper->moveToInsertRow(); // otherwise append new line
|
|
}
|
|
catch(SQLException& e)
|
|
// handling update failure
|
|
{
|
|
showErrorDialog(e);
|
|
}
|
|
}
|
|
else
|
|
m_bError = true;
|
|
break;
|
|
case HTML_TEXTTOKEN:
|
|
case HTML_SINGLECHAR:
|
|
if ( m_bInTbl ) //&& !m_bSDNum ) // important, as otherwise we also get the names of the fonts
|
|
m_sTextToken += aToken;
|
|
break;
|
|
case HTML_PARABREAK_OFF:
|
|
m_sCurrent += m_sTextToken;
|
|
break;
|
|
case HTML_PARABREAK_ON:
|
|
m_sTextToken.clear();
|
|
break;
|
|
case HTML_TABLEDATA_ON:
|
|
fetchOptions();
|
|
break;
|
|
case HTML_TABLEDATA_OFF:
|
|
{
|
|
if ( !m_sCurrent.isEmpty() )
|
|
m_sTextToken = m_sCurrent;
|
|
try
|
|
{
|
|
insertValueIntoColumn();
|
|
}
|
|
catch(SQLException& e)
|
|
// handling update failure
|
|
{
|
|
showErrorDialog(e);
|
|
}
|
|
m_sCurrent.clear();
|
|
m_nColumnPos++;
|
|
eraseTokens();
|
|
m_bSDNum = m_bInTbl = false;
|
|
}
|
|
break;
|
|
case HTML_TABLEROW_OFF:
|
|
if ( !m_pUpdateHelper.get() )
|
|
{
|
|
m_bError = true;
|
|
break;
|
|
}
|
|
try
|
|
{
|
|
m_nRowCount++;
|
|
if (m_bIsAutoIncrement) // if bSetAutoIncrement then I have to set the autoincrement
|
|
m_pUpdateHelper->updateInt(1,m_nRowCount);
|
|
m_pUpdateHelper->insertRow();
|
|
}
|
|
catch(SQLException& e)
|
|
// handling update failure
|
|
{
|
|
showErrorDialog(e);
|
|
}
|
|
m_nColumnPos = 0;
|
|
break;
|
|
}
|
|
}
|
|
else // branch only valid for type checking
|
|
{
|
|
switch(nToken)
|
|
{
|
|
case HTML_THEAD_ON:
|
|
case HTML_TBODY_ON:
|
|
// The head of the column is not included
|
|
if(m_bHead)
|
|
{
|
|
do
|
|
{}
|
|
while(GetNextToken() != HTML_TABLEROW_OFF);
|
|
m_bHead = false;
|
|
}
|
|
break;
|
|
case HTML_TABLEDATA_ON:
|
|
case HTML_TABLEHEADER_ON:
|
|
fetchOptions();
|
|
break;
|
|
case HTML_TEXTTOKEN:
|
|
case HTML_SINGLECHAR:
|
|
if ( m_bInTbl ) // && !m_bSDNum ) // important, as otherwise we also get the names of the fonts
|
|
m_sTextToken += aToken;
|
|
break;
|
|
case HTML_PARABREAK_OFF:
|
|
m_sCurrent += m_sTextToken;
|
|
break;
|
|
case HTML_PARABREAK_ON:
|
|
m_sTextToken.clear();
|
|
break;
|
|
case HTML_TABLEDATA_OFF:
|
|
if ( !m_sCurrent.isEmpty() )
|
|
m_sTextToken = m_sCurrent;
|
|
adjustFormat();
|
|
m_nColumnPos++;
|
|
m_bSDNum = m_bInTbl = false;
|
|
m_sCurrent.clear();
|
|
break;
|
|
case HTML_TABLEROW_OFF:
|
|
if ( !m_sCurrent.isEmpty() )
|
|
m_sTextToken = m_sCurrent;
|
|
adjustFormat();
|
|
m_nColumnPos = 0;
|
|
m_nRows--;
|
|
m_sCurrent.clear();
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
void OHTMLReader::fetchOptions()
|
|
{
|
|
m_bInTbl = true;
|
|
const HTMLOptions& options = GetOptions();
|
|
for (const auto & rOption : options)
|
|
{
|
|
switch( rOption.GetToken() )
|
|
{
|
|
case HTML_O_SDVAL:
|
|
{
|
|
m_sValToken = rOption.GetString();
|
|
m_bSDNum = true;
|
|
}
|
|
break;
|
|
case HTML_O_SDNUM:
|
|
m_sNumToken = rOption.GetString();
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
/** Evaluates the ALIGN and WIDTH options of the current cell tag.
 *
 *  @param eVal  receives the horizontal justification when an ALIGN option is
 *               present (Standard for unrecognised values); left untouched
 *               when the tag carries no ALIGN option.
 *
 *  A WIDTH option is converted with GetWidthPixel() and stored in m_nWidth.
 */
void OHTMLReader::TableDataOn(SvxCellHorJustify& eVal)
{
    const HTMLOptions& rCellOptions = GetOptions();
    for (const auto& rCellOption : rCellOptions)
    {
        const auto nOptionId = rCellOption.GetToken();

        if ( nOptionId == HTML_O_WIDTH )
        {
            m_nWidth = GetWidthPixel( rCellOption );
            continue;
        }
        if ( nOptionId != HTML_O_ALIGN )
            continue;

        // map the textual alignment to the justify enum, defaulting to Standard
        const OUString& rAlignment = rCellOption.GetString();
        SvxCellHorJustify eJustify = SvxCellHorJustify::Standard;
        if ( rAlignment.equalsIgnoreAsciiCase( OOO_STRING_SVTOOLS_HTML_AL_right ) )
            eJustify = SvxCellHorJustify::Right;
        else if ( rAlignment.equalsIgnoreAsciiCase( OOO_STRING_SVTOOLS_HTML_AL_center ) )
            eJustify = SvxCellHorJustify::Center;
        else if ( rAlignment.equalsIgnoreAsciiCase( OOO_STRING_SVTOOLS_HTML_AL_left ) )
            eJustify = SvxCellHorJustify::Left;
        eVal = eJustify;
    }
}
|
|
|
|
/** Evaluates the COLOR, FACE and SIZE options of the current FONT tag.
 *
 *  @param _rFont       font descriptor whose Name and Height are updated from
 *                      the FACE and SIZE options
 *  @param _rTextColor  receives the RGB value of the COLOR option
 *
 *  Options that are not present leave the corresponding output untouched.
 */
void OHTMLReader::TableFontOn(FontDescriptor& _rFont,sal_Int32 &_rTextColor)
{
    const HTMLOptions& rHtmlOptions = GetOptions();
    for (const auto & rOption : rHtmlOptions)
    {
        switch( rOption.GetToken() )
        {
            case HTML_O_COLOR:
                {
                    Color aColor;
                    rOption.GetColor( aColor );
                    _rTextColor = aColor.GetRGBColor();
                }
                break;
            case HTML_O_FACE :
                {
                    const OUString& rFace = rOption.GetString();
                    OUString aFontName;
                    sal_Int32 nPos = 0;
                    while( nPos != -1 )
                    {
                        // list of fonts, VCL: semicolon as separator, HTML: comma
                        const OUString aFName
                            = comphelper::string::strip(rFace.getToken( 0, ',', nPos ), ' ');
                        // Ignore empty entries ("Arial,,Times", trailing comma, ...),
                        // they would only add stray separators to the VCL list.
                        if ( aFName.isEmpty() )
                            continue;
                        if( !aFontName.isEmpty() )
                            aFontName += ";";
                        aFontName += aFName;
                    }
                    if ( !aFontName.isEmpty() )
                        _rFont.Name = aFontName;
                }
                break;
            case HTML_O_SIZE :
                {
                    // NOTE(review): 0 is mapped to 1 while every other value below
                    // DBAUI_HTML_FONTSIZES is raised to DBAUI_HTML_FONTSIZES; this
                    // looks inconsistent (possibly '>' was intended) - behaviour
                    // kept as is, please confirm.
                    sal_Int16 nSize = static_cast<sal_Int16>(rOption.GetNumber());
                    if ( nSize == 0 )
                        nSize = 1;
                    else if ( nSize < DBAUI_HTML_FONTSIZES )
                        nSize = DBAUI_HTML_FONTSIZES;

                    _rFont.Height = nSize;
                }
                break;
        }
    }
}
|
|
|
|
/** Converts a WIDTH option into a width value.
 *
 *  @param rOption  the WIDTH option to evaluate
 *  @return  for values containing '%': that percentage of m_nColumnWidth;
 *           for values containing '*': 0 (relative widths are not supported);
 *           otherwise the plain number of the option.
 */
sal_Int16 OHTMLReader::GetWidthPixel( const HTMLOption& rOption )
{
    const OUString& rWidthText = rOption.GetString();

    if ( rWidthText.indexOf('%') != -1 )
    {
        // percentage
        OSL_ENSURE( m_nColumnWidth, "WIDTH Option: m_nColumnWidth==0 and Width%" );
        return static_cast<sal_Int16>((rOption.GetNumber() * m_nColumnWidth) / 100);
    }

    if ( rWidthText.indexOf('*') != -1 )
    {
        // relative to what?!?
        //TODO: collect ColArray of all relevant values and then MakeCol
        return 0;
    }

    // pixel
    return static_cast<sal_Int16>(rOption.GetNumber());
}
|
|
|
|
bool OHTMLReader::CreateTable(int nToken)
|
|
{
|
|
OUString aTempName(ModuleRes(STR_TBL_TITLE));
|
|
aTempName = aTempName.getToken(0,' ');
|
|
aTempName = ::dbtools::createUniqueName(m_xTables, aTempName);
|
|
|
|
bool bCaption = false;
|
|
bool bTableHeader = false;
|
|
OUString aColumnName;
|
|
SvxCellHorJustify eVal;
|
|
|
|
OUString aTableName;
|
|
FontDescriptor aFont = VCLUnoHelper::CreateFontDescriptor(Application::GetSettings().GetStyleSettings().GetAppFont());
|
|
sal_Int32 nTextColor = 0;
|
|
do
|
|
{
|
|
switch (nToken)
|
|
{
|
|
case HTML_TEXTTOKEN:
|
|
case HTML_SINGLECHAR:
|
|
if(bTableHeader)
|
|
aColumnName += aToken;
|
|
if(bCaption)
|
|
aTableName += aToken;
|
|
break;
|
|
case HTML_PARABREAK_OFF:
|
|
m_sCurrent += aColumnName;
|
|
break;
|
|
case HTML_PARABREAK_ON:
|
|
m_sTextToken.clear();
|
|
break;
|
|
case HTML_TABLEDATA_ON:
|
|
case HTML_TABLEHEADER_ON:
|
|
TableDataOn(eVal);
|
|
bTableHeader = true;
|
|
break;
|
|
case HTML_TABLEDATA_OFF:
|
|
case HTML_TABLEHEADER_OFF:
|
|
{
|
|
aColumnName = comphelper::string::strip(aColumnName, ' ' );
|
|
if (aColumnName.isEmpty() || m_bAppendFirstLine )
|
|
aColumnName = ModuleRes(STR_COLUMN_NAME);
|
|
else if ( !m_sCurrent.isEmpty() )
|
|
aColumnName = m_sCurrent;
|
|
|
|
aColumnName = comphelper::string::strip(aColumnName, ' ');
|
|
CreateDefaultColumn(aColumnName);
|
|
aColumnName.clear();
|
|
m_sCurrent.clear();
|
|
|
|
eVal = SvxCellHorJustify::Standard;
|
|
bTableHeader = false;
|
|
}
|
|
break;
|
|
|
|
case HTML_TITLE_ON:
|
|
case HTML_CAPTION_ON:
|
|
bCaption = true;
|
|
break;
|
|
case HTML_TITLE_OFF:
|
|
case HTML_CAPTION_OFF:
|
|
aTableName = comphelper::string::strip(aTableName, ' ');
|
|
if(aTableName.isEmpty())
|
|
aTableName = ::dbtools::createUniqueName(m_xTables, aTableName);
|
|
else
|
|
aTableName = aTempName;
|
|
bCaption = false;
|
|
break;
|
|
case HTML_FONT_ON:
|
|
TableFontOn(aFont,nTextColor);
|
|
break;
|
|
case HTML_BOLD_ON:
|
|
aFont.Weight = css::awt::FontWeight::BOLD;
|
|
break;
|
|
case HTML_ITALIC_ON:
|
|
aFont.Slant = css::awt::FontSlant_ITALIC;
|
|
break;
|
|
case HTML_UNDERLINE_ON:
|
|
aFont.Underline = css::awt::FontUnderline::SINGLE;
|
|
break;
|
|
case HTML_STRIKE_ON:
|
|
aFont.Strikeout = css::awt::FontStrikeout::SINGLE;
|
|
break;
|
|
}
|
|
nToken = GetNextToken();
|
|
}
|
|
while (nToken != HTML_TABLEROW_OFF);
|
|
|
|
if ( !m_sCurrent.isEmpty() )
|
|
aColumnName = m_sCurrent;
|
|
aColumnName = comphelper::string::strip(aColumnName, ' ');
|
|
if(!aColumnName.isEmpty())
|
|
CreateDefaultColumn(aColumnName);
|
|
|
|
if ( m_vDestVector.empty() )
|
|
return false;
|
|
|
|
if(aTableName.isEmpty())
|
|
aTableName = aTempName;
|
|
|
|
m_bInTbl = false;
|
|
m_bFoundTable = true;
|
|
|
|
if ( isCheckEnabled() )
|
|
return true;
|
|
|
|
return !executeWizard(aTableName,makeAny(nTextColor),aFont) && m_xTable.is();
|
|
}
|
|
|
|
void OHTMLReader::setTextEncoding()
|
|
{
|
|
m_bMetaOptions = true;
|
|
ParseMetaOptions(nullptr, nullptr);
|
|
}
|
|
|
|
void OHTMLReader::release()
|
|
{
|
|
ReleaseRef();
|
|
}
|
|
|
|
/** @return the factory function for the type selection page of this reader,
 *          i.e. OWizHTMLExtend::Create.
 */
TypeSelectionPageFactory OHTMLReader::getTypeSelectionPageFactory()
{
    const TypeSelectionPageFactory pCreatePage = &OWizHTMLExtend::Create;
    return pCreatePage;
}
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|