office-gobmx/linguistic/source/hyphdsp.cxx
Rüdiger Timm fae29986d3 INTEGRATION: CWS changefileheader (1.23.2); FILE MERGED
2008/04/01 15:21:26 thb 1.23.2.3: #i85898# Stripping all external header guards
2008/04/01 12:31:46 thb 1.23.2.2: #i85898# Stripping all external header guards
2008/03/31 16:25:38 rt 1.23.2.1: #i87441# Change license header to LPGL v3.
2008-04-10 11:23:13 +00:00

741 lines
25 KiB
C++

/*************************************************************************
*
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* Copyright 2008 by Sun Microsystems, Inc.
*
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: hyphdsp.cxx,v $
* $Revision: 1.24 $
*
* This file is part of OpenOffice.org.
*
* OpenOffice.org is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License version 3
* only, as published by the Free Software Foundation.
*
* OpenOffice.org is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License version 3 for more details
* (a copy is included in the LICENSE file that accompanied this code).
*
* You should have received a copy of the GNU Lesser General Public License
* version 3 along with OpenOffice.org. If not, see
* <http://www.openoffice.org/license.html>
* for a copy of the LGPLv3 License.
*
************************************************************************/
// MARKER(update_precomp.py): autogen include statement, do not remove
#include "precompiled_linguistic.hxx"
#include <cppuhelper/factory.hxx> // helper for factories
#include <com/sun/star/registry/XRegistryKey.hpp>
#include <com/sun/star/linguistic2/XSearchableDictionaryList.hpp>
#include <com/sun/star/linguistic2/XHyphenatedWord.hpp>
#include <rtl/ustrbuf.hxx>
#include <i18npool/lang.h>
#include <unotools/localedatawrapper.hxx>
#include <tools/debug.hxx>
#include <svtools/lngmisc.hxx>
#include <unotools/processfactory.hxx>
#include <osl/mutex.hxx>
#include "hyphdsp.hxx"
#include "hyphdta.hxx"
#include "lngprops.hxx"
#include "lngsvcmgr.hxx"
using namespace utl;
using namespace osl;
using namespace rtl;
using namespace com::sun::star;
using namespace com::sun::star::beans;
using namespace com::sun::star::lang;
using namespace com::sun::star::uno;
using namespace com::sun::star::linguistic2;
using namespace linguistic;
///////////////////////////////////////////////////////////////////////////
// Destructor: no explicit clean-up is performed here; the members
// release whatever they hold through their own destructors.
LangSvcEntry_Hyph::~LangSvcEntry_Hyph()
{
    // intentionally empty
}
// Creates a list entry that remembers the implementation name of the
// hyphenator service to be used; all other members keep their default
// state.
LangSvcEntry_Hyph::LangSvcEntry_Hyph( const ::rtl::OUString &rSvcImplName )
    : aSvcImplName( rSvcImplName )
{
    // nothing else to set up
}
///////////////////////////////////////////////////////////////////////////
// Creates a dispatcher bound to the given service manager. Only the
// reference to the manager is stored; the service list starts out in
// its default-constructed state.
HyphenatorDispatcher::HyphenatorDispatcher( LngSvcMgr &rLngSvcMgr )
    : rMgr( rLngSvcMgr )
{
    // nothing else to set up
}
// Destructor: frees every entry still held in the service list.
HyphenatorDispatcher::~HyphenatorDispatcher()
{
    this->ClearSvcList();
}
void HyphenatorDispatcher::ClearSvcList()
{
// release memory for each table entry
LangSvcEntry_Hyph *pItem = aSvcList.First();
while (pItem)
{
LangSvcEntry_Hyph *pTmp = pItem;
pItem = aSvcList.Next();
delete pTmp;
}
}
// Builds a hyphenated-word object from a dictionary entry.
//
// The dictionary word of xEntry carries its hyphenation information as
// embedded '=' characters. This function scans that word, picks the last
// '=' for which no more than nMaxLeading ordinary characters precede it,
// and - if such a position with an index greater than 0 exists - returns
// a HyphenatedWord built from rOrigWord, nLang and that position.
//
// rOrigWord    the word as originally passed in by the caller; it (and
//              not the dictionary word) is what ends up in the result
//              (see #i22591#)
// xEntry       dictionary entry to evaluate; may be empty
// nLang        language passed through to the result object
// nMaxLeading  upper bound for the number of characters in front of the
//              hyphenation position
//
// Returns an empty reference if xEntry is empty, if the dictionary word
// is empty or ends with '=', or if no suitable position was found.
Reference<XHyphenatedWord> HyphenatorDispatcher::buildHyphWord(
        const OUString rOrigWord,
        const Reference<XDictionaryEntry> &xEntry,
        INT16 nLang, INT16 nMaxLeading )
{
    MutexGuard aGuard( GetLinguMutex() );

    Reference< XHyphenatedWord > xResult;
    if (!xEntry.is())
        return xResult;

    OUString aDicWord( xEntry->getDictionaryWord() );
    const INT32 nDicWordLen = aDicWord.getLength();

    // a trailing '=' means "hyphenation should not be possible"
    if (nDicWordLen <= 0 || aDicWord[ nDicWordLen - 1 ] == '=')
        return xResult;

    INT16           nBreakPos    = -1;      // best position found so far
    OUStringBuffer  aPlain( nDicWordLen );  // dictionary word without '='
    BOOL            bPrevWasMark = FALSE;   // previous char was a '='
    INT32           nLastCharIdx = -1;      // index of last char in aPlain
    INT32           nCharsSoFar  = 0;       // number of chars in aPlain

    for (INT32 nIdx = 0; nIdx < nDicWordLen; ++nIdx)
    {
        const sal_Unicode cCur = aDicWord[ nIdx ];
        if (cCur == '=')
        {
            // only the first '=' of a run counts, and only if at least
            // one ordinary character precedes it
            if (!bPrevWasMark && nLastCharIdx >= 0
                && nCharsSoFar <= nMaxLeading)
            {
                nBreakPos = (INT16) nLastCharIdx;
            }
            bPrevWasMark = TRUE;    //! multiple '=' should count as one only
        }
        else
        {
            aPlain.append( cCur );
            ++nCharsSoFar;
            ++nLastCharIdx;
            bPrevWasMark = FALSE;
        }
    }

    if (nBreakPos <= 0)
        return xResult;

    OUString aWord( aPlain.makeStringAndClear() );

#if OSL_DEBUG_LEVEL > 1
    {
        if (aWord != rOrigWord)
        {
            // both words should only differ by a having a trailing '.'
            // character or not...
            OUString aShorter, aLonger;
            if (aWord.getLength() > rOrigWord.getLength())
            {
                aShorter = rOrigWord;
                aLonger  = aWord;
            }
            else
            {
                aShorter = aWord;
                aLonger  = rOrigWord;
            }
            xub_StrLen nS = sal::static_int_cast< xub_StrLen >( aShorter.getLength() );
            xub_StrLen nL = sal::static_int_cast< xub_StrLen >( aLonger.getLength() );
            if (nS > 0 && nL > 0)
            {
                DBG_ASSERT( (nS + 1 == nL) && aLonger[nL-1] == (sal_Unicode) '.',
                    "HyphenatorDispatcher::buildHyphWord: unexpected difference between words!" );
            }
        }
    }
#endif

    //! take care of #i22591#: the result is built from the original
    //! word, not from the text found in the dictionary
    aWord = rOrigWord;
    DBG_ASSERT( aWord == rOrigWord, "failed to " );

    xResult = new HyphenatedWord( aWord, nLang, nBreakPos,
                                  aWord, nBreakPos );
    return xResult;
}
// Builds a possible-hyphens object from a dictionary entry.
//
// The dictionary word of xEntry marks hyphenation positions with '='
// characters. For every run of '=' that follows at least one ordinary
// character, the index (within the word stripped of '=') of the character
// right before the run is recorded. If at least one position was
// recorded, a PossibleHyphens object is created from the stripped word,
// nLanguage, the unmodified dictionary word and the recorded positions.
//
// Returns an empty reference if xEntry is empty, if the dictionary word
// is empty or ends with '=', or if no position was recorded.
Reference< XPossibleHyphens > HyphenatorDispatcher::buildPossHyphens(
        const Reference< XDictionaryEntry > &xEntry, INT16 nLanguage )
{
    MutexGuard aGuard( GetLinguMutex() );

    Reference<XPossibleHyphens> xResult;
    if (!xEntry.is())
        return xResult;

    // text with hyphenation info
    OUString aDicWord( xEntry->getDictionaryWord() );
    const INT32 nDicWordLen = aDicWord.getLength();

    // a trailing '=' means "hyphenation should not be possible"
    if (nDicWordLen <= 0 || aDicWord[ nDicWordLen - 1 ] == '=')
        return xResult;

    // sequence to hold hyphenation positions; sized for the worst case
    // and shrunk to the real count further below
    Sequence< INT16 > aPositions( nDicWordLen );
    INT16 *pPositions = aPositions.getArray();
    INT32 nFound = 0;

    OUStringBuffer  aPlain( nDicWordLen );  // dictionary word without '='
    BOOL            bPrevWasMark = FALSE;   // previous char was a '='
    INT32           nLastCharIdx = -1;      // index of last char in aPlain

    for (INT32 nIdx = 0; nIdx < nDicWordLen; ++nIdx)
    {
        const sal_Unicode cCur = aDicWord[ nIdx ];
        if (cCur == '=')
        {
            if (!bPrevWasMark && nLastCharIdx >= 0)
            {
                pPositions[ nFound ] = (INT16) nLastCharIdx;
                ++nFound;
            }
            bPrevWasMark = TRUE;    //! multiple '=' should count as one only
        }
        else
        {
            aPlain.append( cCur );
            bPrevWasMark = FALSE;
            ++nLastCharIdx;
        }
    }

    // ignore (multiple) trailing '='
    if (bPrevWasMark && nLastCharIdx >= 0)
        --nFound;

    DBG_ASSERT( nFound >= 0, "lng : invalid hyphenation count");

    if (nFound > 0)
    {
        aPositions.realloc( nFound );
        xResult = new PossibleHyphens( aPlain.makeStringAndClear(), nLanguage,
                                       aDicWord, aPositions );
    }

    return xResult;
}
// Returns one Locale per entry of the service list. Each locale is
// created from the key under which the entry is stored in the list.
Sequence< Locale > SAL_CALL HyphenatorDispatcher::getLocales()
        throw(RuntimeException)
{
    MutexGuard aGuard( GetLinguMutex() );

    const ULONG nEntries = aSvcList.Count();
    Sequence< Locale > aResult( nEntries );
    Locale *pLocales = aResult.getArray();

    // walk the list and the result array in lock-step
    LangSvcEntry_Hyph *pCurrent = aSvcList.First();
    for (ULONG nIdx = 0; nIdx < nEntries; ++nIdx, pCurrent = aSvcList.Next())
    {
        DBG_ASSERT( pCurrent, "lng : pEntry is NULL pointer" );
        const LanguageType nLang = (LanguageType) aSvcList.GetKey( pCurrent );
        pLocales[ nIdx ] = CreateLocale( nLang );
    }

    return aResult;
}
// Tells whether the service list holds an entry for the language that
// corresponds to rLocale.
BOOL SAL_CALL HyphenatorDispatcher::hasLocale(const Locale& rLocale)
        throw(RuntimeException)
{
    MutexGuard aGuard( GetLinguMutex() );

    if (aSvcList.Get( LocaleToLanguage( rLocale ) ) != 0)
        return TRUE;
    return FALSE;
}
// Hyphenates rWord for the language of rLocale.
//
// Processing order:
//  1. Trivial cases (LANGUAGE_NONE, empty word, nMaxLeading equal to 0 or
//     to the word length) yield an empty reference.
//  2. If there is no service-list entry for the language, or nMaxLeading
//     lies outside [0, word length], IllegalArgumentException is thrown
//     when LINGU_EXCEPTIONS is defined; otherwise an empty reference is
//     returned.
//  3. A working copy of the word is normalised (the locale's closing
//     quotation mark is replaced by an ASCII apostrophe, hyphens are
//     removed and - depending on the properties - control characters are
//     removed as well).
//  4. The dictionary list is queried first (if available and enabled via
//     the properties); a hit is turned into the result by buildHyphWord.
//  5. Otherwise the hyphenator service of the entry is used. It gets
//     instantiated on first use. If the freshly created service turns
//     out not to support the locale, the entry is removed from the
//     service list and freed.
//  6. The result is finally adapted so that it refers to the original
//     rWord again.
//
// rWord        word to hyphenate
// rLocale      language of the word
// nMaxLeading  position limit handed on (after being mapped through
//              GetPosInWordToCheck) to the dictionary evaluation or to
//              the service
// rProperties  per-call properties that may override the property set
Reference< XHyphenatedWord > SAL_CALL
    HyphenatorDispatcher::hyphenate(
            const OUString& rWord, const Locale& rLocale, sal_Int16 nMaxLeading,
            const PropertyValues& rProperties )
        throw(IllegalArgumentException, RuntimeException)
{
    MutexGuard aGuard( GetLinguMutex() );

    Reference< XHyphenatedWord > xRes;

    INT32 nWordLen = rWord.getLength();
    INT16 nLanguage = LocaleToLanguage( rLocale );
    if (nLanguage == LANGUAGE_NONE || !nWordLen ||
        nMaxLeading == 0 || nMaxLeading == nWordLen)
        return xRes;

    // search for entry with that language
    LangSvcEntry_Hyph *pEntry = aSvcList.Get( nLanguage );

    BOOL bWordModified = FALSE;
    if (!pEntry || (nMaxLeading < 0 || nMaxLeading > nWordLen))
    {
#ifdef LINGU_EXCEPTIONS
        throw IllegalArgumentException();
#else
        return NULL;
#endif
    }
    else
    {
        OUString aChkWord( rWord );

        // replace typographical apostrophe by ASCII apostrophe
        String aSingleQuote( GetLocaleDataWrapper( nLanguage ).getQuotationMarkEnd() );
        DBG_ASSERT( 1 == aSingleQuote.Len(), "unexpectend length of quotation mark" );
        if (aSingleQuote.Len())
            aChkWord = aChkWord.replace( aSingleQuote.GetChar(0), '\'' );

        bWordModified |= RemoveHyphens( aChkWord );
        if (IsIgnoreControlChars( rProperties, GetPropSet() ))
            bWordModified |= RemoveControlChars( aChkWord );
        INT16 nChkMaxLeading = (INT16) GetPosInWordToCheck( rWord, nMaxLeading );

        // check for results from (positive) dictionaries which have precedence!
        Reference< XDictionaryEntry > xEntry;
        if (GetDicList().is() && IsUseDicList( rProperties, GetPropSet() ))
        {
            xEntry = GetDicList()->queryDictionaryEntry( aChkWord, rLocale,
                        TRUE, FALSE );
        }

        if (xEntry.is())
        {
            //! because queryDictionaryEntry (in the end DictionaryNeo::getEntry)
            //! does not distinguish between "XYZ" and "XYZ." in order to avoid
            //! to require them as different entry we have to supply the
            //! original word here as well so it can be used in the result
            //! otherwise a strange effect may occur (see #i22591#)
            xRes = buildHyphWord( rWord, xEntry, nLanguage, nChkMaxLeading );
        }
        else
        {
            // there is at most one service per entry
            INT32 nLen = pEntry->aSvcImplName.getLength() ? 1 : 0;
            DBG_ASSERT( pEntry->aFlags.nLastTriedSvcIndex < nLen,
                    "lng : index out of range");

            INT32 i = 0;
            Reference< XHyphenator > &rHyph = pEntry->aSvcRef;

            // try already instantiated service
            if (i <= pEntry->aFlags.nLastTriedSvcIndex)
            {
                if (rHyph.is() && rHyph->hasLocale( rLocale ))
                    xRes = rHyph->hyphenate( aChkWord, rLocale, nChkMaxLeading,
                                rProperties );
                ++i;
            }
            else if (pEntry->aFlags.nLastTriedSvcIndex < nLen - 1)
            // instantiate services and try it
            {
                Reference< XMultiServiceFactory > xMgr( getProcessServiceFactory() );
                if (xMgr.is())
                {
                    // build service initialization argument
                    Sequence< Any > aArgs(2);
                    aArgs.getArray()[0] <<= GetPropSet();
                    //! The dispatcher searches the dictionary-list
                    //! thus the service does not need to know about it
                    //aArgs.getArray()[1] <<= GetDicList();

                    // create specific service via its implementation name
                    Reference< XHyphenator > xHyph;
                    try
                    {
                        xHyph = Reference< XHyphenator >(
                                xMgr->createInstanceWithArguments(
                                    pEntry->aSvcImplName, aArgs ), UNO_QUERY );
                    }
                    catch (uno::Exception &)
                    {
                        DBG_ERROR( "createInstanceWithArguments failed" );
                    }
                    rHyph = xHyph;

                    Reference< XLinguServiceEventBroadcaster >
                            xBroadcaster( xHyph, UNO_QUERY );
                    if (xBroadcaster.is())
                        rMgr.AddLngSvcEvtBroadcaster( xBroadcaster );

                    if (rHyph.is() && rHyph->hasLocale( rLocale ))
                        xRes = rHyph->hyphenate( aChkWord, rLocale, nChkMaxLeading,
                                    rProperties );

                    pEntry->aFlags.nLastTriedSvcIndex = (INT16) i;
                    ++i;

                    // if language is not supported by the services
                    // remove it from the list.
                    if (rHyph.is() && !rHyph->hasLocale( rLocale ))
                    {
                        aSvcList.Remove( nLanguage );
                        // The list only stores raw pointers to entries
                        // (ClearSvcList() deletes them one by one), so an
                        // entry that is taken out of the list has to be
                        // freed here or it would leak.
                        //! rHyph refers to a member of *pEntry and must
                        //! not be used after this point.
                        delete pEntry;
                        pEntry = NULL;
                    }
                }
            }
        }   // if (xEntry.is())
    }

    if (bWordModified && xRes.is())
        xRes = RebuildHyphensAndControlChars( rWord, xRes );

    // make sure the result refers to the word the caller passed in
    if (xRes.is() && xRes->getWord() != rWord)
    {
        xRes = new HyphenatedWord( rWord, nLanguage, xRes->getHyphenationPos(),
                                   xRes->getHyphenatedWord(),
                                   xRes->getHyphenPos() );
    }

    return xRes;
}
// Queries an alternative spelling of rWord for a hyphenation at nIndex.
//
// Processing order:
//  1. LANGUAGE_NONE or an empty word yield an empty reference.
//  2. If there is no service-list entry for the language, or nIndex lies
//     outside [0, word length - 2], IllegalArgumentException is thrown
//     when LINGU_EXCEPTIONS is defined; otherwise an empty reference is
//     returned.
//  3. A working copy of the word is normalised (the locale's closing
//     quotation mark is replaced by an ASCII apostrophe, hyphens are
//     removed and - depending on the properties - control characters are
//     removed as well).
//  4. If the dictionary list (when available and enabled) knows the
//     word, no result is produced since dictionaries do not support
//     alternative spellings yet.
//  5. Otherwise the hyphenator service of the entry is asked. It gets
//     instantiated on first use. If the freshly created service turns
//     out not to support the locale, the entry is removed from the
//     service list and freed.
//  6. The result is finally adapted so that it refers to the original
//     rWord again.
//
// rWord        word to examine
// rLocale      language of the word
// nIndex       position handed on (after being mapped through
//              GetPosInWordToCheck) to the service
// rProperties  per-call properties that may override the property set
Reference< XHyphenatedWord > SAL_CALL
    HyphenatorDispatcher::queryAlternativeSpelling(
            const OUString& rWord, const Locale& rLocale, sal_Int16 nIndex,
            const PropertyValues& rProperties )
        throw(IllegalArgumentException, RuntimeException)
{
    MutexGuard aGuard( GetLinguMutex() );

    Reference< XHyphenatedWord > xRes;

    INT32 nWordLen = rWord.getLength();
    INT16 nLanguage = LocaleToLanguage( rLocale );
    if (nLanguage == LANGUAGE_NONE || !nWordLen)
        return xRes;

    // search for entry with that language
    LangSvcEntry_Hyph *pEntry = aSvcList.Get( nLanguage );

    BOOL bWordModified = FALSE;
    if (!pEntry || !(0 <= nIndex && nIndex <= nWordLen - 2))
    {
#ifdef LINGU_EXCEPTIONS
        throw IllegalArgumentException();
#else
        return NULL;
#endif
    }
    else
    {
        OUString aChkWord( rWord );

        // replace typographical apostrophe by ASCII apostrophe
        String aSingleQuote( GetLocaleDataWrapper( nLanguage ).getQuotationMarkEnd() );
        DBG_ASSERT( 1 == aSingleQuote.Len(), "unexpectend length of quotation mark" );
        if (aSingleQuote.Len())
            aChkWord = aChkWord.replace( aSingleQuote.GetChar(0), '\'' );

        bWordModified |= RemoveHyphens( aChkWord );
        if (IsIgnoreControlChars( rProperties, GetPropSet() ))
            bWordModified |= RemoveControlChars( aChkWord );
        INT16 nChkIndex = (INT16) GetPosInWordToCheck( rWord, nIndex );

        // check for results from (positive) dictionaries which have precedence!
        Reference< XDictionaryEntry > xEntry;
        if (GetDicList().is() && IsUseDicList( rProperties, GetPropSet() ))
        {
            xEntry = GetDicList()->queryDictionaryEntry( aChkWord, rLocale,
                        TRUE, FALSE );
        }

        if (xEntry.is())
        {
            //! alternative spellings not yet supported by dictionaries
        }
        else
        {
            // there is at most one service per entry
            INT32 nLen = pEntry->aSvcImplName.getLength() ? 1 : 0;
            DBG_ASSERT( pEntry->aFlags.nLastTriedSvcIndex < nLen,
                    "lng : index out of range");

            INT32 i = 0;
            Reference< XHyphenator > &rHyph = pEntry->aSvcRef;

            // try already instantiated service
            if (i <= pEntry->aFlags.nLastTriedSvcIndex)
            {
                if (rHyph.is() && rHyph->hasLocale( rLocale ))
                    xRes = rHyph->queryAlternativeSpelling( aChkWord, rLocale,
                                nChkIndex, rProperties );
                ++i;
            }
            else if (pEntry->aFlags.nLastTriedSvcIndex < nLen - 1)
            // instantiate services and try it
            {
                Reference< XMultiServiceFactory > xMgr( getProcessServiceFactory() );
                if (xMgr.is())
                {
                    // build service initialization argument
                    Sequence< Any > aArgs(2);
                    aArgs.getArray()[0] <<= GetPropSet();
                    //! The dispatcher searches the dictionary-list
                    //! thus the service does not need to know about it
                    //aArgs.getArray()[1] <<= GetDicList();

                    // create specific service via its implementation name
                    Reference< XHyphenator > xHyph;
                    try
                    {
                        xHyph = Reference< XHyphenator >(
                                xMgr->createInstanceWithArguments(
                                    pEntry->aSvcImplName, aArgs ), UNO_QUERY );
                    }
                    catch (uno::Exception &)
                    {
                        DBG_ERROR( "createInstanceWithArguments failed" );
                    }
                    rHyph = xHyph;

                    Reference< XLinguServiceEventBroadcaster >
                            xBroadcaster( xHyph, UNO_QUERY );
                    if (xBroadcaster.is())
                        rMgr.AddLngSvcEvtBroadcaster( xBroadcaster );

                    if (rHyph.is() && rHyph->hasLocale( rLocale ))
                        xRes = rHyph->queryAlternativeSpelling( aChkWord, rLocale,
                                    nChkIndex, rProperties );

                    pEntry->aFlags.nLastTriedSvcIndex = (INT16) i;
                    ++i;

                    // if language is not supported by the services
                    // remove it from the list.
                    if (rHyph.is() && !rHyph->hasLocale( rLocale ))
                    {
                        aSvcList.Remove( nLanguage );
                        // The list only stores raw pointers to entries
                        // (ClearSvcList() deletes them one by one), so an
                        // entry that is taken out of the list has to be
                        // freed here or it would leak.
                        //! rHyph refers to a member of *pEntry and must
                        //! not be used after this point.
                        delete pEntry;
                        pEntry = NULL;
                    }
                }
            }
        }   // if (xEntry.is())
    }

    if (bWordModified && xRes.is())
        xRes = RebuildHyphensAndControlChars( rWord, xRes );

    // make sure the result refers to the word the caller passed in
    if (xRes.is() && xRes->getWord() != rWord)
    {
        xRes = new HyphenatedWord( rWord, nLanguage, xRes->getHyphenationPos(),
                                   xRes->getHyphenatedWord(),
                                   xRes->getHyphenPos() );
    }

    return xRes;
}
// Determines all possible hyphenation positions of rWord.
//
// Processing order:
//  1. LANGUAGE_NONE or an empty word yield an empty reference.
//  2. If there is no service-list entry for the language,
//     IllegalArgumentException is thrown when LINGU_EXCEPTIONS is
//     defined; otherwise an empty reference is returned.
//  3. A working copy of the word is normalised (the locale's closing
//     quotation mark is replaced by an ASCII apostrophe, hyphens are
//     removed and - depending on the properties - control characters are
//     removed as well).
//  4. The dictionary list is queried first (if available and enabled via
//     the properties); a hit is turned into the result by
//     buildPossHyphens.
//  5. Otherwise the hyphenator service of the entry is used. It gets
//     instantiated on first use. If the freshly created service turns
//     out not to support the locale, the entry is removed from the
//     service list and freed.
//  6. If the word of the result differs from rWord, the result is
//     re-wrapped so that it reports rWord.
//
// rWord        word to examine
// rLocale      language of the word
// rProperties  per-call properties that may override the property set
Reference< XPossibleHyphens > SAL_CALL
    HyphenatorDispatcher::createPossibleHyphens(
            const OUString& rWord, const Locale& rLocale,
            const PropertyValues& rProperties )
        throw(IllegalArgumentException, RuntimeException)
{
    MutexGuard aGuard( GetLinguMutex() );

    Reference< XPossibleHyphens > xRes;

    INT16 nLanguage = LocaleToLanguage( rLocale );
    if (nLanguage == LANGUAGE_NONE || !rWord.getLength())
        return xRes;

    // search for entry with that language
    LangSvcEntry_Hyph *pEntry = aSvcList.Get( nLanguage );

    if (!pEntry)
    {
#ifdef LINGU_EXCEPTIONS
        throw IllegalArgumentException();
#endif
        // without LINGU_EXCEPTIONS the (empty) xRes is returned below
    }
    else
    {
        OUString aChkWord( rWord );

        // replace typographical apostrophe by ASCII apostrophe
        String aSingleQuote( GetLocaleDataWrapper( nLanguage ).getQuotationMarkEnd() );
        DBG_ASSERT( 1 == aSingleQuote.Len(), "unexpectend length of quotation mark" );
        if (aSingleQuote.Len())
            aChkWord = aChkWord.replace( aSingleQuote.GetChar(0), '\'' );

        RemoveHyphens( aChkWord );
        if (IsIgnoreControlChars( rProperties, GetPropSet() ))
            RemoveControlChars( aChkWord );

        // check for results from (positive) dictionaries which have precedence!
        Reference< XDictionaryEntry > xEntry;
        if (GetDicList().is() && IsUseDicList( rProperties, GetPropSet() ))
        {
            xEntry = GetDicList()->queryDictionaryEntry( aChkWord, rLocale,
                        TRUE, FALSE );
        }

        if (xEntry.is())
        {
            xRes = buildPossHyphens( xEntry, nLanguage );
        }
        else
        {
            // there is at most one service per entry
            INT32 nLen = pEntry->aSvcImplName.getLength() ? 1 : 0;
            DBG_ASSERT( pEntry->aFlags.nLastTriedSvcIndex < nLen,
                    "lng : index out of range");

            INT32 i = 0;
            Reference< XHyphenator > &rHyph = pEntry->aSvcRef;

            // try already instantiated service
            if (i <= pEntry->aFlags.nLastTriedSvcIndex)
            {
                if (rHyph.is() && rHyph->hasLocale( rLocale ))
                    xRes = rHyph->createPossibleHyphens( aChkWord, rLocale,
                                rProperties );
                ++i;
            }
            else if (pEntry->aFlags.nLastTriedSvcIndex < nLen - 1)
            // instantiate services and try it
            {
                Reference< XMultiServiceFactory > xMgr( getProcessServiceFactory() );
                if (xMgr.is())
                {
                    // build service initialization argument
                    Sequence< Any > aArgs(2);
                    aArgs.getArray()[0] <<= GetPropSet();
                    //! The dispatcher searches the dictionary-list
                    //! thus the service does not need to know about it
                    //aArgs.getArray()[1] <<= GetDicList();

                    // create specific service via its implementation name
                    Reference< XHyphenator > xHyph;
                    try
                    {
                        xHyph = Reference< XHyphenator >(
                                xMgr->createInstanceWithArguments(
                                    pEntry->aSvcImplName, aArgs ), UNO_QUERY );
                    }
                    catch (uno::Exception &)
                    {
                        // message names the call that was actually made
                        DBG_ERROR( "createInstanceWithArguments failed" );
                    }
                    rHyph = xHyph;

                    Reference< XLinguServiceEventBroadcaster >
                            xBroadcaster( xHyph, UNO_QUERY );
                    if (xBroadcaster.is())
                        rMgr.AddLngSvcEvtBroadcaster( xBroadcaster );

                    if (rHyph.is() && rHyph->hasLocale( rLocale ))
                        xRes = rHyph->createPossibleHyphens( aChkWord, rLocale,
                                    rProperties );

                    pEntry->aFlags.nLastTriedSvcIndex = (INT16) i;
                    ++i;

                    // if language is not supported by the services
                    // remove it from the list.
                    if (rHyph.is() && !rHyph->hasLocale( rLocale ))
                    {
                        aSvcList.Remove( nLanguage );
                        // The list only stores raw pointers to entries
                        // (ClearSvcList() deletes them one by one), so an
                        // entry that is taken out of the list has to be
                        // freed here or it would leak.
                        //! rHyph refers to a member of *pEntry and must
                        //! not be used after this point.
                        delete pEntry;
                        pEntry = NULL;
                    }
                }
            }
        }   // if (xEntry.is())
    }

    // make sure the result refers to the word the caller passed in
    if (xRes.is() && xRes->getWord() != rWord)
    {
        xRes = new PossibleHyphens( rWord, nLanguage,
                                    xRes->getPossibleHyphens(),
                                    xRes->getHyphenationPositions() );
    }

    return xRes;
}
void HyphenatorDispatcher::SetServiceList( const Locale &rLocale,
const Sequence< OUString > &rSvcImplNames )
{
MutexGuard aGuard( GetLinguMutex() );
INT16 nLanguage = LocaleToLanguage( rLocale );
INT32 nLen = rSvcImplNames.getLength();
if (0 == nLen)
// remove entry
aSvcList.Remove( nLanguage );
else
{
// modify/add entry
LangSvcEntry_Hyph *pEntry = aSvcList.Get( nLanguage );
// only one hypenator can be in use for a language...
const OUString &rSvcImplName = rSvcImplNames.getConstArray()[0];
if (pEntry)
{
pEntry->aSvcImplName = rSvcImplName;
pEntry->aSvcRef = NULL;
pEntry->aFlags = SvcFlags();
}
else
{
pEntry = new LangSvcEntry_Hyph( rSvcImplName );
aSvcList.Insert( nLanguage, pEntry );
DBG_ASSERT( aSvcList.Get( nLanguage ), "lng : Insert failed" );
}
}
}
// Returns the implementation name of the service registered for the
// language of rLocale as a one-element sequence, or an empty sequence if
// there is no entry for that language.
Sequence< OUString >
    HyphenatorDispatcher::GetServiceList( const Locale &rLocale ) const
{
    MutexGuard aGuard( GetLinguMutex() );

    Sequence< OUString > aNames;    // stays empty if nothing is found

    // search for entry with that language and use data from that
    INT16 nLanguage = LocaleToLanguage( rLocale );
    // the list is accessed through a non-const 'this', hence the cast
    HyphenatorDispatcher *pSelf = const_cast< HyphenatorDispatcher * >( this );
    const LangSvcEntry_Hyph *pFound = pSelf->aSvcList.Get( nLanguage );

    if (pFound)
    {
        aNames.realloc( 1 );
        aNames.getArray()[0] = pFound->aSvcImplName;
    }

    return aNames;
}
// Identifies this dispatcher: always reports DSP_HYPH.
HyphenatorDispatcher::DspType HyphenatorDispatcher::GetDspType() const
{
    const DspType eType = DSP_HYPH;
    return eType;
}
///////////////////////////////////////////////////////////////////////////