office-gobmx/linguistic/source/iprcache.cxx
László Németh 57d79744c7 tdf#136306 offapi linguistic: add options to disable rule-based compounding
Add two new spell checking options to disable rule-based closed
and hyphenated compound word recognition with Hunspell dictionaries:

com::sun::linguistic2::XLinguProperties::IsSpellClosedCompound
com::sun::linguistic2::XLinguProperties::IsSpellHyphenatedCompound

For professional proofreaders, it can be more important to avoid
the mistakes of the rule-based compound word recognition than
to speed up proofreading. Disabling the following two new options
will report all rule-based closed compound words (default in
Dutch, German, Hungarian etc. dictionaries) and rule-based
hyphenated compound words (all languages with BREAK usage in
their Hunspell dictionaries):

- "Accept possible closed compound words"

- "Accept possible hyphenated compound words"

For example, after disabling the second one, the dictionary word
"scot-free" will still be a correct word in English spell checking, but
the previously accepted compound "arbitrary-word-with-hyphen" will not.

Note: the second option works with the update to Hunspell 1.7.2.

Change-Id: Id879610927d5e8269fda5ad207c1c2fe1f57a0b6
Reviewed-on: https://gerrit.libreoffice.org/c/core/+/144875
Tested-by: Jenkins
Reviewed-by: László Németh <nemeth@numbertext.org>
2022-12-30 11:03:39 +00:00

229 lines
6.4 KiB
C++

/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
* This file is part of the LibreOffice project.
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* This file incorporates work covered by the following license notice:
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed
* with this work for additional information regarding copyright
* ownership. The ASF licenses this file to you under the Apache
* License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
*/
#include <iprcache.hxx>
#include <linguistic/misc.hxx>
#include <com/sun/star/linguistic2/DictionaryListEventFlags.hpp>
#include <osl/mutex.hxx>
#include <unotools/linguprops.hxx>
using namespace osl;
using namespace com::sun::star;
using namespace com::sun::star::beans;
using namespace com::sun::star::lang;
using namespace com::sun::star::uno;
using namespace com::sun::star::linguistic2;
namespace linguistic
{
#define NUM_FLUSH_PROPS 8
const struct
{
OUString aPropName;
sal_Int32 nPropHdl;
} aFlushProperties[ NUM_FLUSH_PROPS ] =
{
{ UPN_IS_USE_DICTIONARY_LIST, UPH_IS_USE_DICTIONARY_LIST },
{ UPN_IS_IGNORE_CONTROL_CHARACTERS, UPH_IS_IGNORE_CONTROL_CHARACTERS },
{ UPN_IS_SPELL_UPPER_CASE, UPH_IS_SPELL_UPPER_CASE },
{ UPN_IS_SPELL_WITH_DIGITS, UPH_IS_SPELL_WITH_DIGITS },
{ UPN_IS_SPELL_CAPITALIZATION, UPH_IS_SPELL_CAPITALIZATION },
{ UPN_IS_SPELL_CLOSED_COMPOUND, UPH_IS_SPELL_CLOSED_COMPOUND },
{ UPN_IS_SPELL_HYPHENATED_COMPOUND, UPH_IS_SPELL_HYPHENATED_COMPOUND }
};
static void lcl_AddAsPropertyChangeListener(
const Reference< XPropertyChangeListener >& xListener,
Reference< XLinguProperties > const &rPropSet )
{
if (xListener.is() && rPropSet.is())
{
for (auto& aFlushProperty : aFlushProperties)
{
rPropSet->addPropertyChangeListener(
aFlushProperty.aPropName, xListener );
}
}
}
static void lcl_RemoveAsPropertyChangeListener(
const Reference< XPropertyChangeListener >& xListener,
Reference< XLinguProperties > const &rPropSet )
{
if (xListener.is() && rPropSet.is())
{
for (auto& aFlushProperty : aFlushProperties)
{
rPropSet->removePropertyChangeListener(
aFlushProperty.aPropName, xListener );
}
}
}
// Returns true if nHandle equals the property handle of any entry in
// aFlushProperties, false otherwise.
static bool lcl_IsFlushProperty( sal_Int32 nHandle )
{
    for (const auto& rEntry : aFlushProperties)
    {
        if (rEntry.nPropHdl == nHandle)
            return true;
    }
    return false;
}
// Replaces the dictionary list this listener is attached to.
// If rDL differs from the current list, the listener is removed from the old
// list (if any), rDL is stored, and the listener is added to the new list
// (if any). Passing an empty reference therefore just detaches the listener.
void FlushListener::SetDicList( Reference<XSearchableDictionaryList> const &rDL )
{
    MutexGuard aGuard( GetLinguMutex() );

    if (xDicList == rDL)
        return;     // nothing to do, already attached to this list

    if (xDicList.is())
        xDicList->removeDictionaryListEventListener( this );

    xDicList = rDL;

    if (xDicList.is())
        xDicList->addDictionaryListEventListener( this, false );
}
// Replaces the property set this listener is attached to.
// If rPS differs from the current property set, the listener is unregistered
// from the old set (if any), rPS is stored, and the listener is registered at
// the new set (if any) for all properties in aFlushProperties.
void FlushListener::SetPropSet( Reference< XLinguProperties > const &rPS )
{
    MutexGuard aGuard( GetLinguMutex() );

    if (xPropSet == rPS)
        return;     // nothing to do, already attached to this property set

    if (xPropSet.is())
        lcl_RemoveAsPropertyChangeListener( this, xPropSet );

    xPropSet = rPS;

    if (xPropSet.is())
        lcl_AddAsPropertyChangeListener( this, xPropSet );
}
// Called when an object this listener is attached to is being disposed.
// If the event source is the stored dictionary list and/or the stored
// property set, the listener is unregistered there and the corresponding
// reference is dropped.
void SAL_CALL FlushListener::disposing( const EventObject& rSource )
{
    MutexGuard aGuard( GetLinguMutex() );

    const bool bIsDicList = xDicList.is() && rSource.Source == xDicList;
    if (bIsDicList)
    {
        xDicList->removeDictionaryListEventListener( this );
        xDicList = nullptr;     //! release reference
    }

    const bool bIsPropSet = xPropSet.is() && rSource.Source == xPropSet;
    if (bIsPropSet)
    {
        lcl_RemoveAsPropertyChangeListener( this, xPropSet );
        xPropSet = nullptr;     //! release reference
    }
}
// Handles an event from the dictionary list. Events from any source other
// than the stored dictionary list are ignored. The spell cache is flushed if
// the condensed event contains at least one of ADD_NEG_ENTRY, DEL_POS_ENTRY,
// ACTIVATE_NEG_DIC or DEACTIVATE_POS_DIC.
void SAL_CALL FlushListener::processDictionaryListEvent(
        const DictionaryListEvent& rDicListEvent )
{
    MutexGuard aGuard( GetLinguMutex() );

    if (rDicListEvent.Source == xDicList)
    {
        sal_Int16 const nFlushMask =
                DictionaryListEventFlags::ADD_NEG_ENTRY |
                DictionaryListEventFlags::DEL_POS_ENTRY |
                DictionaryListEventFlags::ACTIVATE_NEG_DIC |
                DictionaryListEventFlags::DEACTIVATE_POS_DIC;
        sal_Int16 nCondensed = rDicListEvent.nCondensedEvent;

        if ((nCondensed & nFlushMask) != 0)
            mrSpellCache.Flush();
    }
}
// Handles a property change notification. If the event comes from the stored
// property set and its handle belongs to one of the properties listed in
// aFlushProperties, the spell cache is flushed.
void SAL_CALL FlushListener::propertyChange(
        const PropertyChangeEvent& rEvt )
{
    MutexGuard aGuard( GetLinguMutex() );

    if (!(rEvt.Source == xPropSet))
        return;     // not from the property set we are attached to

    if (lcl_IsFlushProperty( rEvt.PropertyHandle ))
        mrSpellCache.Flush();
}
// Creates the flush listener for this cache and attaches it to the
// dictionary list and the linguistic property set.
SpellCache::SpellCache()
{
    mxFlushLstnr = new FlushListener( *this );

    // The listener passes itself to the objects it attaches to, so it must
    // already be held by mxFlushLstnr before the Set... calls below.
    Reference<XSearchableDictionaryList> xDictionaries( GetDictionaryList() );
    mxFlushLstnr->SetDicList( xDictionaries );

    Reference<XLinguProperties> xProperties( GetLinguProperties() );
    mxFlushLstnr->SetPropSet( xProperties );
}
// Detaches the flush listener from the dictionary list and the property set
// by replacing both with empty references.
SpellCache::~SpellCache()
{
    mxFlushLstnr->SetDicList( Reference<XSearchableDictionaryList>() );
    mxFlushLstnr->SetPropSet( Reference<XLinguProperties>() );
}
void SpellCache::Flush()
{
MutexGuard aGuard( GetLinguMutex() );
// clear word list
LangWordList_t().swap(aWordLists);
}
bool SpellCache::CheckWord( const OUString& rWord, LanguageType nLang )
{
MutexGuard aGuard( GetLinguMutex() );
WordList_t &rList = aWordLists[ nLang ];
const WordList_t::const_iterator aIt = rList.find( rWord );
return aIt != rList.end();
}
void SpellCache::AddWord( const OUString& rWord, LanguageType nLang )
{
MutexGuard aGuard( GetLinguMutex() );
WordList_t & rList = aWordLists[ nLang ];
// occasional clean-up...
if (rList.size() > 500)
rList.clear();
rList.insert( rWord );
}
} // namespace linguistic
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */