4af9819795
2008/03/31 16:01:33 rt 1.16.10.1: #i87441# Change license header to LGPL v3.
688 lines
24 KiB
C++
688 lines
24 KiB
C++
/*************************************************************************
|
|
*
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
|
*
|
|
* Copyright 2008 by Sun Microsystems, Inc.
|
|
*
|
|
* OpenOffice.org - a multi-platform office productivity suite
|
|
*
|
|
* $RCSfile: transliterationImpl.cxx,v $
|
|
* $Revision: 1.17 $
|
|
*
|
|
* This file is part of OpenOffice.org.
|
|
*
|
|
* OpenOffice.org is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU Lesser General Public License version 3
|
|
* only, as published by the Free Software Foundation.
|
|
*
|
|
* OpenOffice.org is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU Lesser General Public License version 3 for more details
|
|
* (a copy is included in the LICENSE file that accompanied this code).
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public License
|
|
* version 3 along with OpenOffice.org. If not, see
|
|
* <http://www.openoffice.org/license.html>
|
|
* for a copy of the LGPLv3 License.
|
|
*
|
|
************************************************************************/
|
|
|
|
// MARKER(update_precomp.py): autogen include statement, do not remove
|
|
#include "precompiled_i18npool.hxx"
|
|
|
|
#include "transliterationImpl.hxx"
|
|
#include "servicename.hxx"
|
|
|
|
#include <com/sun/star/i18n/TransliterationType.hpp>
|
|
#include <com/sun/star/lang/XComponent.hpp>
|
|
#include <com/sun/star/container/XContentEnumerationAccess.hpp>
|
|
#include <com/sun/star/container/XEnumeration.hpp>
|
|
#include <com/sun/star/lang/XServiceInfo.hpp>
|
|
#include <com/sun/star/lang/XSingleServiceFactory.hpp>
|
|
|
|
#include <comphelper/processfactory.hxx>
|
|
#include <rtl/string.h>
|
|
#include <rtl/ustring.hxx>
|
|
#include <rtl/ustrbuf.hxx>
|
|
|
|
#if OSL_DEBUG_LEVEL > 1
|
|
#include <stdio.h>
|
|
#endif
|
|
|
|
using namespace com::sun::star::uno;
|
|
using namespace com::sun::star::lang;
|
|
using namespace rtl;
|
|
using namespace com::sun::star::container;
|
|
|
|
namespace com { namespace sun { namespace star { namespace i18n {
|
|
|
|
#define ERROR RuntimeException()
|
|
|
|
#define TmItem1( name ) \
|
|
{TransliterationModules_##name, TransliterationModulesNew_##name, #name}
|
|
|
|
#define TmItem2( name ) \
|
|
{(TransliterationModules)0, TransliterationModulesNew_##name, #name}
|
|
|
|
// Ignore Module list
|
|
static struct TMlist {
|
|
TransliterationModules tm;
|
|
TransliterationModulesNew tmn;
|
|
const sal_Char *implName;
|
|
} TMlist[] = { // Modules ModulesNew
|
|
TmItem1 (IGNORE_CASE), // 0. (1<<8 256) (7)
|
|
TmItem1 (IGNORE_WIDTH), // 1. (1<<9 512) (8)
|
|
TmItem1 (IGNORE_KANA), // 2. (1<<10 1024) (9)
|
|
// No enum define for this trans. application has to use impl name to load it
|
|
// TmItem1 (IGNORE_CASE_SIMPLE), // (1<<11 1024) (66)
|
|
|
|
TmItem1 (ignoreTraditionalKanji_ja_JP), // 3. (1<<12 4096) (10)
|
|
TmItem1 (ignoreTraditionalKana_ja_JP), // 4. (1<<13 8192) (11)
|
|
TmItem1 (ignoreMinusSign_ja_JP), // 5. (1<<13 16384) (12)
|
|
TmItem1 (ignoreIterationMark_ja_JP), // 6. (1<<14 32768) (13)
|
|
TmItem1 (ignoreSeparator_ja_JP), // 7. (1<<15 65536) (14)
|
|
TmItem1 (ignoreSize_ja_JP), // 15. (1<<23 16777216) (22)
|
|
TmItem1 (ignoreMiddleDot_ja_JP), // 17. (1<<25 67108864) (24)
|
|
TmItem1 (ignoreSpace_ja_JP), // 18. (1<<26 134217728) (25)
|
|
TmItem1 (ignoreZiZu_ja_JP), // 8. (1<<16 131072) (15)
|
|
TmItem1 (ignoreBaFa_ja_JP), // 9. (1<<17 262144) (16)
|
|
TmItem1 (ignoreTiJi_ja_JP), // 10. (1<<18 524288) (17)
|
|
TmItem1 (ignoreHyuByu_ja_JP), // 11. (1<<19 1048576) (18)
|
|
TmItem1 (ignoreSeZe_ja_JP), // 12. (1<<20 2097152) (19)
|
|
TmItem1 (ignoreIandEfollowedByYa_ja_JP), // 13. (1<<21 4194304) (20)
|
|
TmItem1 (ignoreKiKuFollowedBySa_ja_JP), // 14. (1<<22 8388608) (21)
|
|
TmItem1 (ignoreProlongedSoundMark_ja_JP), // 16. (1<<24 33554432) (23)
|
|
|
|
TmItem1 (UPPERCASE_LOWERCASE), // 19. (1) (1)
|
|
TmItem1 (LOWERCASE_UPPERCASE), // 20. (2) (2)
|
|
TmItem1 (HALFWIDTH_FULLWIDTH), // 21. (3) (3)
|
|
TmItem1 (FULLWIDTH_HALFWIDTH), // 22. (4) (4)
|
|
TmItem1 (KATAKANA_HIRAGANA), // 23. (5) (5)
|
|
TmItem1 (HIRAGANA_KATAKANA), // 24. (6) (6)
|
|
|
|
TmItem1 (smallToLarge_ja_JP), // 25. (1<<27 268435456) (26)
|
|
TmItem1 (largeToSmall_ja_JP), // 26. (1<<28 536870912) (27)
|
|
TmItem2 (NumToTextLower_zh_CN), // 27. () (28)
|
|
TmItem2 (NumToTextUpper_zh_CN), // 28. () (29)
|
|
TmItem2 (NumToTextLower_zh_TW), // 29. () (30)
|
|
TmItem2 (NumToTextUpper_zh_TW), // 30. () (31)
|
|
TmItem2 (NumToTextFormalHangul_ko), // 31. () (32)
|
|
TmItem2 (NumToTextFormalLower_ko), // 32. () (33)
|
|
TmItem2 (NumToTextFormalUpper_ko), // 33. () (34)
|
|
TmItem2 (NumToTextInformalHangul_ko), // 34. () (35)
|
|
TmItem2 (NumToTextInformalLower_ko), // 35. () (36)
|
|
TmItem2 (NumToTextInformalUpper_ko), // 36. () (37)
|
|
TmItem2 (NumToCharLower_zh_CN), // 37. () (38)
|
|
TmItem2 (NumToCharUpper_zh_CN), // 38. () (39)
|
|
TmItem2 (NumToCharLower_zh_TW), // 39. () (40)
|
|
TmItem2 (NumToCharUpper_zh_TW), // 40. () (41)
|
|
TmItem2 (NumToCharHangul_ko), // 41. () (42)
|
|
TmItem2 (NumToCharLower_ko), // 42. () (43)
|
|
TmItem2 (NumToCharUpper_ko), // 43. () (44)
|
|
TmItem2 (NumToCharFullwidth), // 44. () (45)
|
|
TmItem2 (NumToCharKanjiShort_ja_JP), // 45. () (46)
|
|
TmItem2 (TextToNumLower_zh_CN), // 46. () (47)
|
|
TmItem2 (TextToNumUpper_zh_CN), // 47. () (48)
|
|
TmItem2 (TextToNumLower_zh_TW), // 48. () (49)
|
|
TmItem2 (TextToNumUpper_zh_TW), // 49. () (50)
|
|
TmItem2 (TextToNumFormalHangul_ko), // 50. () (51)
|
|
TmItem2 (TextToNumFormalLower_ko), // 51. () (52)
|
|
TmItem2 (TextToNumFormalUpper_ko), // 52. () (53)
|
|
TmItem2 (TextToNumInformalHangul_ko), // 53. () (54)
|
|
TmItem2 (TextToNumInformalLower_ko), // 54. () (55)
|
|
TmItem2 (TextToNumInformalUpper_ko), // 55. () (56)
|
|
|
|
TmItem2 (CharToNumLower_zh_CN), // 56. () (59)
|
|
TmItem2 (CharToNumUpper_zh_CN), // 57. () (60)
|
|
TmItem2 (CharToNumLower_zh_TW), // 58. () (61)
|
|
TmItem2 (CharToNumUpper_zh_TW), // 59. () (62)
|
|
TmItem2 (CharToNumHangul_ko), // 60. () (63)
|
|
TmItem2 (CharToNumLower_ko), // 61. () (64)
|
|
TmItem2 (CharToNumUpper_ko), // 62. () (65)
|
|
|
|
// no enum defined for these trans. application has to use impl name to load them
|
|
// TmItem2 (NumToCharArabic_Indic), // () (67)
|
|
// TmItem2 (NumToCharEstern_Arabic_Indic),// () (68)
|
|
// TmItem2 (NumToCharIndic), // () (69)
|
|
// TmItem2 (NumToCharThai), // () (70)
|
|
{(TransliterationModules)0, (TransliterationModulesNew)0, NULL}
|
|
};
|
|
|
|
// Static member shared by all instances; loadBody() keeps the most recently
// created transliteration body (and its name) in here.
TransliterationImpl::TransBody TransliterationImpl::lastTransBody;

// Constructor/Destructor

/** Starts with no module loaded and, if a service factory is supplied,
    asks it for the com.sun.star.i18n.LocaleData service.

    @param xMSF  service factory; stored in xSMgr. May be empty, in which
                 case localedata stays unset.
 */
TransliterationImpl::TransliterationImpl(const Reference <XMultiServiceFactory>& xMSF) : xSMgr(xMSF)
{
    numCascade = 0;
    caseignoreOnly = sal_True;

    if ( !xMSF.is() )
        return;

    Reference < XInterface > xLocaleService =
        xMSF->createInstance(OUString::createFromAscii("com.sun.star.i18n.LocaleData"));
    if ( !xLocaleService.is() )
        return;

    // Query the created service for XLocaleData and keep the result.
    Any aQueried = xLocaleService->queryInterface(
        ::getCppuType( (const uno::Reference< i18n::XLocaleData >*)0) );
    aQueried >>= localedata;
}
|
|
|
|
/** Drops the locale data reference and then every loaded module. */
TransliterationImpl::~TransliterationImpl()
{
    localedata.clear();
    clear();    // releases bodyCascade[] and caseignore
}
|
|
|
|
|
|
// Methods
|
|
/** Name of the loaded transliteration.

    @return "Not Loaded" when no module is loaded, otherwise the name
            reported by the single loaded module.
    @throws RuntimeException  when more than one module is loaded, or the
            single slot holds no module.
 */
OUString SAL_CALL
TransliterationImpl::getName() throw(RuntimeException)
{
    if (numCascade < 1)
        return ( OUString::createFromAscii("Not Loaded"));

    const bool bSingleModule = (numCascade == 1) && bodyCascade[0].is();
    if (bSingleModule)
        return bodyCascade[0]->getName();

    throw ERROR;
}
|
|
|
|
/** Type of the loaded transliteration.

    @return CASCADE|IGNORE when more than one module is loaded, otherwise
            the type reported by the single loaded module.
    @throws RuntimeException  when nothing usable is loaded.
 */
sal_Int16 SAL_CALL
TransliterationImpl::getType() throw(RuntimeException)
{
    if (numCascade > 1)
        return (TransliterationType::CASCADE|TransliterationType::IGNORE);

    const bool bHaveFirst = (numCascade > 0) && bodyCascade[0].is();
    if (!bHaveFirst)
        throw ERROR;

    return(bodyCascade[0]->getType());
}
|
|
|
|
void SAL_CALL
|
|
TransliterationImpl::loadModule( TransliterationModules modType, const Locale& rLocale )
|
|
throw(RuntimeException)
|
|
{
|
|
clear();
|
|
if (modType&TransliterationModules_IGNORE_MASK && modType&TransliterationModules_NON_IGNORE_MASK) {
|
|
throw ERROR;
|
|
} else if (modType&TransliterationModules_IGNORE_MASK) {
|
|
#define TransliterationModules_IGNORE_CASE_MASK (TransliterationModules_IGNORE_CASE | \
|
|
TransliterationModules_IGNORE_WIDTH | \
|
|
TransliterationModules_IGNORE_KANA)
|
|
sal_Int32 mask = ((modType&TransliterationModules_IGNORE_CASE_MASK) == modType) ?
|
|
TransliterationModules_IGNORE_CASE_MASK : TransliterationModules_IGNORE_MASK;
|
|
for (sal_Int16 i = 0; TMlist[i].tm & mask; i++) {
|
|
if (modType & TMlist[i].tm)
|
|
if (loadModuleByName(OUString::createFromAscii(TMlist[i].implName),
|
|
bodyCascade[numCascade], rLocale))
|
|
numCascade++;
|
|
}
|
|
} else if (modType&TransliterationModules_NON_IGNORE_MASK) {
|
|
for (sal_Int16 i = 0; TMlist[i].tm; i++) {
|
|
if (TMlist[i].tm == modType) {
|
|
if (loadModuleByName(OUString::createFromAscii(TMlist[i].implName), bodyCascade[numCascade], rLocale))
|
|
numCascade++;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void SAL_CALL
|
|
TransliterationImpl::loadModuleNew( const Sequence < TransliterationModulesNew > & modType, const Locale& rLocale )
|
|
throw(RuntimeException)
|
|
{
|
|
clear();
|
|
sal_Int32 mask = 0, count = modType.getLength();
|
|
if (count > maxCascade)
|
|
throw ERROR; // could not handle more than maxCascade
|
|
for (sal_Int16 i = 0; i < count; i++) {
|
|
for (sal_Int16 j = 0; TMlist[j].tmn; j++) {
|
|
if (TMlist[j].tmn == modType[i]) {
|
|
if (mask == 0)
|
|
mask = TMlist[i].tm && (TMlist[i].tm&TransliterationModules_IGNORE_MASK) ?
|
|
TransliterationModules_IGNORE_MASK : TransliterationModules_NON_IGNORE_MASK;
|
|
else if (mask == TransliterationModules_IGNORE_MASK &&
|
|
(TMlist[i].tm&TransliterationModules_IGNORE_MASK) == 0)
|
|
throw ERROR; // could not mess up ignore trans. with non_ignore trans.
|
|
if (loadModuleByName(OUString::createFromAscii(TMlist[j].implName), bodyCascade[numCascade], rLocale))
|
|
numCascade++;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void SAL_CALL
|
|
TransliterationImpl::loadModuleByImplName(const OUString& implName, const Locale& rLocale)
|
|
throw(RuntimeException)
|
|
{
|
|
clear();
|
|
if (loadModuleByName(implName, bodyCascade[numCascade], rLocale))
|
|
numCascade++;
|
|
}
|
|
|
|
|
|
void SAL_CALL
|
|
TransliterationImpl::loadModulesByImplNames(const Sequence< OUString >& implNameList, const Locale& rLocale ) throw(RuntimeException)
|
|
{
|
|
if (implNameList.getLength() > maxCascade || implNameList.getLength() <= 0)
|
|
throw ERROR;
|
|
|
|
clear();
|
|
for (sal_Int32 i = 0; i < implNameList.getLength(); i++)
|
|
if (loadModuleByName(implNameList[i], bodyCascade[numCascade], rLocale))
|
|
numCascade++;
|
|
}
|
|
|
|
|
|
/** Lists the transliterations of a locale that match a type mask.

    The candidate names come from the locale data; each candidate is loaded
    and kept when its getType() shares a bit with sType.

    @param rLocale  locale to query
    @param sType    TransliterationType bit mask to filter by
    @return names of the matching transliterations
    @throws RuntimeException  when no locale data service is available
            (the constructor leaves localedata empty if it could not be
            obtained), or when a candidate cannot be loaded.
 */
Sequence<OUString> SAL_CALL
TransliterationImpl::getAvailableModules( const Locale& rLocale, sal_Int16 sType ) throw(RuntimeException)
{
    // Fail with the declared exception instead of dereferencing an empty
    // reference.
    if (!localedata.is())
        throw ERROR;

    const Sequence<OUString> &translist = localedata->getTransliterations(rLocale);
    const sal_Int32 nCandidates = translist.getLength();

    Sequence<OUString> r(nCandidates);
    Reference<XExtendedTransliteration> body;
    sal_Int32 n = 0;
    for (sal_Int32 i = 0; i < nCandidates; i++)
    {
        if (!loadModuleByName(translist[i], body, rLocale))
            continue;
        if (body->getType() & sType)
            r[n++] = translist[i];
        body.clear();
    }
    r.realloc(n);   // shrink to the number of matches
    return (r);
}
|
|
|
|
|
|
/** Runs inStr[startPos, startPos+nCount) through every loaded module.

    @param inStr     input string
    @param startPos  first character to transliterate
    @param nCount    number of characters to transliterate
    @param offset    receives, per output character, an index into inStr
    @return the transliterated text; inStr itself (unchanged, offset not
            touched) when no module is loaded.
 */
OUString SAL_CALL
TransliterationImpl::transliterate( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount,
        Sequence< sal_Int32 >& offset ) throw(RuntimeException)
{
    if (numCascade == 0)
        return inStr;

    if (offset.getLength() != nCount)
        offset.realloc(nCount);

    if (numCascade == 1)
    {
        // Whole string requested: no copy and no offset shifting needed.
        if ( startPos == 0 && nCount == inStr.getLength() )
            return bodyCascade[0]->transliterate( inStr, 0, nCount, offset);

        OUString aSingle = inStr.copy(startPos, nCount);
        aSingle = bodyCascade[0]->transliterate(aSingle, 0, nCount, offset);
        if ( startPos != 0 )
        {
            // The module saw a copy starting at 0; shift back into inStr.
            sal_Int32 * pShift = offset.getArray();
            const sal_Int32 nShift = offset.getLength();
            for (sal_Int32 n = 0; n < nShift; ++n)
                pShift[n] += startPos;
        }
        return aSingle;
    }

    // Cascade of several modules.
    OUString aWork = inStr.copy(startPos, nCount);

    // Start from the identity mapping into inStr.
    sal_Int32 * pIdentity = offset.getArray();
    for (sal_Int32 n = 0; n < nCount; ++n)
        pIdentity[n] = startPos + n;

    // Two buffers used alternately: one receives the offsets of the current
    // stage, the other carries the mapping accumulated so far.
    Sequence<sal_Int32> off[2];
    sal_Int16 from = 0, to = 1;

    off[to] = offset;
    off[from].realloc(nCount);
    for (sal_Int32 nStage = 0; nStage < numCascade; ++nStage) {
        aWork = bodyCascade[nStage]->transliterate(aWork, 0, nCount, off[from]);

        nCount = aWork.getLength();

        const sal_Int16 nOldTo = to;
        to = from;
        from = nOldTo;

        // Compose this stage's offsets with the accumulated mapping.
        for (sal_Int32 n = 0; n < nCount; ++n)
            off[to][n] = off[from][off[to][n]];
    }
    offset = off[to];
    return aWork;
}
|
|
|
|
|
|
//
|
|
/** Runs inStr[startPos, startPos+nCount) through folding() of every
    loaded module.

    @param inStr     input string
    @param startPos  first character to fold
    @param nCount    number of characters to fold
    @param offset    receives, per output character, an index into inStr
    @return the folded text; inStr itself (unchanged, offset not touched)
            when no module is loaded.
 */
OUString SAL_CALL
TransliterationImpl::folding( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount,
        Sequence< sal_Int32 >& offset ) throw(RuntimeException)
{
    if (numCascade == 0)
        return inStr;

    if (offset.getLength() != nCount)
        offset.realloc(nCount);

    if (numCascade == 1)
    {
        // Whole string requested: no copy and no offset shifting needed.
        if ( startPos == 0 && nCount == inStr.getLength() )
            return bodyCascade[0]->folding( inStr, 0, nCount, offset);

        OUString aSingle = inStr.copy(startPos, nCount);
        aSingle = bodyCascade[0]->folding(aSingle, 0, nCount, offset);
        if ( startPos != 0 )
        {
            // The module saw a copy starting at 0; shift back into inStr.
            sal_Int32 * pShift = offset.getArray();
            const sal_Int32 nShift = offset.getLength();
            for (sal_Int32 n = 0; n < nShift; ++n)
                pShift[n] += startPos;
        }
        return aSingle;
    }

    // Cascade of several modules.
    OUString aWork = inStr.copy(startPos, nCount);

    // Start from the identity mapping into inStr.
    sal_Int32 * pIdentity = offset.getArray();
    for (sal_Int32 n = 0; n < nCount; ++n)
        pIdentity[n] = startPos + n;

    // Two buffers used alternately: one receives the offsets of the current
    // stage, the other carries the mapping accumulated so far.
    Sequence<sal_Int32> off[2];
    sal_Int16 from = 0, to = 1;

    off[to] = offset;
    for (sal_Int32 nStage = 0; nStage < numCascade; ++nStage) {
        aWork = bodyCascade[nStage]->folding(aWork, 0, nCount, off[from]);

        nCount = aWork.getLength();

        const sal_Int16 nOldTo = to;
        to = from;
        from = nOldTo;

        // Compose this stage's offsets with the accumulated mapping.
        for (sal_Int32 n = 0; n < nCount; ++n)
            off[to][n] = off[from][off[to][n]];
    }
    offset = off[to];
    return aWork;
}
|
|
|
|
/** Transliterates a substring without producing offsets.

    The first module works on inStr[startPos, startPos+nCount); every
    further module works on the complete output of its predecessor.

    @return the transliterated text, or inStr itself when no module is
            loaded.
 */
OUString SAL_CALL
TransliterationImpl::transliterateString2String( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount ) throw(RuntimeException)
{
    if (numCascade == 0)
        return inStr;

    OUString aResult = bodyCascade[0]->transliterateString2String(inStr, startPos, nCount);

    // Not entered when exactly one module is loaded.
    for (sal_Int32 nStage = 1; nStage < numCascade; nStage++)
        aResult = bodyCascade[nStage]->transliterateString2String(aResult, 0, aResult.getLength());

    return aResult;
}
|
|
|
|
/** Transliterates one character into a string.

    The first module converts the character; every further module works on
    the complete output of its predecessor.

    @return the transliterated text, or a one-character string holding
            inChar when no module is loaded.
 */
OUString SAL_CALL
TransliterationImpl::transliterateChar2String( sal_Unicode inChar ) throw(RuntimeException)
{
    if (numCascade == 0)
        return OUString(&inChar, 1);

    OUString aResult = bodyCascade[0]->transliterateChar2String(inChar);

    // Not entered when exactly one module is loaded.
    for (sal_Int32 nStage = 1; nStage < numCascade; nStage++)
        aResult = bodyCascade[nStage]->transliterateString2String(aResult, 0, aResult.getLength());

    return aResult;
}
|
|
|
|
/** Transliterates one character into one character by passing it through
    every loaded module in cascade order.

    @return the resulting character; inChar when no module is loaded.
 */
sal_Unicode SAL_CALL
TransliterationImpl::transliterateChar2Char( sal_Unicode inChar ) throw(MultipleCharsOutputException, RuntimeException)
{
    sal_Unicode cCurrent = inChar;
    sal_Int32 nStage = 0;
    while (nStage < numCascade) {
        cCurrent = bodyCascade[nStage]->transliterateChar2Char(cCurrent);
        ++nStage;
    }
    return cCurrent;
}
|
|
|
|
|
|
/** Compares two substrings after folding them with the loaded modules.

    Negative counts are interpreted as "the nCount characters before pos".
    Ranges that reach past the end of their string are clipped.

    @param str1,pos1,nCount1  first substring
    @param nMatch1            receives how far the first substring matched
    @param str2,pos2,nCount2  second substring
    @param nMatch2            receives how far the second substring matched
    @return sal_True when the folded substrings are identical
 */
sal_Bool SAL_CALL
TransliterationImpl::equals(
    const OUString& str1, sal_Int32 pos1, sal_Int32 nCount1, sal_Int32& nMatch1,
    const OUString& str2, sal_Int32 pos2, sal_Int32 nCount2, sal_Int32& nMatch2)
    throw(RuntimeException)
{
    // since this is an API function make it user fail safe
    if ( nCount1 < 0 ) {
        pos1 += nCount1;
        nCount1 = -nCount1;
    }
    if ( nCount2 < 0 ) {
        pos2 += nCount2;
        nCount2 = -nCount2;
    }
    if ( !nCount1 || !nCount2 ||
            pos1 >= str1.getLength() || pos2 >= str2.getLength() ||
            pos1 < 0 || pos2 < 0 ) {
        nMatch1 = nMatch2 = 0;
        // two empty strings return true, else false
        return !nCount1 && !nCount2 && pos1 == str1.getLength() && pos2 == str2.getLength();
    }
    if ( pos1 + nCount1 > str1.getLength() )
        nCount1 = str1.getLength() - pos1;
    if ( pos2 + nCount2 > str2.getLength() )
        nCount2 = str2.getLength() - pos2;

    // Only case/width/kana ignore modules loaded: let caseignore do the work.
    if (caseignoreOnly && caseignore.is())
        return caseignore->equals(str1, pos1, nCount1, nMatch1, str2, pos2, nCount2, nMatch2);

    Sequence<sal_Int32> offset1, offset2;

    OUString tmpStr1 = folding(str1, pos1, nCount1, offset1);
    OUString tmpStr2 = folding(str2, pos2, nCount2, offset2);

    const sal_Unicode *p1 = tmpStr1.getStr();
    const sal_Unicode *p2 = tmpStr2.getStr();

    // Compare only the common prefix. The previous code compared
    // tmpStr1.getLength() with itself and therefore always used the length
    // of tmpStr2, running past tmpStr1 (and offset1) when tmpStr2 was longer.
    const sal_Int32 nLen1 = tmpStr1.getLength();
    const sal_Int32 nLen2 = tmpStr2.getLength();
    const sal_Int32 nLen = (nLen1 < nLen2 ? nLen1 : nLen2);

    sal_Int32 i;
    for (i = 0; i < nLen; ++i, ++p1, ++p2 ) {
        if (*p1 != *p2) {
            // return number of matched code points so far; fall back to the
            // plain index if folding() did not fill the offset sequence
            nMatch1 = (i < offset1.getLength()) ? offset1[i] : i;
            nMatch2 = (i < offset2.getLength()) ? offset2[i] : i;
            return sal_False;
        }
    }
    // i==nLen
    if ( nLen1 != nLen2 ) {
        // return number of matched code points so far; i may be 0 here when
        // one folded string is empty, so offset[i-1] must be guarded
        nMatch1 = (i > 0 && i <= offset1.getLength()) ? offset1[i-1] + 1 : i;
        nMatch2 = (i > 0 && i <= offset2.getLength()) ? offset2[i-1] + 1 : i;
        return sal_False;
    } else {
        nMatch1 = nCount1;
        nMatch2 = nCount2;
        return sal_True;
    }
}
|
|
|
|
#define MaxOutput 2
|
|
|
|
Sequence< OUString > SAL_CALL
|
|
TransliterationImpl::getRange(const Sequence< OUString > &inStrs,
|
|
const sal_Int32 length, sal_Int16 _numCascade) throw(RuntimeException)
|
|
{
|
|
if (_numCascade >= numCascade || ! bodyCascade[_numCascade].is())
|
|
return inStrs;
|
|
|
|
sal_Int32 j_tmp = 0;
|
|
Sequence< OUString > ostr(MaxOutput*length);
|
|
for (sal_Int32 j = 0; j < length; j+=2) {
|
|
const Sequence< OUString >& temp = bodyCascade[_numCascade]->transliterateRange(inStrs[j], inStrs[j+1]);
|
|
|
|
for ( sal_Int32 k = 0; k < temp.getLength(); k++) {
|
|
if ( j_tmp >= MaxOutput*length ) throw ERROR;
|
|
ostr[j_tmp++] = temp[k];
|
|
}
|
|
}
|
|
ostr.realloc(j_tmp);
|
|
|
|
return this->getRange(ostr, j_tmp, ++_numCascade);
|
|
}
|
|
|
|
|
|
/** Transliterates the range [str1, str2].

    With exactly one module loaded the call is forwarded to it; otherwise
    the pair is passed through getRange() starting at module 0.
 */
Sequence< OUString > SAL_CALL
TransliterationImpl::transliterateRange( const OUString& str1, const OUString& str2 )
throw(RuntimeException)
{
    if (numCascade == 1)
        return bodyCascade[0]->transliterateRange(str1, str2);

    Sequence< OUString > aBounds(2);
    OUString * pBounds = aBounds.getArray();
    pBounds[0] = str1;
    pBounds[1] = str2;

    return this->getRange(aBounds, 2, 0);
}
|
|
|
|
|
|
/** Compares two substrings after transliterating both.

    @return 0 when equal, 1 when the first is greater, -1 when it is
            smaller; a string that is a proper prefix of the other is the
            smaller one.
 */
sal_Int32 SAL_CALL
TransliterationImpl::compareSubstring(
    const OUString& str1, sal_Int32 off1, sal_Int32 len1,
    const OUString& str2, sal_Int32 off2, sal_Int32 len2)
    throw(RuntimeException)
{
    // Only case/width/kana ignore modules loaded: let caseignore do the work.
    if (caseignoreOnly && caseignore.is())
        return caseignore->compareSubstring(str1, off1, len1, str2, off2, len2);

    Sequence <sal_Int32> offset;    // required by transliterate(), result unused

    OUString aLeft  = this->transliterate(str1, off1, len1, offset);
    OUString aRight = this->transliterate(str2, off2, len2, offset);

    const sal_Unicode* pLeft  = aLeft.getStr();
    const sal_Unicode* pRight = aRight.getStr();
    const sal_Int32 nLeft  = aLeft.getLength();
    const sal_Int32 nRight = aRight.getLength();

    // The first differing code unit within the common prefix decides.
    for (sal_Int32 n = 0; n < nLeft && n < nRight; ++n) {
        if (pLeft[n] != pRight[n])
            return pLeft[n] > pRight[n] ? 1 : -1;
    }

    // Common prefix is equal: the longer string is the greater one.
    if (nLeft == nRight)
        return 0;
    return nLeft > nRight ? 1 : -1;
}
|
|
|
|
|
|
/** Compares two complete strings; see compareSubstring() for the result. */
sal_Int32 SAL_CALL
TransliterationImpl::compareString(const OUString& str1, const OUString& str2 ) throw (RuntimeException)
{
    const bool bUseCaseIgnore = caseignoreOnly && caseignore.is();
    if (!bUseCaseIgnore)
        return this->compareSubstring(str1, 0, str1.getLength(), str2, 0, str2.getLength());

    return caseignore->compareString(str1, str2);
}
|
|
|
|
|
|
void
|
|
TransliterationImpl::clear()
|
|
{
|
|
for (sal_Int32 i = 0; i < numCascade; i++)
|
|
if (bodyCascade[i].is())
|
|
bodyCascade[i].clear();
|
|
numCascade = 0;
|
|
caseignore.clear();
|
|
caseignoreOnly = sal_True;
|
|
}
|
|
|
|
/** Finds the transliteration implementation called implName and stores an
    instance of it in body.

    The most recently created body is kept in the static lastTransBody and
    reused when the same name is requested again. Access to that cache is
    serialized through lastTransBody.mutex.

    @param implName  full implementation name to look for
    @param body      receives the instance
    @throws RuntimeException  when the service manager cannot enumerate
            services, or no matching implementation could be instantiated.
 */
void TransliterationImpl::loadBody( OUString &implName, Reference<XExtendedTransliteration>& body )
    throw (RuntimeException)
{
    ::osl::MutexGuard guard(lastTransBody.mutex);

    if (implName.equals(lastTransBody.Name))
    {
        // Use the cached body instead of going through the expensive looping again.
        body = lastTransBody.Body;
        return;
    }

    Reference< XContentEnumerationAccess > xEnumAccess( xSMgr, UNO_QUERY );
    // xSMgr may be empty or may not support enumeration; report that with
    // the declared exception instead of dereferencing an empty reference.
    if (!xEnumAccess.is())
        throw ERROR;

    Reference< XEnumeration > xEnum(xEnumAccess->createContentEnumeration(
                                    OUString::createFromAscii(TRLT_SERVICELNAME_L10N)));
    if (xEnum.is()) {
        while (xEnum->hasMoreElements()) {
            Any a = xEnum->nextElement();

            Reference< XServiceInfo > xsInfo;
            if (!(a >>= xsInfo))
                continue;
            if (!implName.equals(xsInfo->getImplementationName()))
                continue;

            Reference< XSingleServiceFactory > xFactory;
            if (!(a >>= xFactory))
                continue;

            Reference< XInterface > xI = xFactory->createInstance();
            if (!xI.is())
                continue;

            a = xI->queryInterface(::getCppuType((
                        const Reference<XExtendedTransliteration>*)0));
            a >>= body;

            // Remember the instance for the next request of the same name.
            lastTransBody.Name = implName;
            lastTransBody.Body = body;
            return;
        }
    }
    throw ERROR;
}
|
|
|
|
/** Loads the module called implName into body and initializes it for
    rLocale.

    If the module is one of the first three TMlist rows (ignore
    case/width/kana) the shared caseignore helper is set up as well;
    any other module clears caseignoreOnly.

    @param implName  implementation name without TRLT_IMPLNAME_PREFIX
    @param body      receives the module
    @param rLocale   locale handed to the module
    @return whether body holds a module afterwards
 */
sal_Bool SAL_CALL
TransliterationImpl::loadModuleByName( const OUString& implName,
        Reference<XExtendedTransliteration>& body, const Locale& rLocale) throw(RuntimeException)
{
    OUString aFullName = OUString::createFromAscii(TRLT_IMPLNAME_PREFIX) + implName;
    loadBody(aFullName, body);
    if (!body.is())
        return sal_False;

    body->loadModule((TransliterationModules)0, rLocale); // toUpper/toLower need rLocale

    // if the module is ignore case/kana/width, load caseignore for the
    // equals/compareString methods
    for (sal_Int16 nRow = 0; nRow < 3; nRow++) {
        if (implName.compareToAscii(TMlist[nRow].implName) != 0)
            continue;

        if (nRow == 0) // current module is caseignore
            body->loadModule(TMlist[0].tm, rLocale); // caseignore needs to set up the module name

        if (! caseignore.is()) {
            OUString aCaseIgnoreName = OUString::createFromAscii(TRLT_IMPLNAME_PREFIX) +
                OUString::createFromAscii(TMlist[0].implName);
            loadBody(aCaseIgnoreName, caseignore);
        }
        if (caseignore.is())
            caseignore->loadModule(TMlist[nRow].tm, rLocale);
        return sal_True;
    }

    caseignoreOnly = sal_False; // has other module than just ignore case/kana/width
    return body.is();
}
|
|
|
|
const sal_Char cTrans[] = "com.sun.star.i18n.Transliteration";
|
|
|
|
OUString SAL_CALL
|
|
TransliterationImpl::getImplementationName() throw( RuntimeException )
|
|
{
|
|
return OUString::createFromAscii(cTrans);
|
|
}
|
|
|
|
|
|
/** @return whether rServiceName equals cTrans, the only supported service. */
sal_Bool SAL_CALL
TransliterationImpl::supportsService(const OUString& rServiceName) throw( RuntimeException )
{
    return rServiceName.compareToAscii(cTrans) == 0;
}
|
|
|
|
/** @return a one-element sequence holding cTrans. */
Sequence< OUString > SAL_CALL
TransliterationImpl::getSupportedServiceNames(void) throw( RuntimeException )
{
    const OUString aServiceName = OUString::createFromAscii(cTrans);
    return Sequence< OUString >(&aServiceName, 1);
}
|
|
|
|
} } } }
|