983a62b547
Patches from Herbert Duerr: #i118925# fix old word-boundary emulation http://svn.apache.org/viewvc?view=revision&revision=1301596 #i119031# preserving ASCII in ignore-* transliterations allows full SIMPLE_TRANS_MASK http://svn.apache.org/viewvc?view=revision&revision=1301104 #i118887# ignore zero-length matches in regexp search http://svn.apache.org/viewvc?view=revision&revision=1242235 fix transliteration flags for search pattern preprocessing http://svn.apache.org/viewvc?view=revision&revision=1236199 fix minor typo in comment http://svn.apache.org/viewvc?view=revision&revision=1234799 improve standard conformance regarding unicode UAX#29 word boundaries http://svn.apache.org/viewvc?view=revision&revision=1234786 emulate word boundary matching of old regex engine The new ICU regex engine has much improved unicode capabilities. The old regex engine had the extensions \< and \> for matching word boundaries. For the convenience of a smooth upgrade experience these artifacts now get mapped to \b which is supported by almost all regex engines. http://svn.apache.org/viewvc?view=revision&revision=1234777 #i118723# fill in regexp matcher group details http://svn.apache.org/viewvc?view=revision&revision=1228084 use ICU regexp instead of LGPL i18nregexp http://svn.apache.org/viewvc?view=revision&revision=1177610 #i119031# default to preserve ASCII in ignore-width transliteration http://svn.apache.org/viewvc?view=revision&revision=1301101
63 lines
2.1 KiB
C++
63 lines
2.1 KiB
C++
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
|
/*
|
|
* This file is part of the LibreOffice project.
|
|
*
|
|
* This Source Code Form is subject to the terms of the Mozilla Public
|
|
* License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
*
|
|
* This file incorporates work covered by the following license notice:
|
|
*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed
|
|
* with this work for additional information regarding copyright
|
|
* ownership. The ASF licenses this file to you under the Apache
|
|
* License, Version 2.0 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
|
|
*/
|
|
|
|
// prevent internal compiler error with MSVC6SP3
|
|
#include <utility>
|
|
|
|
#define TRANSLITERATION_Width
|
|
#include <transliteration_Ignore.hxx>
|
|
#define TRANSLITERATION_fullwidthToHalfwidth
|
|
#define TRANSLITERATION_halfwidthToFullwidth
|
|
#include <transliteration_OneToOne.hxx>
|
|
|
|
using namespace com::sun::star::uno;
|
|
using namespace com::sun::star::lang;
|
|
|
|
using ::rtl::OUString;
|
|
|
|
namespace com { namespace sun { namespace star { namespace i18n {
|
|
|
|
OUString SAL_CALL
|
|
ignoreWidth::folding( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount, Sequence< sal_Int32 >& offset )
|
|
throw(RuntimeException)
|
|
{
|
|
fullwidthToHalfwidth t1;
|
|
return t1.transliterate(inStr, startPos, nCount, offset);
|
|
}
|
|
|
|
Sequence< OUString > SAL_CALL
|
|
ignoreWidth::transliterateRange( const OUString& str1, const OUString& str2 )
|
|
throw(RuntimeException)
|
|
{
|
|
fullwidthToHalfwidth t1;
|
|
halfwidthToFullwidth t2;
|
|
|
|
return transliteration_Ignore::transliterateRange(str1, str2, t1, t2);
|
|
}
|
|
|
|
sal_Unicode SAL_CALL
|
|
ignoreWidth::transliterateChar2Char( sal_Unicode inChar) throw(RuntimeException, MultipleCharsOutputException)
|
|
{
|
|
fullwidthToHalfwidth t1;
|
|
return t1.transliterateChar2Char(inChar);
|
|
}
|
|
|
|
} } } }
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|