2010-10-14 01:27:31 -05:00
|
|
|
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
|
2002-03-26 06:36:40 -06:00
|
|
|
/*************************************************************************
|
|
|
|
*
|
2008-04-10 02:39:53 -05:00
|
|
|
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
|
2002-03-26 06:36:40 -06:00
|
|
|
*
|
2010-02-12 08:01:35 -06:00
|
|
|
* Copyright 2000, 2010 Oracle and/or its affiliates.
|
2002-03-26 10:57:44 -06:00
|
|
|
*
|
2008-04-10 02:39:53 -05:00
|
|
|
* OpenOffice.org - a multi-platform office productivity suite
|
2002-03-26 10:57:44 -06:00
|
|
|
*
|
2008-04-10 02:39:53 -05:00
|
|
|
* This file is part of OpenOffice.org.
|
2002-03-26 06:36:40 -06:00
|
|
|
*
|
2008-04-10 02:39:53 -05:00
|
|
|
* OpenOffice.org is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU Lesser General Public License version 3
|
|
|
|
* only, as published by the Free Software Foundation.
|
2002-03-26 06:36:40 -06:00
|
|
|
*
|
2008-04-10 02:39:53 -05:00
|
|
|
* OpenOffice.org is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU Lesser General Public License version 3 for more details
|
|
|
|
* (a copy is included in the LICENSE file that accompanied this code).
|
2002-03-26 06:36:40 -06:00
|
|
|
*
|
2008-04-10 02:39:53 -05:00
|
|
|
* You should have received a copy of the GNU Lesser General Public License
|
|
|
|
* version 3 along with OpenOffice.org. If not, see
|
|
|
|
* <http://www.openoffice.org/license.html>
|
|
|
|
* for a copy of the LGPLv3 License.
|
2002-03-26 06:36:40 -06:00
|
|
|
*
|
|
|
|
************************************************************************/
|
|
|
|
#ifndef _I18N_CCLASS_UNICODE_HXX_
|
|
|
|
#define _I18N_CCLASS_UNICODE_HXX_
|
|
|
|
|
2003-04-24 05:02:43 -05:00
|
|
|
#include <com/sun/star/i18n/XNativeNumberSupplier.hpp>
|
2002-03-26 06:36:40 -06:00
|
|
|
#include <com/sun/star/i18n/XCharacterClassification.hpp>
|
|
|
|
#include <com/sun/star/i18n/XLocaleData.hpp>
|
2003-04-15 08:24:07 -05:00
|
|
|
#include <com/sun/star/lang/XMultiServiceFactory.hpp>
|
2002-03-26 06:36:40 -06:00
|
|
|
#include <cppuhelper/implbase1.hxx> // helper for implementations
|
|
|
|
#include <com/sun/star/lang/XServiceInfo.hpp>
|
|
|
|
|
|
|
|
#define TRANSLITERATION_casemapping
|
|
|
|
#include <transliteration_body.hxx>
|
|
|
|
|
|
|
|
namespace com { namespace sun { namespace star { namespace i18n {
|
|
|
|
|
|
|
|
typedef sal_uInt32 UPT_FLAG_TYPE;
|
|
|
|
|
|
|
|
class cclass_Unicode : public cppu::WeakImplHelper1 < XCharacterClassification >
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
cclass_Unicode(com::sun::star::uno::Reference < com::sun::star::lang::XMultiServiceFactory > xSMgr );
|
|
|
|
~cclass_Unicode();
|
|
|
|
|
|
|
|
virtual rtl::OUString SAL_CALL toUpper( const rtl::OUString& Text, sal_Int32 nPos, sal_Int32 nCount,
|
|
|
|
const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual rtl::OUString SAL_CALL toLower( const rtl::OUString& Text, sal_Int32 nPos, sal_Int32 nCount,
|
|
|
|
const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual rtl::OUString SAL_CALL toTitle( const rtl::OUString& Text, sal_Int32 nPos, sal_Int32 nCount,
|
|
|
|
const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual sal_Int16 SAL_CALL getType( const rtl::OUString& Text, sal_Int32 nPos ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual sal_Int16 SAL_CALL getCharacterDirection( const rtl::OUString& Text, sal_Int32 nPos )
|
|
|
|
throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual sal_Int16 SAL_CALL getScript( const rtl::OUString& Text, sal_Int32 nPos ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual sal_Int32 SAL_CALL getCharacterType( const rtl::OUString& text, sal_Int32 nPos,
|
|
|
|
const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual sal_Int32 SAL_CALL getStringType( const rtl::OUString& text, sal_Int32 nPos, sal_Int32 nCount,
|
|
|
|
const com::sun::star::lang::Locale& rLocale ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual ParseResult SAL_CALL parseAnyToken( const rtl::OUString& Text, sal_Int32 nPos,
|
|
|
|
const com::sun::star::lang::Locale& rLocale, sal_Int32 nStartCharFlags, const rtl::OUString& userDefinedCharactersStart,
|
|
|
|
sal_Int32 nContCharFlags, const rtl::OUString& userDefinedCharactersCont ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
virtual ParseResult SAL_CALL parsePredefinedToken( sal_Int32 nTokenType, const rtl::OUString& Text,
|
|
|
|
sal_Int32 nPos, const com::sun::star::lang::Locale& rLocale, sal_Int32 nStartCharFlags,
|
|
|
|
const rtl::OUString& userDefinedCharactersStart, sal_Int32 nContCharFlags,
|
|
|
|
const rtl::OUString& userDefinedCharactersCont ) throw(com::sun::star::uno::RuntimeException);
|
|
|
|
|
|
|
|
//XServiceInfo
|
|
|
|
virtual rtl::OUString SAL_CALL getImplementationName() throw( com::sun::star::uno::RuntimeException );
|
|
|
|
virtual sal_Bool SAL_CALL supportsService(const rtl::OUString& ServiceName) throw( com::sun::star::uno::RuntimeException );
|
|
|
|
virtual com::sun::star::uno::Sequence< rtl::OUString > SAL_CALL getSupportedServiceNames() throw( com::sun::star::uno::RuntimeException );
|
|
|
|
|
|
|
|
protected:
|
2004-01-20 06:16:36 -06:00
|
|
|
const sal_Char *cClass;
|
2002-03-26 06:36:40 -06:00
|
|
|
|
|
|
|
private:
|
|
|
|
Transliteration_casemapping *trans;
|
|
|
|
|
|
|
|
// --- parser specific (implemented in cclass_unicode_parser.cxx) ---
|
|
|
|
|
|
|
|
enum ScanState
|
|
|
|
{
|
|
|
|
ssGetChar,
|
|
|
|
ssGetValue,
|
|
|
|
ssGetWord,
|
|
|
|
ssGetWordFirstChar,
|
|
|
|
ssGetString,
|
|
|
|
ssGetBool,
|
2002-09-20 10:12:55 -05:00
|
|
|
ssRewindFromValue,
|
2005-11-01 07:51:41 -06:00
|
|
|
ssIgnoreLeadingInRewind,
|
2002-03-26 06:36:40 -06:00
|
|
|
ssStopBack,
|
|
|
|
ssBounce,
|
|
|
|
ssStop
|
|
|
|
};
|
|
|
|
|
|
|
|
static const sal_uInt8 nDefCnt;
|
|
|
|
static const UPT_FLAG_TYPE pDefaultParserTable[];
|
|
|
|
static const sal_Int32 pParseTokensType[];
|
|
|
|
|
|
|
|
/// Flag values of table.
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_ILLEGAL;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_CHAR;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_CHAR_BOOL;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_CHAR_WORD;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_CHAR_VALUE;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_CHAR_STRING;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_CHAR_DONTCARE;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_BOOL;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_WORD;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_WORD_SEP;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_VALUE;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_VALUE_SEP;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_VALUE_EXP;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_VALUE_SIGN;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_VALUE_EXP_VALUE;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_VALUE_DIGIT;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_NAME_SEP;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_STRING_SEP;
|
|
|
|
static const UPT_FLAG_TYPE TOKEN_EXCLUDED;
|
|
|
|
|
|
|
|
/// If and where c occurs in pStr
|
|
|
|
static const sal_Unicode* StrChr( const sal_Unicode* pStr, sal_Unicode c );
|
|
|
|
|
2002-08-05 10:22:55 -05:00
|
|
|
|
2002-03-26 06:36:40 -06:00
|
|
|
com::sun::star::uno::Reference < com::sun::star::lang::XMultiServiceFactory > xMSF;
|
|
|
|
|
|
|
|
/// used for parser only
|
|
|
|
com::sun::star::lang::Locale aParserLocale;
|
|
|
|
com::sun::star::uno::Reference < XLocaleData > xLocaleData;
|
2003-04-24 05:02:43 -05:00
|
|
|
com::sun::star::uno::Reference < com::sun::star::i18n::XNativeNumberSupplier > xNatNumSup;
|
2002-03-26 06:36:40 -06:00
|
|
|
rtl::OUString aStartChars;
|
|
|
|
rtl::OUString aContChars;
|
|
|
|
UPT_FLAG_TYPE* pTable;
|
|
|
|
UPT_FLAG_TYPE* pStart;
|
|
|
|
UPT_FLAG_TYPE* pCont;
|
|
|
|
sal_Int32 nStartTypes;
|
|
|
|
sal_Int32 nContTypes;
|
|
|
|
ScanState eState;
|
|
|
|
sal_Unicode cGroupSep;
|
|
|
|
sal_Unicode cDecimalSep;
|
|
|
|
|
|
|
|
/// Get corresponding KParseTokens flag for a character
|
2002-11-05 16:41:29 -06:00
|
|
|
sal_Int32 getParseTokensType( const sal_Unicode* aStr, sal_Int32 nPos );
|
2002-03-26 06:36:40 -06:00
|
|
|
|
|
|
|
/// Access parser table flags.
|
2002-11-05 16:41:29 -06:00
|
|
|
UPT_FLAG_TYPE getFlags( const sal_Unicode* aStr, sal_Int32 nPos );
|
2002-03-26 06:36:40 -06:00
|
|
|
|
|
|
|
/// Access parser flags via International and special definitions.
|
2002-11-05 16:41:29 -06:00
|
|
|
UPT_FLAG_TYPE getFlagsExtended( const sal_Unicode* aStr, sal_Int32 nPos );
|
2002-03-26 06:36:40 -06:00
|
|
|
|
|
|
|
/// Access parser table flags for user defined start characters.
|
|
|
|
UPT_FLAG_TYPE getStartCharsFlags( sal_Unicode c );
|
|
|
|
|
|
|
|
/// Access parser table flags for user defined continuation characters.
|
|
|
|
UPT_FLAG_TYPE getContCharsFlags( sal_Unicode c );
|
|
|
|
|
|
|
|
/// Setup parser table. Calls initParserTable() only if needed.
|
|
|
|
void setupParserTable( const com::sun::star::lang::Locale& rLocale, sal_Int32 startCharTokenType,
|
|
|
|
const rtl::OUString& userDefinedCharactersStart, sal_Int32 contCharTokenType,
|
|
|
|
const rtl::OUString& userDefinedCharactersCont );
|
|
|
|
|
|
|
|
/// Init parser table.
|
|
|
|
void initParserTable( const com::sun::star::lang::Locale& rLocale, sal_Int32 startCharTokenType,
|
|
|
|
const rtl::OUString& userDefinedCharactersStart, sal_Int32 contCharTokenType,
|
|
|
|
const rtl::OUString& userDefinedCharactersCont );
|
|
|
|
|
|
|
|
/// Destroy parser table.
|
|
|
|
void destroyParserTable();
|
|
|
|
|
|
|
|
/// Parse a text.
|
|
|
|
void parseText( ParseResult& r, const rtl::OUString& rText, sal_Int32 nPos,
|
|
|
|
sal_Int32 nTokenType = 0xffffffff );
|
|
|
|
|
|
|
|
/// Setup International class, new'ed only if different from existing.
|
|
|
|
sal_Bool setupInternational( const com::sun::star::lang::Locale& rLocale );
|
|
|
|
|
|
|
|
/// Implementation of getCharacterType() for one single character
|
2007-07-26 03:07:35 -05:00
|
|
|
sal_Int32 SAL_CALL getCharType( const rtl::OUString& Text, sal_Int32 *nPos, sal_Int32 increment);
|
2002-03-26 06:36:40 -06:00
|
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
} } } }
|
|
|
|
|
|
|
|
#endif
|
2010-10-14 01:27:31 -05:00
|
|
|
|
|
|
|
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|