office-gobmx/starmath/inc/parse.hxx
2011-08-30 16:56:38 +02:00

306 lines
11 KiB
C++

/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*************************************************************************
*
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* Copyright 2000, 2010 Oracle and/or its affiliates.
*
* OpenOffice.org - a multi-platform office productivity suite
*
* This file is part of OpenOffice.org.
*
* OpenOffice.org is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License version 3
* only, as published by the Free Software Foundation.
*
* OpenOffice.org is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License version 3 for more details
* (a copy is included in the LICENSE file that accompanied this code).
*
* You should have received a copy of the GNU Lesser General Public License
* version 3 along with OpenOffice.org. If not, see
* <http://www.openoffice.org/license.html>
* for a copy of the LGPLv3 License.
*
************************************************************************/
#ifndef PARSE_HXX
#define PARSE_HXX
#include <vcl/svapp.hxx>
#include <tools/stack.hxx>
#include <tools/string.hxx>
#include <set>
#include <stack>
#include <list>
#include "types.hxx"
#include <vector>
class SmNode;
class SmDocShell;
//////////////////////////////////////////////////////////////////////
// TokenGroups
#define TGOPER 0x00000001
#define TGRELATION 0x00000002
#define TGSUM 0x00000004
#define TGPRODUCT 0x00000008
#define TGUNOPER 0x00000010
#define TGPOWER 0x00000020
#define TGATTRIBUT 0x00000040
#define TGALIGN 0x00000080
#define TGFUNCTION 0x00000100
#define TGBLANK 0x00000200
#define TGLBRACES 0x00000400
#define TGRBRACES 0x00000800
#define TGCOLOR 0x00001000
#define TGFONT 0x00002000
#define TGSTANDALONE 0x00004000
#define TGDISCARDED 0x00008000
#define TGLIMIT 0x00010000
#define TGFONTATTR 0x00020000
enum SmTokenType
{
/* 0*/ TEND, TLGROUP, TRGROUP, TLPARENT, TRPARENT,
/* 5*/ TLBRACKET, TRBRACKET, TPLUS, TMINUS, TMULTIPLY,
/* 10*/ TDIVIDEBY, TASSIGN, TPOUND, TSPECIAL, TSLASH,
/* 15*/ TBACKSLASH, TBLANK, TSBLANK, TRSUB, TRSUP,
/* 20*/ TCSUB, TCSUP, TLSUB, TLSUP, TGT,
/* 25*/ TLT, TAND, TOR, TINTERSECT, TUNION,
/* 30*/ TNEWLINE, TBINOM, TFROM, TTO, TINT,
/* 35*/ TSUM, TOPER, TABS, TSQRT, TFACT,
/* 40*/ TNROOT, TOVER, TTIMES, TGE, TLE,
/* 45*/ TGG, TLL, TDOTSAXIS, TDOTSLOW, TDOTSVERT,
/* 50*/ TDOTSDIAG, TDOTSUP, TDOTSDOWN, TACUTE, TBAR,
/* 55*/ TBREVE, TCHECK, TCIRCLE, TDOT, TDDOT,
/* 60*/ TDDDOT, TGRAVE, THAT, TTILDE, TVEC,
/* 65*/ TUNDERLINE, TOVERLINE, TOVERSTRIKE, TITALIC, TNITALIC,
/* 70*/ TBOLD, TNBOLD, TPHANTOM, TFONT, TSIZE,
/* 75*/ TCOLOR, TALIGNL, TALIGNC, TALIGNR, TLEFT,
/* 80*/ TRIGHT, TLANGLE, TLBRACE, TLLINE, TLDLINE,
/* 85*/ TLCEIL, TLFLOOR, TNONE, TMLINE, TRANGLE,
/* 90*/ TRBRACE, TRLINE, TRDLINE, TRCEIL, TRFLOOR,
/* 95*/ TSIN, TCOS, TTAN, TCOT, TFUNC,
/*100*/ TSTACK, TMATRIX, TMATFORM, TDPOUND, TPLACE,
/*105*/ TTEXT, TNUMBER, TCHARACTER, TIDENT, TNEQ,
/*110*/ TEQUIV, TDEF, TPROP, TSIM, TSIMEQ,
/*115*/ TAPPROX, TPARALLEL, TORTHO, TIN, TNOTIN,
/*120*/ TSUBSET, TSUBSETEQ, TSUPSET, TSUPSETEQ, TPLUSMINUS,
/*125*/ TMINUSPLUS, TOPLUS, TOMINUS, TDIV, TOTIMES,
/*130*/ TODIVIDE, TTRANSL, TTRANSR, TIINT, TIIINT,
/*135*/ TLINT, TLLINT, TLLLINT, TPROD, TCOPROD,
/*140*/ TFORALL, TEXISTS, TLIM, TNABLA, TTOWARD,
/*145*/ TSINH, TCOSH, TTANH, TCOTH, TASIN,
/*150*/ TACOS, TATAN, TLN, TLOG, TUOPER,
/*155*/ TBOPER, TBLACK, TWHITE, TRED, TGREEN,
/*160*/ TBLUE, TCYAN, TMAGENTA, TYELLOW, TFIXED,
/*165*/ TSANS, TSERIF, TPOINT, TASINH, TACOSH,
/*170*/ TATANH, TACOTH, TACOT, TEXP, TCDOT,
/*175*/ TODOT, TLESLANT, TGESLANT, TNSUBSET, TNSUPSET,
/*180*/ TNSUBSETEQ, TNSUPSETEQ, TPARTIAL, TNEG, TNI,
/*185*/ TBACKEPSILON, TALEPH, TIM, TRE, TWP,
/*190*/ TEMPTYSET, TINFINITY, TESCAPE, TLIMSUP, TLIMINF,
/*195*/ TNDIVIDES, TDRARROW, TDLARROW, TDLRARROW, TUNDERBRACE,
/*200*/ TOVERBRACE, TCIRC, TTOP, THBAR, TLAMBDABAR,
/*205*/ TLEFTARROW, TRIGHTARROW, TUPARROW, TDOWNARROW, TDIVIDES,
/*210*/ TNDIBVIDES, TSETN, TSETZ, TSETQ, TSETR,
/*215*/ TSETC, TWIDEVEC, TWIDETILDE, TWIDEHAT, TWIDESLASH,
/*220*/ TWIDEBACKSLASH, TLDBRACKET, TRDBRACKET, TNOSPACE,
/*225*/ TUNKNOWN, TDEBUG
};
struct SmToken
{
String aText; // token text
SmTokenType eType; // token info
sal_Unicode cMathChar;
// parse-help info
sal_uLong nGroup;
sal_uInt16 nLevel;
// token position
sal_uInt16 nRow;
xub_StrLen nCol;
SmToken();
SmToken(SmTokenType eTokenType,
sal_Unicode cMath,
const sal_Char* pText,
sal_uLong nTokenGroup = 0,
sal_uInt16 nTokenLevel = 0);
};
enum SmParseError
{
PE_NONE, PE_UNEXPECTED_END_OF_INPUT,
PE_UNEXPECTED_CHAR, PE_UNEXPECTED_TOKEN,
PE_FUNC_EXPECTED, PE_UNOPER_EXPECTED,
PE_BINOPER_EXPECTED, PE_SYMBOL_EXPECTED,
PE_IDENTIFIER_EXPECTED, PE_POUND_EXPECTED,
PE_COLOR_EXPECTED, PE_LGROUP_EXPECTED,
PE_RGROUP_EXPECTED, PE_LBRACE_EXPECTED,
PE_RBRACE_EXPECTED, PE_PARENT_MISMATCH,
PE_RIGHT_EXPECTED, PE_FONT_EXPECTED,
PE_SIZE_EXPECTED, PE_DOUBLE_ALIGN,
PE_DOUBLE_SUBSUPSCRIPT
};
struct SmErrorDesc
{
SmParseError Type;
SmNode *pNode;
String Text;
};
DECLARE_STACK(SmNodeStack, SmNode *)
typedef ::std::vector< SmErrorDesc* > SmErrDescList;
/**************************************************************************/
// defines possible conversions of the formula text from the format of
// one release to the one of another.
enum SmConvert
{
CONVERT_NONE,
CONVERT_40_TO_50,
CONVERT_50_TO_60,
CONVERT_60_TO_50
};
struct SmTokenTableEntry
{
const sal_Char* pIdent;
SmTokenType eType;
sal_Unicode cMathChar;
sal_uLong nGroup;
sal_uInt16 nLevel;
};
class SmParser
{
String m_aBufferString;
SmToken m_aCurToken;
SmNodeStack m_aNodeStack;
SmErrDescList m_aErrDescList;
int m_nCurError;
LanguageType m_nLang;
xub_StrLen m_nBufferIndex,
m_nTokenIndex;
sal_uInt16 m_Row,
m_nColOff;
SmConvert m_eConversion;
bool bImportSymNames,
m_bExportSymNames;
// map of used symbols (used to reduce file size by exporting only actually used symbols)
std::set< rtl::OUString > m_aUsedSymbols;
//! locale where '.' is decimal seperator!
::com::sun::star::lang::Locale m_aDotLoc;
// declare copy-constructor and assignment-operator private
SmParser(const SmParser &);
SmParser & operator = (const SmParser &);
protected:
#if OSL_DEBUG_LEVEL > 1
bool IsDelimiter( const String &rTxt, xub_StrLen nPos );
#endif
void NextToken();
xub_StrLen GetTokenIndex() const { return m_nTokenIndex; }
void Insert(const String &rText, sal_uInt16 nPos);
void Replace( sal_uInt16 nPos, sal_uInt16 nLen, const String &rText );
inline bool TokenInGroup( sal_uLong nGroup );
// grammar
void Table();
void Line();
void Expression();
void Relation();
void Sum();
void Product();
void SubSup(sal_uLong nActiveGroup);
void OpSubSup();
void Power();
void Blank();
void Term();
void Escape();
void Operator();
void Oper();
void UnOper();
void Align();
void FontAttribut();
void Attribut();
void Font();
void FontSize();
void Color();
void Brace();
void Bracebody(bool bIsLeftRight);
void Function();
void Binom();
void Stack();
void Matrix();
void Special();
void GlyphSpecial();
// end of grammar
LanguageType GetLanguage() const { return m_nLang; }
void SetLanguage( LanguageType nNewLang ) { m_nLang = nNewLang; }
void Error(SmParseError Error);
void ClearUsedSymbols() { m_aUsedSymbols.clear(); }
void AddToUsedSymbols( const String &rSymbolName ) { m_aUsedSymbols.insert( rSymbolName ); }
public:
SmParser();
/** Parse rBuffer to formula tree */
SmNode *Parse(const String &rBuffer);
/** Parse rBuffer to formula subtree that constitutes an expression */
SmNode *ParseExpression(const String &rBuffer);
const String & GetText() const { return m_aBufferString; };
SmConvert GetConversion() const { return m_eConversion; }
void SetConversion(SmConvert eConv) { m_eConversion = eConv; }
bool IsImportSymbolNames() const { return bImportSymNames; }
void SetImportSymbolNames(bool bVal) { bImportSymNames = bVal; }
bool IsExportSymbolNames() const { return m_bExportSymNames; }
void SetExportSymbolNames(bool bVal) { m_bExportSymNames = bVal; }
size_t AddError(SmParseError Type, SmNode *pNode);
const SmErrorDesc* NextError();
const SmErrorDesc* PrevError();
const SmErrorDesc* GetError(size_t i = size_t(-1) );
static const SmTokenTableEntry* GetTokenTableEntry( const String &rName );
bool IsUsedSymbol( const String &rSymbolName ) const { return m_aUsedSymbols.find( rSymbolName ) != m_aUsedSymbols.end(); }
std::set< rtl::OUString > GetUsedSymbols() const { return m_aUsedSymbols; }
};
inline bool SmParser::TokenInGroup( sal_uLong nGroup)
{
return (m_aCurToken.nGroup & nGroup) ? true : false;
}
#endif
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */