1*cdf0e10cSrcweir /************************************************************************* 2*cdf0e10cSrcweir * 3*cdf0e10cSrcweir * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4*cdf0e10cSrcweir * 5*cdf0e10cSrcweir * Copyright 2000, 2010 Oracle and/or its affiliates. 6*cdf0e10cSrcweir * 7*cdf0e10cSrcweir * OpenOffice.org - a multi-platform office productivity suite 8*cdf0e10cSrcweir * 9*cdf0e10cSrcweir * This file is part of OpenOffice.org. 10*cdf0e10cSrcweir * 11*cdf0e10cSrcweir * OpenOffice.org is free software: you can redistribute it and/or modify 12*cdf0e10cSrcweir * it under the terms of the GNU Lesser General Public License version 3 13*cdf0e10cSrcweir * only, as published by the Free Software Foundation. 14*cdf0e10cSrcweir * 15*cdf0e10cSrcweir * OpenOffice.org is distributed in the hope that it will be useful, 16*cdf0e10cSrcweir * but WITHOUT ANY WARRANTY; without even the implied warranty of 17*cdf0e10cSrcweir * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 18*cdf0e10cSrcweir * GNU Lesser General Public License version 3 for more details 19*cdf0e10cSrcweir * (a copy is included in the LICENSE file that accompanied this code). 20*cdf0e10cSrcweir * 21*cdf0e10cSrcweir * You should have received a copy of the GNU Lesser General Public License 22*cdf0e10cSrcweir * version 3 along with OpenOffice.org. If not, see 23*cdf0e10cSrcweir * <http://www.openoffice.org/license.html> 24*cdf0e10cSrcweir * for a copy of the LGPLv3 License. 25*cdf0e10cSrcweir * 26*cdf0e10cSrcweir ************************************************************************/ 27*cdf0e10cSrcweir 28*cdf0e10cSrcweir #ifndef _LEX_HXX 29*cdf0e10cSrcweir #define _LEX_HXX 30*cdf0e10cSrcweir 31*cdf0e10cSrcweir #include <hash.hxx> 32*cdf0e10cSrcweir #include <tools/gen.hxx> 33*cdf0e10cSrcweir #include <tools/stream.hxx> 34*cdf0e10cSrcweir 35*cdf0e10cSrcweir /******************** enum ***********************************************/ 36*cdf0e10cSrcweir enum SVTOKEN_ENUM { SVTOKEN_EMPTY, SVTOKEN_COMMENT, 37*cdf0e10cSrcweir SVTOKEN_INTEGER, SVTOKEN_STRING, 38*cdf0e10cSrcweir SVTOKEN_BOOL, SVTOKEN_IDENTIFIER, 39*cdf0e10cSrcweir SVTOKEN_CHAR, SVTOKEN_RTTIBASE, 40*cdf0e10cSrcweir SVTOKEN_EOF, SVTOKEN_HASHID }; 41*cdf0e10cSrcweir 42*cdf0e10cSrcweir /******************** class SvToken **************************************/ 43*cdf0e10cSrcweir class BigInt; 44*cdf0e10cSrcweir class SvToken 45*cdf0e10cSrcweir { 46*cdf0e10cSrcweir friend class SvTokenStream; 47*cdf0e10cSrcweir sal_uLong nLine, nColumn; 48*cdf0e10cSrcweir SVTOKEN_ENUM nType; 49*cdf0e10cSrcweir ByteString aString; 50*cdf0e10cSrcweir union 51*cdf0e10cSrcweir { 52*cdf0e10cSrcweir sal_uLong nLong; 53*cdf0e10cSrcweir sal_Bool bBool; 54*cdf0e10cSrcweir char cChar; 55*cdf0e10cSrcweir // SvRttiBase * pComplexObj; 56*cdf0e10cSrcweir SvStringHashEntry * pHash; 57*cdf0e10cSrcweir }; 58*cdf0e10cSrcweir public: 59*cdf0e10cSrcweir SvToken(); 60*cdf0e10cSrcweir SvToken( const SvToken & rObj ); 61*cdf0e10cSrcweir SvToken( sal_uLong n ); 62*cdf0e10cSrcweir SvToken( SVTOKEN_ENUM nTypeP, sal_Bool b ); 63*cdf0e10cSrcweir SvToken( char c ); 64*cdf0e10cSrcweir SvToken( SVTOKEN_ENUM nTypeP, const ByteString & rStr ); 65*cdf0e10cSrcweir // SvToken( SvRttiBase * pComplexObj ); 66*cdf0e10cSrcweir SvToken( SVTOKEN_ENUM nTypeP ); 67*cdf0e10cSrcweir 68*cdf0e10cSrcweir SvToken & operator = ( const SvToken & rObj ); 69*cdf0e10cSrcweir 70*cdf0e10cSrcweir ByteString GetTokenAsString() const; 71*cdf0e10cSrcweir SVTOKEN_ENUM GetType() const { return nType; } 72*cdf0e10cSrcweir 73*cdf0e10cSrcweir void SetLine( sal_uLong nLineP ) { nLine = nLineP; } 74*cdf0e10cSrcweir sal_uLong GetLine() const { return nLine; } 75*cdf0e10cSrcweir 76*cdf0e10cSrcweir void SetColumn( sal_uLong nColumnP ) { nColumn = nColumnP; } 77*cdf0e10cSrcweir sal_uLong GetColumn() const { return nColumn; } 78*cdf0e10cSrcweir 79*cdf0e10cSrcweir sal_Bool IsEmpty() const { return nType == SVTOKEN_EMPTY; } 80*cdf0e10cSrcweir sal_Bool IsComment() const { return nType == SVTOKEN_COMMENT; } 81*cdf0e10cSrcweir sal_Bool IsInteger() const { return nType == SVTOKEN_INTEGER; } 82*cdf0e10cSrcweir sal_Bool IsString() const { return nType == SVTOKEN_STRING; } 83*cdf0e10cSrcweir sal_Bool IsBool() const { return nType == SVTOKEN_BOOL; } 84*cdf0e10cSrcweir sal_Bool IsIdentifierHash() const 85*cdf0e10cSrcweir { return nType == SVTOKEN_HASHID; } 86*cdf0e10cSrcweir sal_Bool IsIdentifier() const 87*cdf0e10cSrcweir { 88*cdf0e10cSrcweir return nType == SVTOKEN_IDENTIFIER 89*cdf0e10cSrcweir || nType == SVTOKEN_HASHID; 90*cdf0e10cSrcweir } 91*cdf0e10cSrcweir sal_Bool IsChar() const { return nType == SVTOKEN_CHAR; } 92*cdf0e10cSrcweir sal_Bool IsRttiBase() const { return nType == SVTOKEN_RTTIBASE; } 93*cdf0e10cSrcweir sal_Bool IsEof() const { return nType == SVTOKEN_EOF; } 94*cdf0e10cSrcweir 95*cdf0e10cSrcweir const ByteString & GetString() const 96*cdf0e10cSrcweir { 97*cdf0e10cSrcweir return IsIdentifierHash() 98*cdf0e10cSrcweir ? pHash->GetName() 99*cdf0e10cSrcweir : aString; 100*cdf0e10cSrcweir } 101*cdf0e10cSrcweir sal_uLong GetNumber() const { return nLong; } 102*cdf0e10cSrcweir sal_Bool GetBool() const { return bBool; } 103*cdf0e10cSrcweir char GetChar() const { return cChar; } 104*cdf0e10cSrcweir // SvRttiBase *GetObject() const { return pComplexObj; } 105*cdf0e10cSrcweir 106*cdf0e10cSrcweir void SetHash( SvStringHashEntry * pHashP ) 107*cdf0e10cSrcweir { pHash = pHashP; nType = SVTOKEN_HASHID; } 108*cdf0e10cSrcweir sal_Bool HasHash() const 109*cdf0e10cSrcweir { return nType == SVTOKEN_HASHID; } 110*cdf0e10cSrcweir SvStringHashEntry * GetHash() const { return pHash; } 111*cdf0e10cSrcweir sal_Bool Is( SvStringHashEntry * pEntry ) const 112*cdf0e10cSrcweir { return IsIdentifierHash() && pHash == pEntry; } 113*cdf0e10cSrcweir }; 114*cdf0e10cSrcweir 115*cdf0e10cSrcweir inline SvToken::SvToken() 116*cdf0e10cSrcweir : nType( SVTOKEN_EMPTY ) {} 117*cdf0e10cSrcweir 118*cdf0e10cSrcweir inline SvToken::SvToken( sal_uLong n ) 119*cdf0e10cSrcweir : nType( SVTOKEN_INTEGER ), nLong( n ) {} 120*cdf0e10cSrcweir 121*cdf0e10cSrcweir inline SvToken::SvToken( SVTOKEN_ENUM nTypeP, sal_Bool b ) 122*cdf0e10cSrcweir : nType( nTypeP ), bBool( b ) {} 123*cdf0e10cSrcweir 124*cdf0e10cSrcweir inline SvToken::SvToken( char c ) 125*cdf0e10cSrcweir : nType( SVTOKEN_CHAR ), cChar( c ) {} 126*cdf0e10cSrcweir 127*cdf0e10cSrcweir inline SvToken::SvToken( SVTOKEN_ENUM nTypeP, const ByteString & rStr ) 128*cdf0e10cSrcweir : nType( nTypeP ), aString( rStr ) {} 129*cdf0e10cSrcweir 130*cdf0e10cSrcweir /* 131*cdf0e10cSrcweir inline SvToken::SvToken( SvRttiBase * pObj ) 132*cdf0e10cSrcweir : nType( SVTOKEN_RTTIBASE ), pComplexObj( pObj ) 133*cdf0e10cSrcweir { pObj->AddRef(); } 134*cdf0e10cSrcweir */ 135*cdf0e10cSrcweir 136*cdf0e10cSrcweir inline SvToken::SvToken( SVTOKEN_ENUM nTypeP ) 137*cdf0e10cSrcweir : nType( nTypeP ) {} 138*cdf0e10cSrcweir 139*cdf0e10cSrcweir DECLARE_LIST( SvTokenList, SvToken * ) 140*cdf0e10cSrcweir 141*cdf0e10cSrcweir /******************** class SvTokenStream ********************************/ 142*cdf0e10cSrcweir class SvTokenStream 143*cdf0e10cSrcweir { 144*cdf0e10cSrcweir sal_uLong nLine, nColumn; 145*cdf0e10cSrcweir int nBufPos; 146*cdf0e10cSrcweir int c; // naechstes Zeichen 147*cdf0e10cSrcweir CharSet nCharSet; 148*cdf0e10cSrcweir char * pCharTab; // Zeiger auf die Konverierungstabelle 149*cdf0e10cSrcweir sal_uInt16 nTabSize; // Tabulator Laenge 150*cdf0e10cSrcweir ByteString aStrTrue; 151*cdf0e10cSrcweir ByteString aStrFalse; 152*cdf0e10cSrcweir sal_uLong nMaxPos; 153*cdf0e10cSrcweir 154*cdf0e10cSrcweir SvFileStream * pInStream; 155*cdf0e10cSrcweir SvStream & rInStream; 156*cdf0e10cSrcweir String aFileName; 157*cdf0e10cSrcweir SvTokenList aTokList; 158*cdf0e10cSrcweir SvToken * pCurToken; 159*cdf0e10cSrcweir 160*cdf0e10cSrcweir void InitCtor(); 161*cdf0e10cSrcweir 162*cdf0e10cSrcweir ByteString aBufStr; 163*cdf0e10cSrcweir int GetNextChar(); 164*cdf0e10cSrcweir int GetFastNextChar() 165*cdf0e10cSrcweir { 166*cdf0e10cSrcweir return aBufStr.GetChar((sal_uInt16)nBufPos++); 167*cdf0e10cSrcweir } 168*cdf0e10cSrcweir 169*cdf0e10cSrcweir void FillTokenList(); 170*cdf0e10cSrcweir sal_uLong GetNumber(); 171*cdf0e10cSrcweir sal_Bool MakeToken( SvToken & ); 172*cdf0e10cSrcweir sal_Bool IsEof() const { return rInStream.IsEof(); } 173*cdf0e10cSrcweir void SetMax() 174*cdf0e10cSrcweir { 175*cdf0e10cSrcweir sal_uLong n = Tell(); 176*cdf0e10cSrcweir if( n > nMaxPos ) 177*cdf0e10cSrcweir nMaxPos = n; 178*cdf0e10cSrcweir } 179*cdf0e10cSrcweir void CalcColumn() 180*cdf0e10cSrcweir { 181*cdf0e10cSrcweir // wenn Zeilenende berechnung sparen 182*cdf0e10cSrcweir if( 0 != c ) 183*cdf0e10cSrcweir { 184*cdf0e10cSrcweir sal_uInt16 n = 0; 185*cdf0e10cSrcweir nColumn = 0; 186*cdf0e10cSrcweir while( n < nBufPos ) 187*cdf0e10cSrcweir nColumn += aBufStr.GetChar(n++) == '\t' ? nTabSize : 1; 188*cdf0e10cSrcweir } 189*cdf0e10cSrcweir } 190*cdf0e10cSrcweir public: 191*cdf0e10cSrcweir SvTokenStream( const String & rFileName ); 192*cdf0e10cSrcweir SvTokenStream( SvStream & rInStream, const String & rFileName ); 193*cdf0e10cSrcweir ~SvTokenStream(); 194*cdf0e10cSrcweir 195*cdf0e10cSrcweir const String & GetFileName() const { return aFileName; } 196*cdf0e10cSrcweir SvStream & GetStream() { return rInStream; } 197*cdf0e10cSrcweir 198*cdf0e10cSrcweir void SetCharSet( CharSet nSet ); 199*cdf0e10cSrcweir CharSet GetCharSet() const { return nCharSet; } 200*cdf0e10cSrcweir 201*cdf0e10cSrcweir void SetTabSize( sal_uInt16 nTabSizeP ) 202*cdf0e10cSrcweir { nTabSize = nTabSizeP; } 203*cdf0e10cSrcweir sal_uInt16 GetTabSize() const { return nTabSize; } 204*cdf0e10cSrcweir 205*cdf0e10cSrcweir SvToken * GetToken_PrevAll() 206*cdf0e10cSrcweir { 207*cdf0e10cSrcweir SvToken * pRetToken = pCurToken; 208*cdf0e10cSrcweir if( NULL == (pCurToken = aTokList.Prev()) ) 209*cdf0e10cSrcweir // Current Zeiger nie Null 210*cdf0e10cSrcweir pCurToken = pRetToken; 211*cdf0e10cSrcweir 212*cdf0e10cSrcweir return pRetToken; 213*cdf0e10cSrcweir } 214*cdf0e10cSrcweir SvToken * GetToken_NextAll() 215*cdf0e10cSrcweir { 216*cdf0e10cSrcweir SvToken * pRetToken = pCurToken; 217*cdf0e10cSrcweir if( NULL == (pCurToken = aTokList.Next()) ) 218*cdf0e10cSrcweir // Current Zeiger nie Null 219*cdf0e10cSrcweir pCurToken = pRetToken; 220*cdf0e10cSrcweir SetMax(); 221*cdf0e10cSrcweir return pRetToken; 222*cdf0e10cSrcweir } 223*cdf0e10cSrcweir SvToken * GetToken_Next() 224*cdf0e10cSrcweir { 225*cdf0e10cSrcweir // Kommentare werden initial entfernt 226*cdf0e10cSrcweir return GetToken_NextAll(); 227*cdf0e10cSrcweir } 228*cdf0e10cSrcweir SvToken * GetToken() const { return pCurToken; } 229*cdf0e10cSrcweir sal_Bool Read( char cChar ) 230*cdf0e10cSrcweir { 231*cdf0e10cSrcweir if( pCurToken->IsChar() 232*cdf0e10cSrcweir && cChar == pCurToken->GetChar() ) 233*cdf0e10cSrcweir { 234*cdf0e10cSrcweir GetToken_Next(); 235*cdf0e10cSrcweir return sal_True; 236*cdf0e10cSrcweir } 237*cdf0e10cSrcweir else 238*cdf0e10cSrcweir return sal_False; 239*cdf0e10cSrcweir } 240*cdf0e10cSrcweir void ReadDelemiter() 241*cdf0e10cSrcweir { 242*cdf0e10cSrcweir if( pCurToken->IsChar() 243*cdf0e10cSrcweir && (';' == pCurToken->GetChar() 244*cdf0e10cSrcweir || ',' == pCurToken->GetChar()) ) 245*cdf0e10cSrcweir { 246*cdf0e10cSrcweir GetToken_Next(); 247*cdf0e10cSrcweir } 248*cdf0e10cSrcweir } 249*cdf0e10cSrcweir 250*cdf0e10cSrcweir sal_uInt32 Tell() const 251*cdf0e10cSrcweir { return aTokList.GetCurPos(); } 252*cdf0e10cSrcweir void Seek( sal_uInt32 nPos ) 253*cdf0e10cSrcweir { 254*cdf0e10cSrcweir pCurToken = aTokList.Seek( nPos ); 255*cdf0e10cSrcweir SetMax(); 256*cdf0e10cSrcweir } 257*cdf0e10cSrcweir void SeekRel( sal_Int32 nRelPos ) 258*cdf0e10cSrcweir { 259*cdf0e10cSrcweir pCurToken = aTokList.Seek( Tell() + nRelPos ); 260*cdf0e10cSrcweir SetMax(); 261*cdf0e10cSrcweir } 262*cdf0e10cSrcweir void SeekEnd() 263*cdf0e10cSrcweir { 264*cdf0e10cSrcweir pCurToken = aTokList.Seek( nMaxPos ); 265*cdf0e10cSrcweir } 266*cdf0e10cSrcweir }; 267*cdf0e10cSrcweir 268*cdf0e10cSrcweir 269*cdf0e10cSrcweir 270*cdf0e10cSrcweir #endif // _LEX_HXX 271*cdf0e10cSrcweir 272