xref: /AOO41X/main/idl/inc/lex.hxx (revision cdf0e10c4e3984b49a9502b011690b615761d4a3)
1*cdf0e10cSrcweir /*************************************************************************
2*cdf0e10cSrcweir  *
3*cdf0e10cSrcweir  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4*cdf0e10cSrcweir  *
5*cdf0e10cSrcweir  * Copyright 2000, 2010 Oracle and/or its affiliates.
6*cdf0e10cSrcweir  *
7*cdf0e10cSrcweir  * OpenOffice.org - a multi-platform office productivity suite
8*cdf0e10cSrcweir  *
9*cdf0e10cSrcweir  * This file is part of OpenOffice.org.
10*cdf0e10cSrcweir  *
11*cdf0e10cSrcweir  * OpenOffice.org is free software: you can redistribute it and/or modify
12*cdf0e10cSrcweir  * it under the terms of the GNU Lesser General Public License version 3
13*cdf0e10cSrcweir  * only, as published by the Free Software Foundation.
14*cdf0e10cSrcweir  *
15*cdf0e10cSrcweir  * OpenOffice.org is distributed in the hope that it will be useful,
16*cdf0e10cSrcweir  * but WITHOUT ANY WARRANTY; without even the implied warranty of
17*cdf0e10cSrcweir  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18*cdf0e10cSrcweir  * GNU Lesser General Public License version 3 for more details
19*cdf0e10cSrcweir  * (a copy is included in the LICENSE file that accompanied this code).
20*cdf0e10cSrcweir  *
21*cdf0e10cSrcweir  * You should have received a copy of the GNU Lesser General Public License
22*cdf0e10cSrcweir  * version 3 along with OpenOffice.org.  If not, see
23*cdf0e10cSrcweir  * <http://www.openoffice.org/license.html>
24*cdf0e10cSrcweir  * for a copy of the LGPLv3 License.
25*cdf0e10cSrcweir  *
26*cdf0e10cSrcweir  ************************************************************************/
27*cdf0e10cSrcweir 
28*cdf0e10cSrcweir #ifndef _LEX_HXX
29*cdf0e10cSrcweir #define _LEX_HXX
30*cdf0e10cSrcweir 
31*cdf0e10cSrcweir #include <hash.hxx>
32*cdf0e10cSrcweir #include <tools/gen.hxx>
33*cdf0e10cSrcweir #include <tools/stream.hxx>
34*cdf0e10cSrcweir 
35*cdf0e10cSrcweir /******************** enum ***********************************************/
36*cdf0e10cSrcweir enum SVTOKEN_ENUM { SVTOKEN_EMPTY,      SVTOKEN_COMMENT,
37*cdf0e10cSrcweir                     SVTOKEN_INTEGER,    SVTOKEN_STRING,
38*cdf0e10cSrcweir                     SVTOKEN_BOOL,       SVTOKEN_IDENTIFIER,
39*cdf0e10cSrcweir                     SVTOKEN_CHAR,       SVTOKEN_RTTIBASE,
40*cdf0e10cSrcweir                     SVTOKEN_EOF,		SVTOKEN_HASHID };
41*cdf0e10cSrcweir 
42*cdf0e10cSrcweir /******************** class SvToken **************************************/
43*cdf0e10cSrcweir class BigInt;
44*cdf0e10cSrcweir class SvToken
45*cdf0e10cSrcweir {
46*cdf0e10cSrcweir friend class SvTokenStream;
47*cdf0e10cSrcweir     sal_uLong               	nLine, nColumn;
48*cdf0e10cSrcweir     SVTOKEN_ENUM        	nType;
49*cdf0e10cSrcweir     ByteString              	aString;
50*cdf0e10cSrcweir     union
51*cdf0e10cSrcweir 	{
52*cdf0e10cSrcweir         sal_uLong           	nLong;
53*cdf0e10cSrcweir         sal_Bool            	bBool;
54*cdf0e10cSrcweir         char            	cChar;
55*cdf0e10cSrcweir //	    SvRttiBase *    	pComplexObj;
56*cdf0e10cSrcweir 	    SvStringHashEntry *	pHash;
57*cdf0e10cSrcweir     };
58*cdf0e10cSrcweir public:
59*cdf0e10cSrcweir             SvToken();
60*cdf0e10cSrcweir             SvToken( const SvToken & rObj );
61*cdf0e10cSrcweir             SvToken( sal_uLong n );
62*cdf0e10cSrcweir             SvToken( SVTOKEN_ENUM nTypeP, sal_Bool b );
63*cdf0e10cSrcweir             SvToken( char c );
64*cdf0e10cSrcweir             SvToken( SVTOKEN_ENUM nTypeP, const ByteString & rStr );
65*cdf0e10cSrcweir //            SvToken( SvRttiBase * pComplexObj );
66*cdf0e10cSrcweir             SvToken( SVTOKEN_ENUM nTypeP );
67*cdf0e10cSrcweir 
68*cdf0e10cSrcweir     SvToken & operator = ( const SvToken & rObj );
69*cdf0e10cSrcweir 
70*cdf0e10cSrcweir     ByteString          GetTokenAsString() const;
71*cdf0e10cSrcweir     SVTOKEN_ENUM    GetType() const { return nType; }
72*cdf0e10cSrcweir 
73*cdf0e10cSrcweir     void        SetLine( sal_uLong nLineP )     { nLine = nLineP;       }
74*cdf0e10cSrcweir     sal_uLong       GetLine() const             { return nLine;         }
75*cdf0e10cSrcweir 
76*cdf0e10cSrcweir     void        SetColumn( sal_uLong nColumnP ) { nColumn = nColumnP;   }
77*cdf0e10cSrcweir     sal_uLong       GetColumn() const           { return nColumn;       }
78*cdf0e10cSrcweir 
79*cdf0e10cSrcweir     sal_Bool        IsEmpty() const     { return nType == SVTOKEN_EMPTY; }
80*cdf0e10cSrcweir     sal_Bool        IsComment() const   { return nType == SVTOKEN_COMMENT; }
81*cdf0e10cSrcweir     sal_Bool        IsInteger() const   { return nType == SVTOKEN_INTEGER; }
82*cdf0e10cSrcweir     sal_Bool        IsString() const    { return nType == SVTOKEN_STRING; }
83*cdf0e10cSrcweir     sal_Bool        IsBool() const      { return nType == SVTOKEN_BOOL; }
84*cdf0e10cSrcweir     sal_Bool        IsIdentifierHash() const
85*cdf0e10cSrcweir                 { return nType == SVTOKEN_HASHID; }
86*cdf0e10cSrcweir     sal_Bool        IsIdentifier() const
87*cdf0e10cSrcweir 				{
88*cdf0e10cSrcweir 					return nType == SVTOKEN_IDENTIFIER
89*cdf0e10cSrcweir 							|| nType == SVTOKEN_HASHID;
90*cdf0e10cSrcweir 				}
91*cdf0e10cSrcweir     sal_Bool        IsChar() const      { return nType == SVTOKEN_CHAR; }
92*cdf0e10cSrcweir     sal_Bool        IsRttiBase() const  { return nType == SVTOKEN_RTTIBASE; }
93*cdf0e10cSrcweir     sal_Bool        IsEof() const       { return nType == SVTOKEN_EOF; }
94*cdf0e10cSrcweir 
95*cdf0e10cSrcweir     const ByteString & GetString() const
96*cdf0e10cSrcweir 				{
97*cdf0e10cSrcweir 					return IsIdentifierHash()
98*cdf0e10cSrcweir 						? pHash->GetName()
99*cdf0e10cSrcweir 						: aString;
100*cdf0e10cSrcweir 				}
101*cdf0e10cSrcweir     sal_uLong       GetNumber() const       { return nLong;         }
102*cdf0e10cSrcweir     sal_Bool        GetBool() const         { return bBool;         }
103*cdf0e10cSrcweir     char        GetChar() const         { return cChar;         }
104*cdf0e10cSrcweir //    SvRttiBase *GetObject() const       { return pComplexObj;   }
105*cdf0e10cSrcweir 
106*cdf0e10cSrcweir     void        SetHash( SvStringHashEntry * pHashP )
107*cdf0e10cSrcweir 				{ pHash = pHashP; nType = SVTOKEN_HASHID; }
108*cdf0e10cSrcweir     sal_Bool        HasHash() const
109*cdf0e10cSrcweir                 { return nType == SVTOKEN_HASHID; }
110*cdf0e10cSrcweir     SvStringHashEntry * GetHash() const { return pHash; }
111*cdf0e10cSrcweir     sal_Bool        Is( SvStringHashEntry * pEntry ) const
112*cdf0e10cSrcweir                 { return IsIdentifierHash() && pHash == pEntry; }
113*cdf0e10cSrcweir };
114*cdf0e10cSrcweir 
115*cdf0e10cSrcweir inline SvToken::SvToken()
116*cdf0e10cSrcweir     : nType( SVTOKEN_EMPTY ) {}
117*cdf0e10cSrcweir 
118*cdf0e10cSrcweir inline SvToken::SvToken( sal_uLong n )
119*cdf0e10cSrcweir     : nType( SVTOKEN_INTEGER ), nLong( n ) {}
120*cdf0e10cSrcweir 
121*cdf0e10cSrcweir inline SvToken::SvToken( SVTOKEN_ENUM nTypeP, sal_Bool b )
122*cdf0e10cSrcweir     : nType( nTypeP ), bBool( b ) {}
123*cdf0e10cSrcweir 
124*cdf0e10cSrcweir inline SvToken::SvToken( char c )
125*cdf0e10cSrcweir     : nType( SVTOKEN_CHAR ), cChar( c ) {}
126*cdf0e10cSrcweir 
127*cdf0e10cSrcweir inline SvToken::SvToken( SVTOKEN_ENUM nTypeP, const ByteString & rStr )
128*cdf0e10cSrcweir     : nType( nTypeP ), aString( rStr ) {}
129*cdf0e10cSrcweir 
130*cdf0e10cSrcweir /*
131*cdf0e10cSrcweir inline SvToken::SvToken( SvRttiBase * pObj )
132*cdf0e10cSrcweir     : nType( SVTOKEN_RTTIBASE ), pComplexObj( pObj )
133*cdf0e10cSrcweir 		{ pObj->AddRef(); }
134*cdf0e10cSrcweir */
135*cdf0e10cSrcweir 
136*cdf0e10cSrcweir inline SvToken::SvToken( SVTOKEN_ENUM nTypeP )
137*cdf0e10cSrcweir : nType( nTypeP ) {}
138*cdf0e10cSrcweir 
139*cdf0e10cSrcweir DECLARE_LIST( SvTokenList, SvToken * )
140*cdf0e10cSrcweir 
141*cdf0e10cSrcweir /******************** class SvTokenStream ********************************/
142*cdf0e10cSrcweir class SvTokenStream
143*cdf0e10cSrcweir {
144*cdf0e10cSrcweir     sal_uLong       nLine, nColumn;
145*cdf0e10cSrcweir     int			nBufPos;
146*cdf0e10cSrcweir     int         c;          // naechstes Zeichen
147*cdf0e10cSrcweir     CharSet     nCharSet;
148*cdf0e10cSrcweir     char *      pCharTab;   // Zeiger auf die Konverierungstabelle
149*cdf0e10cSrcweir     sal_uInt16      nTabSize;   // Tabulator Laenge
150*cdf0e10cSrcweir 	ByteString		aStrTrue;
151*cdf0e10cSrcweir 	ByteString		aStrFalse;
152*cdf0e10cSrcweir 	sal_uLong		nMaxPos;
153*cdf0e10cSrcweir 
154*cdf0e10cSrcweir     SvFileStream *  pInStream;
155*cdf0e10cSrcweir     SvStream &      rInStream;
156*cdf0e10cSrcweir     String          aFileName;
157*cdf0e10cSrcweir     SvTokenList     aTokList;
158*cdf0e10cSrcweir 	SvToken *		pCurToken;
159*cdf0e10cSrcweir 
160*cdf0e10cSrcweir     void        InitCtor();
161*cdf0e10cSrcweir 
162*cdf0e10cSrcweir     ByteString      	aBufStr;
163*cdf0e10cSrcweir     int         	GetNextChar();
164*cdf0e10cSrcweir     int         	GetFastNextChar()
165*cdf0e10cSrcweir 					{
166*cdf0e10cSrcweir                         return aBufStr.GetChar((sal_uInt16)nBufPos++);
167*cdf0e10cSrcweir 					}
168*cdf0e10cSrcweir 
169*cdf0e10cSrcweir 	void			FillTokenList();
170*cdf0e10cSrcweir     sal_uLong       	GetNumber();
171*cdf0e10cSrcweir     sal_Bool        	MakeToken( SvToken & );
172*cdf0e10cSrcweir 	sal_Bool			IsEof() const { return rInStream.IsEof(); }
173*cdf0e10cSrcweir 	void			SetMax()
174*cdf0e10cSrcweir 					{
175*cdf0e10cSrcweir 						sal_uLong n = Tell();
176*cdf0e10cSrcweir 						if( n > nMaxPos )
177*cdf0e10cSrcweir 							nMaxPos = n;
178*cdf0e10cSrcweir 					}
179*cdf0e10cSrcweir 	void			CalcColumn()
180*cdf0e10cSrcweir 					{
181*cdf0e10cSrcweir 						// wenn Zeilenende berechnung sparen
182*cdf0e10cSrcweir 						if( 0 != c )
183*cdf0e10cSrcweir 						{
184*cdf0e10cSrcweir 							sal_uInt16 n = 0;
185*cdf0e10cSrcweir 							nColumn = 0;
186*cdf0e10cSrcweir 							while( n < nBufPos )
187*cdf0e10cSrcweir                                 nColumn += aBufStr.GetChar(n++) == '\t' ? nTabSize : 1;
188*cdf0e10cSrcweir 						}
189*cdf0e10cSrcweir 					}
190*cdf0e10cSrcweir public:
191*cdf0e10cSrcweir                     SvTokenStream( const String & rFileName );
192*cdf0e10cSrcweir                     SvTokenStream( SvStream & rInStream, const String & rFileName );
193*cdf0e10cSrcweir                     ~SvTokenStream();
194*cdf0e10cSrcweir 
195*cdf0e10cSrcweir     const String &  GetFileName() const { return aFileName; }
196*cdf0e10cSrcweir     SvStream &      GetStream() { return rInStream; }
197*cdf0e10cSrcweir 
198*cdf0e10cSrcweir     void            SetCharSet( CharSet nSet );
199*cdf0e10cSrcweir     CharSet         GetCharSet() const { return nCharSet; }
200*cdf0e10cSrcweir 
201*cdf0e10cSrcweir     void            SetTabSize( sal_uInt16 nTabSizeP )
202*cdf0e10cSrcweir                     { nTabSize = nTabSizeP; }
203*cdf0e10cSrcweir     sal_uInt16          GetTabSize() const { return nTabSize; }
204*cdf0e10cSrcweir 
205*cdf0e10cSrcweir     SvToken *       GetToken_PrevAll()
206*cdf0e10cSrcweir 					{
207*cdf0e10cSrcweir 					    SvToken * pRetToken = pCurToken;
208*cdf0e10cSrcweir 					    if( NULL == (pCurToken = aTokList.Prev()) )
209*cdf0e10cSrcweir 							// Current Zeiger nie Null
210*cdf0e10cSrcweir 							pCurToken = pRetToken;
211*cdf0e10cSrcweir 
212*cdf0e10cSrcweir 					    return pRetToken;
213*cdf0e10cSrcweir 					}
214*cdf0e10cSrcweir     SvToken *       GetToken_NextAll()
215*cdf0e10cSrcweir 					{
216*cdf0e10cSrcweir 					    SvToken * pRetToken = pCurToken;
217*cdf0e10cSrcweir 					    if( NULL == (pCurToken = aTokList.Next()) )
218*cdf0e10cSrcweir 							// Current Zeiger nie Null
219*cdf0e10cSrcweir 							pCurToken = pRetToken;
220*cdf0e10cSrcweir 						SetMax();
221*cdf0e10cSrcweir 					    return pRetToken;
222*cdf0e10cSrcweir 					}
223*cdf0e10cSrcweir     SvToken *       GetToken_Next()
224*cdf0e10cSrcweir 					{
225*cdf0e10cSrcweir 						// Kommentare werden initial entfernt
226*cdf0e10cSrcweir 						return GetToken_NextAll();
227*cdf0e10cSrcweir 					}
228*cdf0e10cSrcweir     SvToken *       GetToken() const { return pCurToken; }
229*cdf0e10cSrcweir     sal_Bool            Read( char cChar )
230*cdf0e10cSrcweir                     {
231*cdf0e10cSrcweir 					    if( pCurToken->IsChar()
232*cdf0e10cSrcweir 						  && cChar == pCurToken->GetChar() )
233*cdf0e10cSrcweir 						{
234*cdf0e10cSrcweir 							GetToken_Next();
235*cdf0e10cSrcweir 							return sal_True;
236*cdf0e10cSrcweir 						}
237*cdf0e10cSrcweir 						else
238*cdf0e10cSrcweir 							return sal_False;
239*cdf0e10cSrcweir 					}
240*cdf0e10cSrcweir     void            ReadDelemiter()
241*cdf0e10cSrcweir                     {
242*cdf0e10cSrcweir 					    if( pCurToken->IsChar()
243*cdf0e10cSrcweir 						  && (';' == pCurToken->GetChar()
244*cdf0e10cSrcweir 						  	  || ',' == pCurToken->GetChar()) )
245*cdf0e10cSrcweir 						{
246*cdf0e10cSrcweir 							GetToken_Next();
247*cdf0e10cSrcweir 						}
248*cdf0e10cSrcweir 					}
249*cdf0e10cSrcweir 
250*cdf0e10cSrcweir     sal_uInt32          Tell() const
251*cdf0e10cSrcweir                     { return aTokList.GetCurPos(); }
252*cdf0e10cSrcweir     void            Seek( sal_uInt32 nPos )
253*cdf0e10cSrcweir                     {
254*cdf0e10cSrcweir                         pCurToken = aTokList.Seek( nPos );
255*cdf0e10cSrcweir 						SetMax();
256*cdf0e10cSrcweir                     }
257*cdf0e10cSrcweir     void            SeekRel( sal_Int32 nRelPos )
258*cdf0e10cSrcweir                     {
259*cdf0e10cSrcweir                         pCurToken = aTokList.Seek( Tell() + nRelPos );
260*cdf0e10cSrcweir 						SetMax();
261*cdf0e10cSrcweir                     }
262*cdf0e10cSrcweir     void            SeekEnd()
263*cdf0e10cSrcweir                     {
264*cdf0e10cSrcweir                         pCurToken = aTokList.Seek( nMaxPos );
265*cdf0e10cSrcweir                     }
266*cdf0e10cSrcweir };
267*cdf0e10cSrcweir 
268*cdf0e10cSrcweir 
269*cdf0e10cSrcweir 
270*cdf0e10cSrcweir #endif // _LEX_HXX
271*cdf0e10cSrcweir 
272