1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219
|
#ifndef INC_CharScanner_hpp__
#define INC_CharScanner_hpp__
/**
* <b>SOFTWARE RIGHTS</b>
* <p>
* ANTLR 2.6.0 MageLang Institute, 1999
* <p>
* We reserve no legal rights to the ANTLR--it is fully in the
* public domain. An individual or company may do whatever
* they wish with source code distributed with ANTLR or the
* code generated by ANTLR, including the incorporation of
* ANTLR, or its output, into commercial software.
* <p>
* We encourage users to develop software with ANTLR. However,
* we do ask that credit is given to us for developing
* ANTLR. By "credit", we mean that if you use ANTLR or
* incorporate any source code into one of your programs
* (commercial product, research project, or otherwise) that
* you acknowledge this fact somewhere in the documentation,
* research report, etc... If you like ANTLR and have
* developed a nice tool with the output, please mention that
* you developed it using ANTLR. In addition, we ask that the
* headers remain intact in our source code. As long as these
* guidelines are kept, we expect to continue enhancing this
* system and expect to make other tools available as they are
* completed.
* <p>
* The ANTLR gang:
* @version ANTLR 2.6.0 MageLang Institute, 1999
* @author Terence Parr, <a href=http://www.MageLang.com>MageLang Institute</a>
* @author <br>John Lilley, <a href=http://www.Empathy.com>Empathy Software</a>
* @author <br><a href="mailto:pete@yamuna.demon.co.uk">Pete Wells</a>
*/
#include "Antlr/config.hpp"
#include "Antlr/TokenStream.hpp"
#include "Antlr/ScannerException.hpp"
#include "Antlr/InputBuffer.hpp"
#include "Antlr/BitSet.hpp"
#include "Antlr/LexerSharedInputState.hpp"
#include <cstdio>
#include <map>
class CharScanner;

/**
 * Ordering functor over std::string, parameterised by a scanner.
 *
 * CharScanner uses it as the comparator of its literals table
 * (std::map<std::string,int,CharScannerLiteralsLess>). The comparison
 * itself is defined out of line; it presumably consults the stored
 * scanner (e.g. for case handling of literals) -- confirm against the
 * implementation file.
 *
 * This class used to derive from
 * std::binary_function<std::string,std::string,bool>. That base only
 * supplied the three typedefs below; it was deprecated in C++11 and
 * removed in C++17, so the typedefs are now spelled out directly. This
 * keeps the functor "adaptable" for legacy code while compiling under
 * every language standard.
 */
class CharScannerLiteralsLess {
public:
	typedef std::string first_argument_type;
	typedef std::string second_argument_type;
	typedef bool result_type;
private:
	// Scanner this comparator is bound to; not owned by the functor.
	const CharScanner* scanner;
public:
#ifdef NO_TEMPLATE_PARTS
	CharScannerLiteralsLess(); // not really used
#endif
	/** Bind the comparator to theScanner. */
	CharScannerLiteralsLess(const CharScanner* theScanner);
	/** Ordering predicate over x and y (defined out of line). */
	bool operator() (const std::string& x,const std::string& y) const;
};
/**
 * Abstract base class for character scanners; a CharScanner is a
 * TokenStream.
 *
 * The class is abstract because getCaseSensitiveLiterals() is pure
 * virtual. All member functions are defined out of line, so the notes
 * below describe only what the declarations themselves establish.
 */
class CharScanner : public TokenStream {
private:
	// NO_STATIC_CONSTS selects an enum fallback for compilers that cannot
	// initialise static const members in-class (macro presumably comes
	// from Antlr/config.hpp -- confirm).
#ifndef NO_STATIC_CONSTS
	static const char NO_CHAR = 0;
#else
	enum {
		NO_CHAR = 0
	};
#endif
public:
	// End-of-input marker; same value as the C library's EOF (<cstdio>).
#ifndef NO_STATIC_CONSTS
	static const int EOF_CHAR = EOF;
#else
	enum {
		EOF_CHAR = EOF
	};
#endif
protected:
	std::string text; // text of current token
	bool saveConsumedInput; // does consume() save characters?
	// Pointer to a no-argument function that returns a new token.
	typedef RefToken (*factory_type)();
	factory_type tokenFactory; // what kind of tokens to create?
	bool caseSensitive;
	// Literal text -> int table, ordered by CharScannerLiteralsLess.
	std::map<std::string,int,CharScannerLiteralsLess> literals; // set by subclass
	RefToken _returnToken; // used to return tokens w/o using return val
	// Input chars
	LexerSharedInputState inputState;
	/** Used during filter mode to indicate that path is desired.
	 * A subsequent scan error will report an error as usual if
	 * commitToPath is true.
	 */
	bool commitToPath;
public:
	CharScanner();
	CharScanner(InputBuffer& cb);
	CharScanner(InputBuffer* cb);
	CharScanner(const LexerSharedInputState& state);
	virtual ~CharScanner();
	virtual void append(char c);
	virtual void append(const std::string& s);
	virtual void commit();
	virtual void consume();
	/** Consume chars until one matches the given char */
	virtual void consumeUntil(int c);
	/** Consume chars until one matches the given set */
	virtual void consumeUntil(const BitSet& set);
	virtual bool getCaseSensitive() const;
	/** Pure virtual: every concrete scanner must supply this. */
	virtual bool getCaseSensitiveLiterals() const=0;
	virtual bool getCommitToPath() const;
	virtual const std::string& getFilename() const;
	virtual InputBuffer& getInputBuffer();
	virtual LexerSharedInputState getInputState();
	virtual int getLine() const;
	// Returns the current text buffer by const reference (no copy is
	// made by the call itself); copy the result if it must outlive
	// later changes to the scanner's text.
	virtual const std::string& getText() const;
	virtual RefToken getTokenObject() const;
	virtual int LA(int i);
protected:
	virtual RefToken makeToken(int t);
public:
	virtual int mark();
	virtual void match(int c);
	virtual void match(const BitSet& b);
	virtual void match(const std::string& s);
	virtual void matchNot(int c);
	virtual void matchRange(int c1, int c2);
	virtual void newline();
	// Note: the panic() overloads are deliberately left non-virtual, as
	// in the original declaration.
	void panic();
	void panic(const std::string& s);
	/** Report exception errors caught in nextToken() */
	virtual void reportError(const ScannerException& e);
	/** Error-reporting function; can be overridden in subclass */
	virtual void reportError(const std::string& s);
	/** Warning-reporting function; can be overridden in subclass */
	virtual void reportWarning(const std::string& s);
	virtual void resetText();
	virtual void rewind(int pos);
	virtual void setCaseSensitive(bool t);
	virtual void setCommitToPath(bool commit);
	virtual void setFilename(const std::string& f);
	virtual void setLine(int l);
	virtual void setText(const std::string& s);
	virtual void setTokenObjectFactory(factory_type factory);
	// Test the token text against the literals table
	// Override this method to perform a different literals test
	virtual int testLiteralsTable(int ttype) const;
	// Override this method to get more specific case handling
	virtual int toLower(int c) const;
protected:
	/**
	 * Scope guard for rule tracing: the constructor calls
	 * traceIn(text) on the scanner and the destructor calls
	 * traceOut(text) with the same text.
	 *
	 * Copying is disabled: a copied guard would run its destructor too
	 * and emit a second traceOut for a single traceIn.
	 */
	class Tracer {
	private:
		CharScanner* scanner;
		std::string text;
		// Declared private and intentionally not defined (pre-C++11
		// way of making the type non-copyable).
		Tracer(const Tracer&);
		Tracer& operator=(const Tracer&);
	public:
		Tracer(CharScanner* p,const std::string& t)
		: scanner(p), text(t) { scanner->traceIn(text); }
		~Tracer()
		{ scanner->traceOut(text); }
	};
public:
	virtual void traceIn(const std::string& rname);
	virtual void traceOut(const std::string& rname);
protected:
	static const char* charName(int ch);
};
#endif //INC_CharScanner_hpp__
|