blob: 82442c9d68e833c1a40d07a93338a0747f7d93a6 [file] [log] [blame]
/*
* tokenizer.h - Copyright 2005 Maksim Orlovich <maksim@kde.org>
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef TOKENIZER_H
#define TOKENIZER_H
#include <q3dict.h>
#include <qstring.h>
#include "step.h"
#include "path.h"
#include "predicate.h"
#include "expression.h"
#include "util.h"
#include "xpath.h"
struct Token
{
int type;
QString value;
int intValue; //0 if not set
Token(int _type): type(_type), intValue(0) {}
Token(QString _value): type(ERROR+1), value(_value),intValue(0) {}
Token(int _type, QString _value): type(_type), value(_value) {}
Token(int _type, int _value): type(_type), intValue(_value) {}
};
/**
 * Lexer that turns a QString into a stream of Token objects.
 *
 * Instances cannot be created or copied by outside code: the default
 * constructor, copy constructor and assignment operator are all private.
 * Clients obtain the tokenizer through the static self() accessor.
 * TokenizerDeleter is a friend and therefore has access to the private
 * members, including the static ones.
 */
class Tokenizer
{
    friend class TokenizerDeleter;

public:
    // Access point for the tokenizer object.
    // NOTE(review): presumably returns the object behind s_instance --
    // confirm against the implementation file.
    static Tokenizer &self();

    // Re-targets the tokenizer at a new string.
    // NOTE(review): presumably also rewinds m_nextPos -- confirm.
    void reset(QString);

    // Produces the next token.
    Token nextToken();

private:
    // Classification of a character with respect to names.
    enum XMLCat {
        NameStart,
        NameCont,
        NotPartOfName
    };

    // Construction is private; copying is declared private as well and
    // marked "disabled" by the original author.
    Tokenizer();
    Tokenizer(const Tokenizer &rhs);            // disabled
    Tokenizer &operator=(const Tokenizer &rhs); // disabled

    // --- character / name classification ---
    XMLCat charCat(QChar aChar);
    bool isAxisName(QString name, Step::AxisType *type = 0);
    bool isNodeTypeName(QString name);
    bool isOperatorContext();

    // --- cursor handling and token construction ---
    void skipWS();
    Token makeTokenAndAdvance(int code, int advance = 1);
    Token makeIntTokenAndAdvance(int code, int val, int advance = 1);
    char peekAheadHelper();
    char peekCurHelper();

    // --- per-category lexing routines ---
    Token lexString();
    Token lexNumber();
    Token lexNCName();
    Token lexQName();
    Token nextTokenInternal();

    // --- per-instance state (declaration order kept as in the original) ---
    unsigned int m_nextPos;
    QString m_data;
    int m_lastTokenType;

    // --- state shared by the class ---
    static Q3Dict<Step::AxisType>* s_axisNamesDict;
    static Q3Dict<char>* s_nodeTypeNamesDict;
    static Tokenizer* s_instance;
};
// Interface to the parser
// NOTE(review): the xpathyy prefix suggests these are the lexer and error
// hooks of a yacc/bison-generated parser -- confirm against the grammar file.

// Lexer entry point; returns an int (presumably the code of the next
// token -- confirm against the implementation).
int xpathyylex();

// Error hook taking a C-string message; what is done with the message is
// decided by the implementation, which is not visible in this header.
void xpathyyerror(const char *str);

// Prepares tokenizing of the given string.
// NOTE(review): presumably forwards to Tokenizer::self().reset() -- confirm.
void initTokenizer(QString string);
#endif
// kate: indent-width 4; replace-tabs off; tab-width 4; indent-spaces: off;