blob: 93da4ad0c5186dfc1598a1a01ea28e1d55ad8ebe [file] [log] [blame]
/*
* Copyright (C) 2009 Apple Inc. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#pragma once
#include "Identifier.h"
#include "JSCJSValue.h"
#include <array>
#include <wtf/text/StringBuilder.h>
#include <wtf/text/WTFString.h>
namespace JSC {
typedef enum { StrictJSON, NonStrictJSON, JSONP } ParserMode;
enum JSONPPathEntryType {
JSONPPathEntryTypeDeclareVar, // var pathEntryName = JSON
JSONPPathEntryTypeDot, // <prior entries>.pathEntryName = JSON
JSONPPathEntryTypeLookup, // <prior entries>[pathIndex] = JSON
JSONPPathEntryTypeCall // <prior entries>(JSON)
};
enum ParserState { StartParseObject, StartParseArray, StartParseExpression,
StartParseStatement, StartParseStatementEndStatement,
DoParseObjectStartExpression, DoParseObjectEndExpression,
DoParseArrayStartExpression, DoParseArrayEndExpression };
enum TokenType { TokLBracket, TokRBracket, TokLBrace, TokRBrace,
TokString, TokIdentifier, TokNumber, TokColon,
TokLParen, TokRParen, TokComma, TokTrue, TokFalse,
TokNull, TokEnd, TokDot, TokAssign, TokSemi, TokError };
struct JSONPPathEntry {
JSONPPathEntryType m_type;
Identifier m_pathEntryName;
int m_pathIndex;
};
struct JSONPData {
Vector<JSONPPathEntry> m_path;
Strong<Unknown> m_value;
};
template <typename CharType>
struct LiteralParserToken {
private:
WTF_MAKE_NONCOPYABLE(LiteralParserToken<CharType>);
public:
LiteralParserToken() = default;
TokenType type;
const CharType* start;
const CharType* end;
union {
double numberToken;
struct {
union {
const LChar* stringToken8;
const UChar* stringToken16;
};
unsigned stringIs8Bit : 1;
unsigned stringLength : 31;
};
};
};
template <typename CharType>
ALWAYS_INLINE void setParserTokenString(LiteralParserToken<CharType>&, const CharType* string);
template <typename CharType>
class LiteralParser {
public:
LiteralParser(JSGlobalObject* globalObject, const CharType* characters, unsigned length, ParserMode mode, CodeBlock* nullOrCodeBlock = nullptr)
: m_globalObject(globalObject)
, m_nullOrCodeBlock(nullOrCodeBlock)
, m_lexer(characters, length, mode)
, m_mode(mode)
{
}
String getErrorMessage()
{
if (!m_lexer.getErrorMessage().isEmpty())
return "JSON Parse error: " + m_lexer.getErrorMessage();
if (!m_parseErrorMessage.isEmpty())
return "JSON Parse error: " + m_parseErrorMessage;
return "JSON Parse error: Unable to parse JSON string"_s;
}
JSValue tryLiteralParse()
{
m_lexer.next();
JSValue result = parse(m_mode == StrictJSON ? StartParseExpression : StartParseStatement);
if (m_lexer.currentToken()->type == TokSemi)
m_lexer.next();
if (m_lexer.currentToken()->type != TokEnd)
return JSValue();
return result;
}
bool tryJSONPParse(Vector<JSONPData>&, bool needsFullSourceInfo);
private:
class Lexer {
public:
Lexer(const CharType* characters, unsigned length, ParserMode mode)
: m_mode(mode)
, m_ptr(characters)
, m_end(characters + length)
{
}
TokenType next();
#if ASSERT_DISABLED
typedef const LiteralParserToken<CharType>* LiteralParserTokenPtr;
LiteralParserTokenPtr currentToken()
{
return &m_currentToken;
}
#else
class LiteralParserTokenPtr;
friend class LiteralParserTokenPtr;
class LiteralParserTokenPtr {
public:
LiteralParserTokenPtr(Lexer& lexer)
: m_lexer(lexer)
, m_tokenID(lexer.m_currentTokenID)
{
}
ALWAYS_INLINE const LiteralParserToken<CharType>* operator->() const
{
ASSERT(m_tokenID == m_lexer.m_currentTokenID);
return &m_lexer.m_currentToken;
}
private:
Lexer& m_lexer;
unsigned m_tokenID;
};
LiteralParserTokenPtr currentToken()
{
return LiteralParserTokenPtr(*this);
}
#endif
String getErrorMessage() { return m_lexErrorMessage; }
private:
String m_lexErrorMessage;
TokenType lex(LiteralParserToken<CharType>&);
ALWAYS_INLINE TokenType lexIdentifier(LiteralParserToken<CharType>&);
ALWAYS_INLINE TokenType lexString(LiteralParserToken<CharType>&, CharType terminator);
TokenType lexStringSlow(LiteralParserToken<CharType>&, const CharType* runStart, CharType terminator);
ALWAYS_INLINE TokenType lexNumber(LiteralParserToken<CharType>&);
LiteralParserToken<CharType> m_currentToken;
ParserMode m_mode;
const CharType* m_ptr;
const CharType* m_end;
StringBuilder m_builder;
#if !ASSERT_DISABLED
unsigned m_currentTokenID { 0 };
#endif
};
class StackGuard;
JSValue parse(ParserState);
JSGlobalObject* m_globalObject;
CodeBlock* m_nullOrCodeBlock;
typename LiteralParser<CharType>::Lexer m_lexer;
ParserMode m_mode;
String m_parseErrorMessage;
static unsigned const MaximumCachableCharacter = 128;
std::array<Identifier, MaximumCachableCharacter> m_shortIdentifiers;
std::array<Identifier, MaximumCachableCharacter> m_recentIdentifiers;
ALWAYS_INLINE const Identifier makeIdentifier(const LChar* characters, size_t length);
ALWAYS_INLINE const Identifier makeIdentifier(const UChar* characters, size_t length);
};
} // namespace JSC